diff --git "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" --- "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" +++ "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 2.3435, "train/learning_rate": 9.412844036697248e-06, "train/epoch": 2.16, "train/global_step": 3500, "_runtime": 50252, "_timestamp": 1651822520, "_step": 3506, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 30.0, 298.0, 580.0, 108.0, 4.0], "bins": [-7.3556365966796875, -7.2355170249938965, -7.115396976470947, -6.995277404785156, -6.875157356262207, -6.755037784576416, -6.634918212890625, -6.514798164367676, -6.394678592681885, -6.274559020996094, -6.1544389724731445, -6.0343194007873535, -5.914199352264404, -5.794079780578613, -5.673960208892822, -5.553840160369873, -5.433720588684082, -5.313601016998291, -5.193480968475342, -5.073361396789551, -4.953241348266602, -4.8331217765808105, -4.7130022048950195, -4.59288215637207, -4.472762584686279, -4.352643013000488, -4.232522964477539, -4.112403392791748, -3.992283582687378, -3.872163772583008, -3.7520439624786377, -3.6319241523742676, -3.5118045806884766, -3.3916847705841064, -3.2715649604797363, -3.1514453887939453, -3.031325578689575, -2.911205768585205, -2.791085958480835, -2.670966148376465, -2.5508463382720947, -2.4307265281677246, -2.3106067180633545, -2.1904871463775635, -2.0703673362731934, -1.9502475261688232, -1.8301277160644531, -1.7100080251693726, -1.589888334274292, -1.4697685241699219, -1.3496488332748413, -1.2295290231704712, -1.1094093322753906, -0.9892895221710205, -0.8691697716712952, -0.7490500211715698, -0.6289303302764893, -0.5088105797767639, -0.3886908292770386, -0.26857104897499084, -0.1484512984752655, -0.028331518173217773, 0.09178823232650757, 0.2119079828262329, 0.33202776312828064]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 10.0, 16.0, 23.0, 16.0, 23.0, 25.0, 29.0, 27.0, 28.0, 23.0, 28.0, 36.0, 34.0, 25.0, 34.0, 25.0, 38.0, 45.0, 41.0, 30.0, 36.0, 39.0, 40.0, 31.0, 29.0, 26.0, 25.0, 32.0, 22.0, 20.0, 17.0, 12.0, 12.0, 15.0, 11.0, 9.0, 4.0, 4.0, 5.0, 3.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4490542411804199, -0.4343337416648865, -0.4196132719516754, -0.40489277243614197, -0.3901722729206085, -0.37545180320739746, -0.360731303691864, -0.34601080417633057, -0.3312903046607971, -0.31656980514526367, -0.3018493354320526, -0.28712883591651917, -0.2724083364009857, -0.25768786668777466, -0.2429673671722412, -0.22824686765670776, -0.2135263830423355, -0.19880589842796326, -0.1840853989124298, -0.16936491429805756, -0.1546444147825241, -0.13992393016815186, -0.1252034306526184, -0.11048294603824615, -0.0957624539732933, -0.08104196190834045, -0.0663214698433876, -0.05160098150372505, -0.0368804894387722, -0.02216000109910965, -0.007439509034156799, 0.007280983030796051, 0.0220014750957489, 0.03672196716070175, 0.0514424592256546, 0.06616294384002686, 0.0808834433555603, 0.09560392796993256, 0.1103244200348854, 0.12504491209983826, 0.1397654116153717, 0.15448589622974396, 0.1692063957452774, 0.18392688035964966, 0.1986473798751831, 0.21336786448955536, 0.2280883491039276, 0.24280884861946106, 0.2575293183326721, 0.27224981784820557, 0.2869702875614166, 0.3016907870769501, 0.3164112865924835, 0.3311317563056946, 0.345852255821228, 0.3605727553367615, 0.3752932548522949, 0.39001375436782837, 0.40473422408103943, 0.4194547235965729, 0.4341752231121063, 0.4488956928253174, 0.46361619234085083, 0.4783366918563843, 0.4930571913719177]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 12.0, 17.0, 33.0, 23.0, 43.0, 69.0, 123.0, 140.0, 224.0, 312.0, 516.0, 898.0, 1677.0, 3361.0, 8169.0, 25346.0, 94675.0, 323303.0, 844062.0, 1446812.0, 921302.0, 360404.0, 112668.0, 32015.0, 9947.0, 3856.0, 1718.0, 959.0, 535.0, 346.0, 223.0, 141.0, 107.0, 58.0, 54.0, 37.0, 23.0, 14.0, 11.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.8955078125, -0.8710098266601562, -0.8465118408203125, -0.8220138549804688, -0.797515869140625, -0.7730178833007812, -0.7485198974609375, -0.7240219116210938, -0.69952392578125, -0.6750259399414062, -0.6505279541015625, -0.6260299682617188, -0.601531982421875, -0.5770339965820312, -0.5525360107421875, -0.5280380249023438, -0.5035400390625, -0.47904205322265625, -0.4545440673828125, -0.43004608154296875, -0.405548095703125, -0.38105010986328125, -0.3565521240234375, -0.33205413818359375, -0.30755615234375, -0.28305816650390625, -0.2585601806640625, -0.23406219482421875, -0.209564208984375, -0.18506622314453125, -0.1605682373046875, -0.13607025146484375, -0.111572265625, -0.08707427978515625, -0.0625762939453125, -0.03807830810546875, -0.013580322265625, 0.01091766357421875, 0.0354156494140625, 0.05991363525390625, 0.08441162109375, 0.10890960693359375, 0.1334075927734375, 0.15790557861328125, 0.182403564453125, 0.20690155029296875, 0.2313995361328125, 0.25589752197265625, 0.2803955078125, 0.30489349365234375, 0.3293914794921875, 0.35388946533203125, 0.378387451171875, 0.40288543701171875, 0.4273834228515625, 0.45188140869140625, 0.47637939453125, 0.5008773803710938, 0.5253753662109375, 0.5498733520507812, 0.574371337890625, 0.5988693237304688, 0.6233673095703125, 0.6478652954101562, 0.67236328125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 17.0, 12.0, 13.0, 15.0, 21.0, 21.0, 22.0, 13.0, 25.0, 29.0, 23.0, 31.0, 29.0, 41.0, 37.0, 46.0, 38.0, 43.0, 50.0, 35.0, 39.0, 41.0, 26.0, 29.0, 34.0, 22.0, 28.0, 29.0, 26.0, 26.0, 12.0, 19.0, 15.0, 6.0, 10.0, 12.0, 5.0, 15.0, 4.0, 2.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.7109375, -0.6892776489257812, -0.6676177978515625, -0.6459579467773438, -0.624298095703125, -0.6026382446289062, -0.5809783935546875, -0.5593185424804688, -0.53765869140625, -0.5159988403320312, -0.4943389892578125, -0.47267913818359375, -0.451019287109375, -0.42935943603515625, -0.4076995849609375, -0.38603973388671875, -0.3643798828125, -0.34272003173828125, -0.3210601806640625, -0.29940032958984375, -0.277740478515625, -0.25608062744140625, -0.2344207763671875, -0.21276092529296875, -0.19110107421875, -0.16944122314453125, -0.1477813720703125, -0.12612152099609375, -0.104461669921875, -0.08280181884765625, -0.0611419677734375, -0.03948211669921875, -0.017822265625, 0.00383758544921875, 0.0254974365234375, 0.04715728759765625, 0.068817138671875, 0.09047698974609375, 0.1121368408203125, 0.13379669189453125, 0.15545654296875, 0.17711639404296875, 0.1987762451171875, 0.22043609619140625, 0.242095947265625, 0.26375579833984375, 0.2854156494140625, 0.30707550048828125, 0.3287353515625, 0.35039520263671875, 0.3720550537109375, 0.39371490478515625, 0.415374755859375, 0.43703460693359375, 0.4586944580078125, 0.48035430908203125, 0.50201416015625, 0.5236740112304688, 0.5453338623046875, 0.5669937133789062, 0.588653564453125, 0.6103134155273438, 0.6319732666015625, 0.6536331176757812, 0.67529296875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 3.0, 12.0, 15.0, 26.0, 32.0, 52.0, 77.0, 134.0, 237.0, 525.0, 1847.0, 4184659.0, 5520.0, 552.0, 238.0, 117.0, 88.0, 48.0, 23.0, 21.0, 12.0, 6.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.7532958984375, -7.358154296875, -6.9630126953125, -6.56787109375, -6.1727294921875, -5.777587890625, -5.3824462890625, -4.9873046875, -4.5921630859375, -4.197021484375, -3.8018798828125, -3.40673828125, -3.0115966796875, -2.616455078125, -2.2213134765625, -1.826171875, -1.4310302734375, -1.035888671875, -0.6407470703125, -0.24560546875, 0.1495361328125, 0.544677734375, 0.9398193359375, 1.3349609375, 1.7301025390625, 2.125244140625, 2.5203857421875, 2.91552734375, 3.3106689453125, 3.705810546875, 4.1009521484375, 4.49609375, 4.8912353515625, 5.286376953125, 5.6815185546875, 6.07666015625, 6.4718017578125, 6.866943359375, 7.2620849609375, 7.6572265625, 8.0523681640625, 8.447509765625, 8.8426513671875, 9.23779296875, 9.6329345703125, 10.028076171875, 10.4232177734375, 10.818359375, 11.2135009765625, 11.608642578125, 12.0037841796875, 12.39892578125, 12.7940673828125, 13.189208984375, 13.5843505859375, 13.9794921875, 14.3746337890625, 14.769775390625, 15.1649169921875, 15.56005859375, 15.9552001953125, 16.350341796875, 16.7454833984375, 17.140625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 15.0, 14.0, 19.0, 35.0, 30.0, 68.0, 95.0, 117.0, 206.0, 351.0, 551.0, 774.0, 666.0, 441.0, 230.0, 142.0, 100.0, 69.0, 36.0, 33.0, 13.0, 13.0, 11.0, 11.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312255859375, -0.2996559143066406, -0.28705596923828125, -0.2744560241699219, -0.2618560791015625, -0.24925613403320312, -0.23665618896484375, -0.22405624389648438, -0.211456298828125, -0.19885635375976562, -0.18625640869140625, -0.17365646362304688, -0.1610565185546875, -0.14845657348632812, -0.13585662841796875, -0.12325668334960938, -0.11065673828125, -0.09805679321289062, -0.08545684814453125, -0.07285690307617188, -0.0602569580078125, -0.047657012939453125, -0.03505706787109375, -0.022457122802734375, -0.009857177734375, 0.002742767333984375, 0.01534271240234375, 0.027942657470703125, 0.0405426025390625, 0.053142547607421875, 0.06574249267578125, 0.07834243774414062, 0.0909423828125, 0.10354232788085938, 0.11614227294921875, 0.12874221801757812, 0.1413421630859375, 0.15394210815429688, 0.16654205322265625, 0.17914199829101562, 0.191741943359375, 0.20434188842773438, 0.21694183349609375, 0.22954177856445312, 0.2421417236328125, 0.2547416687011719, 0.26734161376953125, 0.2799415588378906, 0.29254150390625, 0.3051414489746094, 0.31774139404296875, 0.3303413391113281, 0.3429412841796875, 0.3555412292480469, 0.36814117431640625, 0.3807411193847656, 0.393341064453125, 0.4059410095214844, 0.41854095458984375, 0.4311408996582031, 0.4437408447265625, 0.4563407897949219, 0.46894073486328125, 0.4815406799316406, 0.494140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 19.0, 22.0, 14.0, 17.0, 32.0, 44.0, 44.0, 56.0, 77.0, 64.0, 67.0, 75.0, 79.0, 74.0, 63.0, 47.0, 54.0, 30.0, 17.0, 20.0, 23.0, 10.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9310712218284607, -0.8977305889129639, -0.8643900156021118, -0.831049382686615, -0.7977087497711182, -0.7643681764602661, -0.7310275435447693, -0.6976869106292725, -0.6643463373184204, -0.6310057044029236, -0.5976651310920715, -0.5643244981765747, -0.5309838652610779, -0.49764326214790344, -0.464302659034729, -0.4309620261192322, -0.39762139320373535, -0.3642807900905609, -0.3309401571750641, -0.29759955406188965, -0.2642589211463928, -0.23091831803321838, -0.19757771492004395, -0.1642370969057083, -0.13089647889137268, -0.09755586087703705, -0.06421525031328201, -0.030874639749526978, 0.002465978264808655, 0.03580659627914429, 0.06914719939231873, 0.10248781740665436, 0.13582849502563477, 0.1691691130399704, 0.20250973105430603, 0.23585033416748047, 0.2691909670829773, 0.30253157019615173, 0.33587217330932617, 0.369212806224823, 0.40255340933799744, 0.4358940124511719, 0.4692346453666687, 0.5025752782821655, 0.5359158515930176, 0.5692564845085144, 0.6025971174240112, 0.6359376907348633, 0.6692783236503601, 0.7026189565658569, 0.735959529876709, 0.7693001627922058, 0.8026407957077026, 0.8359813690185547, 0.8693220019340515, 0.9026626348495483, 0.9360032081604004, 0.9693438410758972, 1.002684473991394, 1.036025047302246, 1.0693656206130981, 1.1027063131332397, 1.1360468864440918, 1.1693874597549438, 1.2027281522750854]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 9.0, 7.0, 12.0, 8.0, 9.0, 17.0, 21.0, 25.0, 24.0, 21.0, 21.0, 27.0, 27.0, 25.0, 33.0, 39.0, 36.0, 40.0, 44.0, 44.0, 38.0, 51.0, 42.0, 33.0, 35.0, 35.0, 32.0, 28.0, 26.0, 22.0, 24.0, 28.0, 20.0, 14.0, 12.0, 12.0, 11.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.7759767770767212, -0.7530622482299805, -0.7301477193832397, -0.707233190536499, -0.6843186616897583, -0.6614041328430176, -0.6384896039962769, -0.6155750751495361, -0.5926605463027954, -0.5697460174560547, -0.546831488609314, -0.5239169597625732, -0.5010024309158325, -0.4780879020690918, -0.4551733434200287, -0.43225881457328796, -0.40934425592422485, -0.38642972707748413, -0.3635151982307434, -0.3406006693840027, -0.31768614053726196, -0.29477161169052124, -0.27185705304145813, -0.2489425241947174, -0.22602799534797668, -0.20311346650123596, -0.18019893765449524, -0.15728439390659332, -0.1343698650598526, -0.11145533621311188, -0.08854079246520996, -0.06562626361846924, -0.04271179437637329, -0.01979726180434227, 0.0031172707676887512, 0.02603180706501007, 0.04894633591175079, 0.07186086475849152, 0.09477540850639343, 0.11768993735313416, 0.14060446619987488, 0.1635189950466156, 0.18643352389335632, 0.20934806764125824, 0.23226259648799896, 0.2551771402359009, 0.2780916690826416, 0.3010061979293823, 0.32392072677612305, 0.34683525562286377, 0.3697497844696045, 0.3926643133163452, 0.41557884216308594, 0.43849337100982666, 0.46140792965888977, 0.4843224585056305, 0.5072369575500488, 0.5301514863967896, 0.5530660152435303, 0.575980544090271, 0.5988950729370117, 0.6218096017837524, 0.6447241306304932, 0.6676386594772339, 0.6905532479286194]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 9.0, 11.0, 17.0, 36.0, 49.0, 64.0, 92.0, 164.0, 249.0, 416.0, 662.0, 945.0, 1705.0, 3049.0, 5622.0, 10958.0, 21575.0, 43460.0, 93191.0, 199033.0, 294202.0, 195155.0, 90552.0, 42797.0, 20854.0, 10663.0, 5601.0, 2978.0, 1722.0, 950.0, 611.0, 437.0, 265.0, 166.0, 84.0, 66.0, 49.0, 34.0, 28.0, 15.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.31005859375, -0.302001953125, -0.2939453125, -0.285888671875, -0.27783203125, -0.269775390625, -0.26171875, -0.253662109375, -0.24560546875, -0.237548828125, -0.2294921875, -0.221435546875, -0.21337890625, -0.205322265625, -0.197265625, -0.189208984375, -0.18115234375, -0.173095703125, -0.1650390625, -0.156982421875, -0.14892578125, -0.140869140625, -0.1328125, -0.124755859375, -0.11669921875, -0.108642578125, -0.1005859375, -0.092529296875, -0.08447265625, -0.076416015625, -0.068359375, -0.060302734375, -0.05224609375, -0.044189453125, -0.0361328125, -0.028076171875, -0.02001953125, -0.011962890625, -0.00390625, 0.004150390625, 0.01220703125, 0.020263671875, 0.0283203125, 0.036376953125, 0.04443359375, 0.052490234375, 0.060546875, 0.068603515625, 0.07666015625, 0.084716796875, 0.0927734375, 0.100830078125, 0.10888671875, 0.116943359375, 0.125, 0.133056640625, 0.14111328125, 0.149169921875, 0.1572265625, 0.165283203125, 0.17333984375, 0.181396484375, 0.189453125, 0.197509765625, 0.20556640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 7.0, 11.0, 7.0, 11.0, 13.0, 15.0, 11.0, 19.0, 25.0, 23.0, 17.0, 32.0, 24.0, 45.0, 39.0, 42.0, 38.0, 44.0, 36.0, 40.0, 42.0, 38.0, 55.0, 35.0, 39.0, 38.0, 27.0, 31.0, 24.0, 26.0, 16.0, 21.0, 20.0, 13.0, 12.0, 11.0, 5.0, 9.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5270614624023438, -0.5092010498046875, -0.49134063720703125, -0.473480224609375, -0.45561981201171875, -0.4377593994140625, -0.41989898681640625, -0.40203857421875, -0.38417816162109375, -0.3663177490234375, -0.34845733642578125, -0.330596923828125, -0.31273651123046875, -0.2948760986328125, -0.27701568603515625, -0.2591552734375, -0.24129486083984375, -0.2234344482421875, -0.20557403564453125, -0.187713623046875, -0.16985321044921875, -0.1519927978515625, -0.13413238525390625, -0.11627197265625, -0.09841156005859375, -0.0805511474609375, -0.06269073486328125, -0.044830322265625, -0.02696990966796875, -0.0091094970703125, 0.00875091552734375, 0.026611328125, 0.04447174072265625, 0.0623321533203125, 0.08019256591796875, 0.098052978515625, 0.11591339111328125, 0.1337738037109375, 0.15163421630859375, 0.16949462890625, 0.18735504150390625, 0.2052154541015625, 0.22307586669921875, 0.240936279296875, 0.25879669189453125, 0.2766571044921875, 0.29451751708984375, 0.3123779296875, 0.33023834228515625, 0.3480987548828125, 0.36595916748046875, 0.383819580078125, 0.40167999267578125, 0.4195404052734375, 0.43740081787109375, 0.45526123046875, 0.47312164306640625, 0.4909820556640625, 0.5088424682617188, 0.526702880859375, 0.5445632934570312, 0.5624237060546875, 0.5802841186523438, 0.59814453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 15.0, 15.0, 24.0, 30.0, 49.0, 48.0, 77.0, 139.0, 247.0, 371.0, 743.0, 1455.0, 3019.0, 7156.0, 18270.0, 54243.0, 189400.0, 443614.0, 227684.0, 65032.0, 21614.0, 8236.0, 3472.0, 1675.0, 798.0, 411.0, 250.0, 146.0, 111.0, 48.0, 43.0, 26.0, 26.0, 11.0, 10.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.4580078125, -0.4447593688964844, -0.43151092529296875, -0.4182624816894531, -0.4050140380859375, -0.3917655944824219, -0.37851715087890625, -0.3652687072753906, -0.352020263671875, -0.3387718200683594, -0.32552337646484375, -0.3122749328613281, -0.2990264892578125, -0.2857780456542969, -0.27252960205078125, -0.2592811584472656, -0.24603271484375, -0.23278427124023438, -0.21953582763671875, -0.20628738403320312, -0.1930389404296875, -0.17979049682617188, -0.16654205322265625, -0.15329360961914062, -0.140045166015625, -0.12679672241210938, -0.11354827880859375, -0.10029983520507812, -0.0870513916015625, -0.07380294799804688, -0.06055450439453125, -0.047306060791015625, -0.0340576171875, -0.020809173583984375, -0.00756072998046875, 0.005687713623046875, 0.0189361572265625, 0.032184600830078125, 0.04543304443359375, 0.058681488037109375, 0.071929931640625, 0.08517837524414062, 0.09842681884765625, 0.11167526245117188, 0.1249237060546875, 0.13817214965820312, 0.15142059326171875, 0.16466903686523438, 0.17791748046875, 0.19116592407226562, 0.20441436767578125, 0.21766281127929688, 0.2309112548828125, 0.24415969848632812, 0.25740814208984375, 0.2706565856933594, 0.283905029296875, 0.2971534729003906, 0.31040191650390625, 0.3236503601074219, 0.3368988037109375, 0.3501472473144531, 0.36339569091796875, 0.3766441345214844, 0.389892578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 3.0, 6.0, 5.0, 11.0, 13.0, 13.0, 12.0, 16.0, 18.0, 26.0, 23.0, 20.0, 31.0, 44.0, 32.0, 38.0, 48.0, 41.0, 44.0, 41.0, 41.0, 51.0, 48.0, 45.0, 45.0, 27.0, 30.0, 37.0, 25.0, 32.0, 25.0, 12.0, 9.0, 6.0, 14.0, 18.0, 15.0, 16.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1128997802734375, -1.074432373046875, -1.0359649658203125, -0.99749755859375, -0.9590301513671875, -0.920562744140625, -0.8820953369140625, -0.8436279296875, -0.8051605224609375, -0.766693115234375, -0.7282257080078125, -0.68975830078125, -0.6512908935546875, -0.612823486328125, -0.5743560791015625, -0.535888671875, -0.4974212646484375, -0.458953857421875, -0.4204864501953125, -0.38201904296875, -0.3435516357421875, -0.305084228515625, -0.2666168212890625, -0.2281494140625, -0.1896820068359375, -0.151214599609375, -0.1127471923828125, -0.07427978515625, -0.0358123779296875, 0.002655029296875, 0.0411224365234375, 0.07958984375, 0.1180572509765625, 0.156524658203125, 0.1949920654296875, 0.23345947265625, 0.2719268798828125, 0.310394287109375, 0.3488616943359375, 0.3873291015625, 0.4257965087890625, 0.464263916015625, 0.5027313232421875, 0.54119873046875, 0.5796661376953125, 0.618133544921875, 0.6566009521484375, 0.695068359375, 0.7335357666015625, 0.772003173828125, 0.8104705810546875, 0.84893798828125, 0.8874053955078125, 0.925872802734375, 0.9643402099609375, 1.0028076171875, 1.0412750244140625, 1.079742431640625, 1.1182098388671875, 1.15667724609375, 1.1951446533203125, 1.233612060546875, 1.2720794677734375, 1.310546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 16.0, 16.0, 26.0, 26.0, 53.0, 68.0, 108.0, 187.0, 278.0, 507.0, 774.0, 1396.0, 2621.0, 5424.0, 12151.0, 36466.0, 225238.0, 624613.0, 98398.0, 22430.0, 8517.0, 4154.0, 2107.0, 1185.0, 636.0, 394.0, 221.0, 190.0, 101.0, 73.0, 47.0, 36.0, 30.0, 12.0, 11.0, 6.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.240478515625, -0.23366737365722656, -0.22685623168945312, -0.2200450897216797, -0.21323394775390625, -0.2064228057861328, -0.19961166381835938, -0.19280052185058594, -0.1859893798828125, -0.17917823791503906, -0.17236709594726562, -0.1655559539794922, -0.15874481201171875, -0.1519336700439453, -0.14512252807617188, -0.13831138610839844, -0.131500244140625, -0.12468910217285156, -0.11787796020507812, -0.11106681823730469, -0.10425567626953125, -0.09744453430175781, -0.09063339233398438, -0.08382225036621094, -0.0770111083984375, -0.07019996643066406, -0.06338882446289062, -0.05657768249511719, -0.04976654052734375, -0.04295539855957031, -0.036144256591796875, -0.029333114624023438, -0.02252197265625, -0.015710830688476562, -0.008899688720703125, -0.0020885467529296875, 0.00472259521484375, 0.011533737182617188, 0.018344879150390625, 0.025156021118164062, 0.0319671630859375, 0.03877830505371094, 0.045589447021484375, 0.05240058898925781, 0.05921173095703125, 0.06602287292480469, 0.07283401489257812, 0.07964515686035156, 0.086456298828125, 0.09326744079589844, 0.10007858276367188, 0.10688972473144531, 0.11370086669921875, 0.12051200866699219, 0.12732315063476562, 0.13413429260253906, 0.1409454345703125, 0.14775657653808594, 0.15456771850585938, 0.1613788604736328, 0.16819000244140625, 0.1750011444091797, 0.18181228637695312, 0.18862342834472656, 0.1954345703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 4.0, 6.0, 5.0, 15.0, 18.0, 25.0, 71.0, 125.0, 213.0, 222.0, 144.0, 52.0, 31.0, 24.0, 10.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.226799011230469e-05, -8.741766214370728e-05, -8.256733417510986e-05, -7.771700620651245e-05, -7.286667823791504e-05, -6.801635026931763e-05, -6.316602230072021e-05, -5.83156943321228e-05, -5.346536636352539e-05, -4.861503839492798e-05, -4.3764710426330566e-05, -3.8914382457733154e-05, -3.406405448913574e-05, -2.921372652053833e-05, -2.4363398551940918e-05, -1.9513070583343506e-05, -1.4662742614746094e-05, -9.812414646148682e-06, -4.9620866775512695e-06, -1.1175870895385742e-07, 4.738569259643555e-06, 9.588897228240967e-06, 1.4439225196838379e-05, 1.928955316543579e-05, 2.4139881134033203e-05, 2.8990209102630615e-05, 3.384053707122803e-05, 3.869086503982544e-05, 4.354119300842285e-05, 4.8391520977020264e-05, 5.3241848945617676e-05, 5.809217691421509e-05, 6.29425048828125e-05, 6.779283285140991e-05, 7.264316082000732e-05, 7.749348878860474e-05, 8.234381675720215e-05, 8.719414472579956e-05, 9.204447269439697e-05, 9.689480066299438e-05, 0.0001017451286315918, 0.00010659545660018921, 0.00011144578456878662, 0.00011629611253738403, 0.00012114644050598145, 0.00012599676847457886, 0.00013084709644317627, 0.00013569742441177368, 0.0001405477523803711, 0.0001453980803489685, 0.00015024840831756592, 0.00015509873628616333, 0.00015994906425476074, 0.00016479939222335815, 0.00016964972019195557, 0.00017450004816055298, 0.0001793503761291504, 0.0001842007040977478, 0.00018905103206634521, 0.00019390136003494263, 0.00019875168800354004, 0.00020360201597213745, 0.00020845234394073486, 0.00021330267190933228, 0.0002181529998779297]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 7.0, 13.0, 12.0, 13.0, 10.0, 38.0, 43.0, 73.0, 135.0, 427.0, 2268.0, 17439.0, 726673.0, 289170.0, 10070.0, 1508.0, 300.0, 123.0, 65.0, 43.0, 23.0, 23.0, 10.0, 11.0, 7.0, 8.0, 9.0, 2.0, 2.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56640625, -0.5496902465820312, -0.5329742431640625, -0.5162582397460938, -0.499542236328125, -0.48282623291015625, -0.4661102294921875, -0.44939422607421875, -0.43267822265625, -0.41596221923828125, -0.3992462158203125, -0.38253021240234375, -0.365814208984375, -0.34909820556640625, -0.3323822021484375, -0.31566619873046875, -0.2989501953125, -0.28223419189453125, -0.2655181884765625, -0.24880218505859375, -0.232086181640625, -0.21537017822265625, -0.1986541748046875, -0.18193817138671875, -0.16522216796875, -0.14850616455078125, -0.1317901611328125, -0.11507415771484375, -0.098358154296875, -0.08164215087890625, -0.0649261474609375, -0.04821014404296875, -0.031494140625, -0.01477813720703125, 0.0019378662109375, 0.01865386962890625, 0.035369873046875, 0.05208587646484375, 0.0688018798828125, 0.08551788330078125, 0.10223388671875, 0.11894989013671875, 0.1356658935546875, 0.15238189697265625, 0.169097900390625, 0.18581390380859375, 0.2025299072265625, 0.21924591064453125, 0.2359619140625, 0.25267791748046875, 0.2693939208984375, 0.28610992431640625, 0.302825927734375, 0.31954193115234375, 0.3362579345703125, 0.35297393798828125, 0.36968994140625, 0.38640594482421875, 0.4031219482421875, 0.41983795166015625, 0.436553955078125, 0.45326995849609375, 0.4699859619140625, 0.48670196533203125, 0.50341796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 2.0, 9.0, 10.0, 10.0, 16.0, 31.0, 30.0, 48.0, 63.0, 83.0, 111.0, 107.0, 97.0, 91.0, 73.0, 50.0, 37.0, 32.0, 23.0, 11.0, 9.0, 12.0, 5.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.059814453125, -0.058083534240722656, -0.05635261535644531, -0.05462169647216797, -0.052890777587890625, -0.05115985870361328, -0.04942893981933594, -0.047698020935058594, -0.04596710205078125, -0.044236183166503906, -0.04250526428222656, -0.04077434539794922, -0.039043426513671875, -0.03731250762939453, -0.03558158874511719, -0.033850669860839844, -0.0321197509765625, -0.030388832092285156, -0.028657913208007812, -0.02692699432373047, -0.025196075439453125, -0.02346515655517578, -0.021734237670898438, -0.020003318786621094, -0.01827239990234375, -0.016541481018066406, -0.014810562133789062, -0.013079643249511719, -0.011348724365234375, -0.009617805480957031, -0.007886886596679688, -0.006155967712402344, -0.004425048828125, -0.0026941299438476562, -0.0009632110595703125, 0.0007677078247070312, 0.002498626708984375, 0.004229545593261719, 0.0059604644775390625, 0.007691383361816406, 0.00942230224609375, 0.011153221130371094, 0.012884140014648438, 0.014615058898925781, 0.016345977783203125, 0.01807689666748047, 0.019807815551757812, 0.021538734436035156, 0.0232696533203125, 0.025000572204589844, 0.026731491088867188, 0.02846240997314453, 0.030193328857421875, 0.03192424774169922, 0.03365516662597656, 0.035386085510253906, 0.03711700439453125, 0.038847923278808594, 0.04057884216308594, 0.04230976104736328, 0.044040679931640625, 0.04577159881591797, 0.04750251770019531, 0.049233436584472656, 0.05096435546875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 22.0, 62.0, 169.0, 275.0, 257.0, 140.0, 50.0, 21.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77331805229187, -2.680614948272705, -2.587911605834961, -2.495208501815796, -2.402505397796631, -2.309802293777466, -2.217099189758301, -2.1243958473205566, -2.0316927433013916, -1.9389896392822266, -1.846286416053772, -1.7535831928253174, -1.6608800888061523, -1.5681769847869873, -1.4754737615585327, -1.3827705383300781, -1.290067434310913, -1.197364330291748, -1.1046611070632935, -1.0119578838348389, -0.9192547798156738, -0.826551616191864, -0.7338484525680542, -0.6411452889442444, -0.5484421253204346, -0.45573896169662476, -0.36303579807281494, -0.2703326344490051, -0.1776294708251953, -0.0849263072013855, 0.007776856422424316, 0.10048002004623413, 0.19318294525146484, 0.28588610887527466, 0.3785892724990845, 0.4712924361228943, 0.5639955997467041, 0.6566987633705139, 0.7494019269943237, 0.8421050906181335, 0.9348082542419434, 1.0275113582611084, 1.120214581489563, 1.2129178047180176, 1.3056209087371826, 1.3983240127563477, 1.4910272359848022, 1.5837304592132568, 1.6764335632324219, 1.769136667251587, 1.8618398904800415, 1.954543113708496, 2.047246217727661, 2.139949321746826, 2.2326526641845703, 2.3253557682037354, 2.4180588722229004, 2.5107619762420654, 2.6034650802612305, 2.6961684226989746, 2.7888715267181396, 2.8815746307373047, 2.974277973175049, 3.066981077194214, 3.159684181213379]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 11.0, 6.0, 9.0, 6.0, 14.0, 12.0, 15.0, 13.0, 19.0, 19.0, 27.0, 24.0, 39.0, 25.0, 26.0, 41.0, 38.0, 37.0, 35.0, 43.0, 49.0, 48.0, 46.0, 40.0, 35.0, 36.0, 33.0, 29.0, 36.0, 25.0, 24.0, 21.0, 26.0, 11.0, 12.0, 13.0, 10.0, 4.0, 10.0, 9.0, 3.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5374580025672913, -0.5204207301139832, -0.503383457660675, -0.48634618520736694, -0.46930891275405884, -0.45227164030075073, -0.43523433804512024, -0.41819706559181213, -0.40115979313850403, -0.3841225206851959, -0.3670852482318878, -0.3500479757785797, -0.3330106735229492, -0.3159734010696411, -0.298936128616333, -0.2818988561630249, -0.2648615837097168, -0.2478243112564087, -0.23078703880310059, -0.2137497514486313, -0.19671247899532318, -0.17967520654201508, -0.16263791918754578, -0.14560064673423767, -0.12856337428092957, -0.11152610182762146, -0.09448882192373276, -0.07745154201984406, -0.06041426956653595, -0.043376997113227844, -0.026339717209339142, -0.00930243730545044, 0.007734894752502441, 0.024772170931100845, 0.04180944710969925, 0.05884672328829765, 0.07588399946689606, 0.09292127192020416, 0.10995855182409286, 0.12699583172798157, 0.14403310418128967, 0.16107037663459778, 0.17810764908790588, 0.19514493644237518, 0.2121822088956833, 0.2292194813489914, 0.2462567687034607, 0.2632940411567688, 0.2803313136100769, 0.297368586063385, 0.3144058585166931, 0.3314431309700012, 0.3484804034233093, 0.36551767587661743, 0.3825549781322479, 0.39959225058555603, 0.41662952303886414, 0.43366679549217224, 0.45070406794548035, 0.46774134039878845, 0.48477864265441895, 0.501815915107727, 0.5188531875610352, 0.5358904600143433, 0.5529277324676514]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 14.0, 28.0, 63.0, 88.0, 153.0, 336.0, 590.0, 1312.0, 3491.0, 10304.0, 39429.0, 158467.0, 406375.0, 305274.0, 89939.0, 22152.0, 6235.0, 2253.0, 962.0, 479.0, 254.0, 140.0, 74.0, 35.0, 28.0, 30.0, 5.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451171875, -0.4355010986328125, -0.419830322265625, -0.4041595458984375, -0.38848876953125, -0.3728179931640625, -0.357147216796875, -0.3414764404296875, -0.3258056640625, -0.3101348876953125, -0.294464111328125, -0.2787933349609375, -0.26312255859375, -0.2474517822265625, -0.231781005859375, -0.2161102294921875, -0.200439453125, -0.1847686767578125, -0.169097900390625, -0.1534271240234375, -0.13775634765625, -0.1220855712890625, -0.106414794921875, -0.0907440185546875, -0.0750732421875, -0.0594024658203125, -0.043731689453125, -0.0280609130859375, -0.01239013671875, 0.0032806396484375, 0.018951416015625, 0.0346221923828125, 0.05029296875, 0.0659637451171875, 0.081634521484375, 0.0973052978515625, 0.11297607421875, 0.1286468505859375, 0.144317626953125, 0.1599884033203125, 0.1756591796875, 0.1913299560546875, 0.207000732421875, 0.2226715087890625, 0.23834228515625, 0.2540130615234375, 0.269683837890625, 0.2853546142578125, 0.301025390625, 0.3166961669921875, 0.332366943359375, 0.3480377197265625, 0.36370849609375, 0.3793792724609375, 0.395050048828125, 0.4107208251953125, 0.4263916015625, 0.4420623779296875, 0.457733154296875, 0.4734039306640625, 0.48907470703125, 0.5047454833984375, 0.520416259765625, 0.5360870361328125, 0.5517578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 5.0, 5.0, 6.0, 7.0, 18.0, 22.0, 34.0, 36.0, 51.0, 38.0, 48.0, 70.0, 64.0, 65.0, 73.0, 69.0, 55.0, 63.0, 51.0, 42.0, 40.0, 31.0, 35.0, 29.0, 12.0, 14.0, 10.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.171875, -9.943115234375, -9.71435546875, -9.485595703125, -9.2568359375, -9.028076171875, -8.79931640625, -8.570556640625, -8.341796875, -8.113037109375, -7.88427734375, -7.655517578125, -7.4267578125, -7.197998046875, -6.96923828125, -6.740478515625, -6.51171875, -6.282958984375, -6.05419921875, -5.825439453125, -5.5966796875, -5.367919921875, -5.13916015625, -4.910400390625, -4.681640625, -4.452880859375, -4.22412109375, -3.995361328125, -3.7666015625, -3.537841796875, -3.30908203125, -3.080322265625, -2.8515625, -2.622802734375, -2.39404296875, -2.165283203125, -1.9365234375, -1.707763671875, -1.47900390625, -1.250244140625, -1.021484375, -0.792724609375, -0.56396484375, -0.335205078125, -0.1064453125, 0.122314453125, 0.35107421875, 0.579833984375, 0.80859375, 1.037353515625, 1.26611328125, 1.494873046875, 1.7236328125, 1.952392578125, 2.18115234375, 2.409912109375, 2.638671875, 2.867431640625, 3.09619140625, 3.324951171875, 3.5537109375, 3.782470703125, 4.01123046875, 4.239990234375, 4.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 48.0, 66.0, 73.0, 112.0, 170.0, 250.0, 478.0, 1262.0, 26006.0, 1004302.0, 13411.0, 1050.0, 450.0, 263.0, 169.0, 99.0, 75.0, 59.0, 37.0, 25.0, 22.0, 8.0, 17.0, 9.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.306640625, -3.222808837890625, -3.13897705078125, -3.055145263671875, -2.9713134765625, -2.887481689453125, -2.80364990234375, -2.719818115234375, -2.635986328125, -2.552154541015625, -2.46832275390625, -2.384490966796875, -2.3006591796875, -2.216827392578125, -2.13299560546875, -2.049163818359375, -1.96533203125, -1.881500244140625, -1.79766845703125, -1.713836669921875, -1.6300048828125, -1.546173095703125, -1.46234130859375, -1.378509521484375, -1.294677734375, -1.210845947265625, -1.12701416015625, -1.043182373046875, -0.9593505859375, -0.875518798828125, -0.79168701171875, -0.707855224609375, -0.6240234375, -0.540191650390625, -0.45635986328125, -0.372528076171875, -0.2886962890625, -0.204864501953125, -0.12103271484375, -0.037200927734375, 0.046630859375, 0.130462646484375, 0.21429443359375, 0.298126220703125, 0.3819580078125, 0.465789794921875, 0.54962158203125, 0.633453369140625, 0.71728515625, 0.801116943359375, 0.88494873046875, 0.968780517578125, 1.0526123046875, 1.136444091796875, 1.22027587890625, 1.304107666015625, 1.387939453125, 1.471771240234375, 1.55560302734375, 1.639434814453125, 1.7232666015625, 1.807098388671875, 1.89093017578125, 1.974761962890625, 2.05859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 14.0, 16.0, 28.0, 32.0, 35.0, 47.0, 52.0, 43.0, 58.0, 75.0, 70.0, 58.0, 67.0, 53.0, 54.0, 51.0, 45.0, 45.0, 30.0, 30.0, 19.0, 16.0, 13.0, 10.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.8046875, -8.58111572265625, -8.3575439453125, -8.13397216796875, -7.910400390625, -7.68682861328125, -7.4632568359375, -7.23968505859375, -7.01611328125, -6.79254150390625, -6.5689697265625, -6.34539794921875, -6.121826171875, -5.89825439453125, -5.6746826171875, -5.45111083984375, -5.2275390625, -5.00396728515625, -4.7803955078125, -4.55682373046875, -4.333251953125, -4.10968017578125, -3.8861083984375, -3.66253662109375, -3.43896484375, -3.21539306640625, -2.9918212890625, -2.76824951171875, -2.544677734375, -2.32110595703125, -2.0975341796875, -1.87396240234375, -1.650390625, -1.42681884765625, -1.2032470703125, -0.97967529296875, -0.756103515625, -0.53253173828125, -0.3089599609375, -0.08538818359375, 0.13818359375, 0.36175537109375, 0.5853271484375, 0.80889892578125, 1.032470703125, 1.25604248046875, 1.4796142578125, 1.70318603515625, 1.9267578125, 2.15032958984375, 2.3739013671875, 2.59747314453125, 2.821044921875, 3.04461669921875, 3.2681884765625, 3.49176025390625, 3.71533203125, 3.93890380859375, 4.1624755859375, 4.38604736328125, 4.609619140625, 4.83319091796875, 5.0567626953125, 5.28033447265625, 5.50390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 5.0, 3.0, 10.0, 16.0, 8.0, 17.0, 24.0, 41.0, 43.0, 98.0, 168.0, 317.0, 705.0, 1780.0, 5908.0, 77296.0, 927290.0, 28394.0, 3863.0, 1378.0, 573.0, 258.0, 107.0, 75.0, 42.0, 35.0, 22.0, 29.0, 20.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.40087890625, -0.3911857604980469, -0.38149261474609375, -0.3717994689941406, -0.3621063232421875, -0.3524131774902344, -0.34272003173828125, -0.3330268859863281, -0.323333740234375, -0.3136405944824219, -0.30394744873046875, -0.2942543029785156, -0.2845611572265625, -0.2748680114746094, -0.26517486572265625, -0.2554817199707031, -0.24578857421875, -0.23609542846679688, -0.22640228271484375, -0.21670913696289062, -0.2070159912109375, -0.19732284545898438, -0.18762969970703125, -0.17793655395507812, -0.168243408203125, -0.15855026245117188, -0.14885711669921875, -0.13916397094726562, -0.1294708251953125, -0.11977767944335938, -0.11008453369140625, -0.10039138793945312, -0.0906982421875, -0.08100509643554688, -0.07131195068359375, -0.061618804931640625, -0.0519256591796875, -0.042232513427734375, -0.03253936767578125, -0.022846221923828125, -0.013153076171875, -0.003459930419921875, 0.00623321533203125, 0.015926361083984375, 0.0256195068359375, 0.035312652587890625, 0.04500579833984375, 0.054698944091796875, 0.06439208984375, 0.07408523559570312, 0.08377838134765625, 0.09347152709960938, 0.1031646728515625, 0.11285781860351562, 0.12255096435546875, 0.13224411010742188, 0.141937255859375, 0.15163040161132812, 0.16132354736328125, 0.17101669311523438, 0.1807098388671875, 0.19040298461914062, 0.20009613037109375, 0.20978927612304688, 0.219482421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 18.0, 39.0, 51.0, 103.0, 191.0, 222.0, 167.0, 85.0, 37.0, 24.0, 8.0, 12.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0384788513183594e-05, -1.9329600036144257e-05, -1.827441155910492e-05, -1.7219223082065582e-05, -1.6164034605026245e-05, -1.5108846127986908e-05, -1.405365765094757e-05, -1.2998469173908234e-05, -1.1943280696868896e-05, -1.088809221982956e-05, -9.832903742790222e-06, -8.777715265750885e-06, -7.722526788711548e-06, -6.667338311672211e-06, -5.6121498346328735e-06, -4.556961357593536e-06, -3.5017728805541992e-06, -2.446584403514862e-06, -1.391395926475525e-06, -3.3620744943618774e-07, 7.189810276031494e-07, 1.7741695046424866e-06, 2.8293579816818237e-06, 3.884546458721161e-06, 4.939734935760498e-06, 5.994923412799835e-06, 7.050111889839172e-06, 8.10530036687851e-06, 9.160488843917847e-06, 1.0215677320957184e-05, 1.1270865797996521e-05, 1.2326054275035858e-05, 1.3381242752075195e-05, 1.4436431229114532e-05, 1.549161970615387e-05, 1.6546808183193207e-05, 1.7601996660232544e-05, 1.865718513727188e-05, 1.9712373614311218e-05, 2.0767562091350555e-05, 2.1822750568389893e-05, 2.287793904542923e-05, 2.3933127522468567e-05, 2.4988315999507904e-05, 2.604350447654724e-05, 2.709869295358658e-05, 2.8153881430625916e-05, 2.9209069907665253e-05, 3.026425838470459e-05, 3.131944686174393e-05, 3.2374635338783264e-05, 3.34298238158226e-05, 3.448501229286194e-05, 3.5540200769901276e-05, 3.659538924694061e-05, 3.765057772397995e-05, 3.870576620101929e-05, 3.9760954678058624e-05, 4.081614315509796e-05, 4.18713316321373e-05, 4.2926520109176636e-05, 4.398170858621597e-05, 4.503689706325531e-05, 4.609208554029465e-05, 4.7147274017333984e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 11.0, 13.0, 17.0, 28.0, 52.0, 121.0, 298.0, 1236.0, 9219.0, 480832.0, 544910.0, 9965.0, 1270.0, 287.0, 120.0, 64.0, 35.0, 16.0, 15.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.392822265625, -0.38368988037109375, -0.3745574951171875, -0.36542510986328125, -0.356292724609375, -0.34716033935546875, -0.3380279541015625, -0.32889556884765625, -0.31976318359375, -0.31063079833984375, -0.3014984130859375, -0.29236602783203125, -0.283233642578125, -0.27410125732421875, -0.2649688720703125, -0.25583648681640625, -0.2467041015625, -0.23757171630859375, -0.2284393310546875, -0.21930694580078125, -0.210174560546875, -0.20104217529296875, -0.1919097900390625, -0.18277740478515625, -0.17364501953125, -0.16451263427734375, -0.1553802490234375, -0.14624786376953125, -0.137115478515625, -0.12798309326171875, -0.1188507080078125, -0.10971832275390625, -0.1005859375, -0.09145355224609375, -0.0823211669921875, -0.07318878173828125, -0.064056396484375, -0.05492401123046875, -0.0457916259765625, -0.03665924072265625, -0.02752685546875, -0.01839447021484375, -0.0092620849609375, -0.00012969970703125, 0.009002685546875, 0.01813507080078125, 0.0272674560546875, 0.03639984130859375, 0.0455322265625, 0.05466461181640625, 0.0637969970703125, 0.07292938232421875, 0.082061767578125, 0.09119415283203125, 0.1003265380859375, 0.10945892333984375, 0.11859130859375, 0.12772369384765625, 0.1368560791015625, 0.14598846435546875, 0.155120849609375, 0.16425323486328125, 0.1733856201171875, 0.18251800537109375, 0.191650390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 8.0, 14.0, 13.0, 17.0, 33.0, 44.0, 54.0, 76.0, 81.0, 107.0, 97.0, 117.0, 93.0, 77.0, 50.0, 29.0, 25.0, 17.0, 11.0, 9.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.0681910514831543, -0.0664968490600586, -0.06480264663696289, -0.06310844421386719, -0.061414241790771484, -0.05972003936767578, -0.05802583694458008, -0.056331634521484375, -0.05463743209838867, -0.05294322967529297, -0.051249027252197266, -0.04955482482910156, -0.04786062240600586, -0.046166419982910156, -0.04447221755981445, -0.04277801513671875, -0.04108381271362305, -0.039389610290527344, -0.03769540786743164, -0.03600120544433594, -0.034307003021240234, -0.03261280059814453, -0.030918598175048828, -0.029224395751953125, -0.027530193328857422, -0.02583599090576172, -0.024141788482666016, -0.022447586059570312, -0.02075338363647461, -0.019059181213378906, -0.017364978790283203, -0.0156707763671875, -0.013976573944091797, -0.012282371520996094, -0.01058816909790039, -0.008893966674804688, -0.007199764251708984, -0.005505561828613281, -0.003811359405517578, -0.002117156982421875, -0.0004229545593261719, 0.0012712478637695312, 0.0029654502868652344, 0.0046596527099609375, 0.006353855133056641, 0.008048057556152344, 0.009742259979248047, 0.01143646240234375, 0.013130664825439453, 0.014824867248535156, 0.01651906967163086, 0.018213272094726562, 0.019907474517822266, 0.02160167694091797, 0.023295879364013672, 0.024990081787109375, 0.026684284210205078, 0.02837848663330078, 0.030072689056396484, 0.03176689147949219, 0.03346109390258789, 0.035155296325683594, 0.0368494987487793, 0.038543701171875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 1014.0, 1.0], "bins": [-92.85832214355469, -91.3709945678711, -89.88365936279297, -88.39633178710938, -86.90899658203125, -85.42166900634766, -83.93434143066406, -82.44700622558594, -80.95967864990234, -79.47235107421875, -77.98501586914062, -76.49768829345703, -75.0103530883789, -73.52302551269531, -72.03569030761719, -70.5483627319336, -69.06103515625, -67.5737075805664, -66.08637237548828, -64.59904479980469, -63.11171340942383, -61.62438201904297, -60.13705062866211, -58.64971923828125, -57.162384033203125, -55.675052642822266, -54.187721252441406, -52.70039367675781, -51.21306228637695, -49.725730895996094, -48.238399505615234, -46.751068115234375, -45.26374053955078, -43.77640914916992, -42.28907775878906, -40.80175018310547, -39.31441879272461, -37.82708740234375, -36.33975601196289, -34.85242462158203, -33.36509704589844, -31.877765655517578, -30.39043617248535, -28.903104782104492, -27.415775299072266, -25.928443908691406, -24.441112518310547, -22.953781127929688, -21.46645164489746, -19.9791202545166, -18.491790771484375, -17.004459381103516, -15.517128944396973, -14.02979850769043, -12.54246711730957, -11.055136680603027, -9.567806243896484, -8.080475807189941, -6.59314489364624, -5.105813980102539, -3.618483543395996, -2.131153106689453, -0.6438217163085938, 0.8435087203979492, 2.3308393955230713]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 7.0, 10.0, 11.0, 10.0, 14.0, 26.0, 27.0, 26.0, 32.0, 39.0, 39.0, 42.0, 38.0, 40.0, 52.0, 59.0, 52.0, 51.0, 48.0, 39.0, 40.0, 41.0, 38.0, 43.0, 27.0, 22.0, 26.0, 17.0, 9.0, 12.0, 21.0, 5.0, 5.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.387990951538086, -9.131377220153809, -8.874763488769531, -8.618149757385254, -8.361536026000977, -8.1049222946167, -7.848308563232422, -7.5916948318481445, -7.335081100463867, -7.07846736907959, -6.8218536376953125, -6.565239906311035, -6.308626174926758, -6.0520124435424805, -5.795398712158203, -5.538784980773926, -5.28217077255249, -5.025557041168213, -4.7689433097839355, -4.512329578399658, -4.255715847015381, -3.9991021156311035, -3.742488145828247, -3.4858744144439697, -3.2292606830596924, -2.972646951675415, -2.7160332202911377, -2.4594192504882812, -2.202805519104004, -1.9461919069290161, -1.6895780563354492, -1.4329643249511719, -1.1763501167297363, -0.919736385345459, -0.6631225943565369, -0.40650880336761475, -0.1498950719833374, 0.10671865940093994, 0.36333250999450684, 0.6199462413787842, 0.8765599727630615, 1.1331737041473389, 1.3897874355316162, 1.646401286125183, 1.9030150175094604, 2.1596288681030273, 2.4162425994873047, 2.672856330871582, 2.9294700622558594, 3.1860837936401367, 3.442697525024414, 3.6993112564086914, 3.9559249877929688, 4.212538719177246, 4.469152450561523, 4.725766181945801, 4.982379913330078, 5.2389936447143555, 5.495607376098633, 5.75222110748291, 6.0088348388671875, 6.265448570251465, 6.522062301635742, 6.7786760330200195, 7.035290241241455]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 9.0, 8.0, 18.0, 25.0, 35.0, 31.0, 52.0, 72.0, 179.0, 966.0, 26147.0, 3171479.0, 988102.0, 6356.0, 451.0, 104.0, 43.0, 53.0, 34.0, 30.0, 19.0, 18.0, 13.0, 12.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.87359619140625, -2.7803955078125, -2.68719482421875, -2.593994140625, -2.50079345703125, -2.4075927734375, -2.31439208984375, -2.22119140625, -2.12799072265625, -2.0347900390625, -1.94158935546875, -1.848388671875, -1.75518798828125, -1.6619873046875, -1.56878662109375, -1.4755859375, -1.38238525390625, -1.2891845703125, -1.19598388671875, -1.102783203125, -1.00958251953125, -0.9163818359375, -0.82318115234375, -0.72998046875, -0.63677978515625, -0.5435791015625, -0.45037841796875, -0.357177734375, -0.26397705078125, -0.1707763671875, -0.07757568359375, 0.015625, 0.10882568359375, 0.2020263671875, 0.29522705078125, 0.388427734375, 0.48162841796875, 0.5748291015625, 0.66802978515625, 0.76123046875, 0.85443115234375, 0.9476318359375, 1.04083251953125, 1.134033203125, 1.22723388671875, 1.3204345703125, 1.41363525390625, 1.5068359375, 1.60003662109375, 1.6932373046875, 1.78643798828125, 1.879638671875, 1.97283935546875, 2.0660400390625, 2.15924072265625, 2.25244140625, 2.34564208984375, 2.4388427734375, 2.53204345703125, 2.625244140625, 2.71844482421875, 2.8116455078125, 2.90484619140625, 2.998046875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 10.0, 2.0, 8.0, 11.0, 9.0, 12.0, 19.0, 25.0, 26.0, 19.0, 25.0, 39.0, 29.0, 33.0, 43.0, 36.0, 43.0, 41.0, 40.0, 44.0, 44.0, 39.0, 43.0, 37.0, 52.0, 31.0, 35.0, 37.0, 20.0, 22.0, 19.0, 20.0, 16.0, 6.0, 12.0, 6.0, 10.0, 6.0, 9.0, 6.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.80859375, -0.786376953125, -0.76416015625, -0.741943359375, -0.7197265625, -0.697509765625, -0.67529296875, -0.653076171875, -0.630859375, -0.608642578125, -0.58642578125, -0.564208984375, -0.5419921875, -0.519775390625, -0.49755859375, -0.475341796875, -0.453125, -0.430908203125, -0.40869140625, -0.386474609375, -0.3642578125, -0.342041015625, -0.31982421875, -0.297607421875, -0.275390625, -0.253173828125, -0.23095703125, -0.208740234375, -0.1865234375, -0.164306640625, -0.14208984375, -0.119873046875, -0.09765625, -0.075439453125, -0.05322265625, -0.031005859375, -0.0087890625, 0.013427734375, 0.03564453125, 0.057861328125, 0.080078125, 0.102294921875, 0.12451171875, 0.146728515625, 0.1689453125, 0.191162109375, 0.21337890625, 0.235595703125, 0.2578125, 0.280029296875, 0.30224609375, 0.324462890625, 0.3466796875, 0.368896484375, 0.39111328125, 0.413330078125, 0.435546875, 0.457763671875, 0.47998046875, 0.502197265625, 0.5244140625, 0.546630859375, 0.56884765625, 0.591064453125, 0.61328125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 10.0, 17.0, 29.0, 101.0, 3998666.0, 195279.0, 81.0, 37.0, 17.0, 10.0, 5.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.11572265625, -38.7314453125, -37.34716796875, -35.962890625, -34.57861328125, -33.1943359375, -31.81005859375, -30.42578125, -29.04150390625, -27.6572265625, -26.27294921875, -24.888671875, -23.50439453125, -22.1201171875, -20.73583984375, -19.3515625, -17.96728515625, -16.5830078125, -15.19873046875, -13.814453125, -12.43017578125, -11.0458984375, -9.66162109375, -8.27734375, -6.89306640625, -5.5087890625, -4.12451171875, -2.740234375, -1.35595703125, 0.0283203125, 1.41259765625, 2.796875, 4.18115234375, 5.5654296875, 6.94970703125, 8.333984375, 9.71826171875, 11.1025390625, 12.48681640625, 13.87109375, 15.25537109375, 16.6396484375, 18.02392578125, 19.408203125, 20.79248046875, 22.1767578125, 23.56103515625, 24.9453125, 26.32958984375, 27.7138671875, 29.09814453125, 30.482421875, 31.86669921875, 33.2509765625, 34.63525390625, 36.01953125, 37.40380859375, 38.7880859375, 40.17236328125, 41.556640625, 42.94091796875, 44.3251953125, 45.70947265625, 47.09375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 5.0, 12.0, 15.0, 41.0, 44.0, 69.0, 94.0, 181.0, 291.0, 501.0, 675.0, 753.0, 519.0, 328.0, 217.0, 119.0, 72.0, 51.0, 22.0, 25.0, 9.0, 10.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3505859375, -0.3381195068359375, -0.325653076171875, -0.3131866455078125, -0.30072021484375, -0.2882537841796875, -0.275787353515625, -0.2633209228515625, -0.2508544921875, -0.2383880615234375, -0.225921630859375, -0.2134552001953125, -0.20098876953125, -0.1885223388671875, -0.176055908203125, -0.1635894775390625, -0.151123046875, -0.1386566162109375, -0.126190185546875, -0.1137237548828125, -0.10125732421875, -0.0887908935546875, -0.076324462890625, -0.0638580322265625, -0.0513916015625, -0.0389251708984375, -0.026458740234375, -0.0139923095703125, -0.00152587890625, 0.0109405517578125, 0.023406982421875, 0.0358734130859375, 0.04833984375, 0.0608062744140625, 0.073272705078125, 0.0857391357421875, 0.09820556640625, 0.1106719970703125, 0.123138427734375, 0.1356048583984375, 0.1480712890625, 0.1605377197265625, 0.173004150390625, 0.1854705810546875, 0.19793701171875, 0.2104034423828125, 0.222869873046875, 0.2353363037109375, 0.247802734375, 0.2602691650390625, 0.272735595703125, 0.2852020263671875, 0.29766845703125, 0.3101348876953125, 0.322601318359375, 0.3350677490234375, 0.3475341796875, 0.3600006103515625, 0.372467041015625, 0.3849334716796875, 0.39739990234375, 0.4098663330078125, 0.422332763671875, 0.4347991943359375, 0.447265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 11.0, 23.0, 38.0, 59.0, 77.0, 107.0, 117.0, 134.0, 107.0, 95.0, 81.0, 60.0, 35.0, 26.0, 11.0, 12.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0482101440429688, -0.9975103735923767, -0.9468106031417847, -0.8961108326911926, -0.8454110622406006, -0.7947112321853638, -0.7440115213394165, -0.6933116912841797, -0.6426119804382324, -0.5919122099876404, -0.5412124395370483, -0.4905126690864563, -0.43981289863586426, -0.38911309838294983, -0.3384133279323578, -0.28771355748176575, -0.23701375722885132, -0.18631398677825928, -0.13561421632766724, -0.084914430975914, -0.03421466052532196, 0.016485124826431274, 0.06718489527702332, 0.11788466572761536, 0.1685844361782074, 0.21928420662879944, 0.2699839770793915, 0.3206837773323059, 0.37138354778289795, 0.42208331823349, 0.47278308868408203, 0.5234828591346741, 0.5741826295852661, 0.6248824000358582, 0.6755821704864502, 0.7262819409370422, 0.7769817113876343, 0.8276815414428711, 0.8783812522888184, 0.9290810823440552, 0.9797807931900024, 1.0304806232452393, 1.0811803340911865, 1.1318801641464233, 1.1825798749923706, 1.2332797050476074, 1.2839794158935547, 1.3346792459487915, 1.3853790760040283, 1.4360789060592651, 1.4867786169052124, 1.5374784469604492, 1.5881781578063965, 1.6388779878616333, 1.6895776987075806, 1.7402775287628174, 1.7909772396087646, 1.8416770696640015, 1.8923767805099487, 1.9430766105651855, 1.9937763214111328, 2.04447603225708, 2.0951759815216064, 2.1458756923675537, 2.196575403213501]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 11.0, 5.0, 16.0, 16.0, 21.0, 15.0, 32.0, 33.0, 34.0, 31.0, 39.0, 36.0, 38.0, 49.0, 45.0, 40.0, 49.0, 38.0, 46.0, 53.0, 35.0, 35.0, 43.0, 31.0, 36.0, 30.0, 28.0, 23.0, 19.0, 15.0, 11.0, 8.0, 6.0, 3.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8198073506355286, -0.7944751977920532, -0.7691431045532227, -0.7438109517097473, -0.718478798866272, -0.6931467056274414, -0.6678145527839661, -0.6424823999404907, -0.6171503067016602, -0.5918181538581848, -0.5664860606193542, -0.5411539077758789, -0.5158218145370483, -0.490489661693573, -0.46515750885009766, -0.4398253858089447, -0.41449326276779175, -0.3891611397266388, -0.36382901668548584, -0.3384968638420105, -0.31316474080085754, -0.2878326177597046, -0.26250046491622925, -0.2371683418750763, -0.21183621883392334, -0.18650409579277039, -0.16117195785045624, -0.1358398199081421, -0.11050769686698914, -0.08517557382583618, -0.059843435883522034, -0.034511297941207886, -0.009179115295410156, 0.016153015196323395, 0.041485145688056946, 0.0668172761797905, 0.09214940667152405, 0.117481529712677, 0.14281366765499115, 0.1681458055973053, 0.19347792863845825, 0.2188100516796112, 0.24414218962192535, 0.2694743275642395, 0.29480645060539246, 0.3201385736465454, 0.34547072649002075, 0.3708028495311737, 0.39613497257232666, 0.4214670956134796, 0.44679921865463257, 0.4721313714981079, 0.49746349453926086, 0.5227956175804138, 0.5481277704238892, 0.5734598636627197, 0.5987920165061951, 0.6241241693496704, 0.649456262588501, 0.6747884154319763, 0.7001205682754517, 0.7254526615142822, 0.7507848143577576, 0.7761169672012329, 0.8014490604400635]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 13.0, 7.0, 28.0, 36.0, 72.0, 99.0, 172.0, 270.0, 488.0, 736.0, 1202.0, 1996.0, 3332.0, 5710.0, 11345.0, 25708.0, 71289.0, 216195.0, 393492.0, 201578.0, 66423.0, 24175.0, 10660.0, 5438.0, 3214.0, 1892.0, 1130.0, 688.0, 414.0, 249.0, 178.0, 120.0, 60.0, 49.0, 39.0, 17.0, 11.0, 9.0, 7.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31494140625, -0.3055305480957031, -0.29611968994140625, -0.2867088317871094, -0.2772979736328125, -0.2678871154785156, -0.25847625732421875, -0.24906539916992188, -0.239654541015625, -0.23024368286132812, -0.22083282470703125, -0.21142196655273438, -0.2020111083984375, -0.19260025024414062, -0.18318939208984375, -0.17377853393554688, -0.16436767578125, -0.15495681762695312, -0.14554595947265625, -0.13613510131835938, -0.1267242431640625, -0.11731338500976562, -0.10790252685546875, -0.09849166870117188, -0.089080810546875, -0.07966995239257812, -0.07025909423828125, -0.060848236083984375, -0.0514373779296875, -0.042026519775390625, -0.03261566162109375, -0.023204803466796875, -0.0137939453125, -0.004383087158203125, 0.00502777099609375, 0.014438629150390625, 0.0238494873046875, 0.033260345458984375, 0.04267120361328125, 0.052082061767578125, 0.061492919921875, 0.07090377807617188, 0.08031463623046875, 0.08972549438476562, 0.0991363525390625, 0.10854721069335938, 0.11795806884765625, 0.12736892700195312, 0.13677978515625, 0.14619064331054688, 0.15560150146484375, 0.16501235961914062, 0.1744232177734375, 0.18383407592773438, 0.19324493408203125, 0.20265579223632812, 0.212066650390625, 0.22147750854492188, 0.23088836669921875, 0.24029922485351562, 0.2497100830078125, 0.2591209411621094, 0.26853179931640625, 0.2779426574707031, 0.287353515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 10.0, 16.0, 15.0, 18.0, 29.0, 20.0, 31.0, 30.0, 35.0, 34.0, 32.0, 40.0, 57.0, 52.0, 39.0, 44.0, 58.0, 36.0, 57.0, 42.0, 42.0, 35.0, 34.0, 24.0, 29.0, 27.0, 19.0, 19.0, 11.0, 10.0, 6.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5526199340820312, -0.5363922119140625, -0.5201644897460938, -0.503936767578125, -0.48770904541015625, -0.4714813232421875, -0.45525360107421875, -0.43902587890625, -0.42279815673828125, -0.4065704345703125, -0.39034271240234375, -0.374114990234375, -0.35788726806640625, -0.3416595458984375, -0.32543182373046875, -0.3092041015625, -0.29297637939453125, -0.2767486572265625, -0.26052093505859375, -0.244293212890625, -0.22806549072265625, -0.2118377685546875, -0.19561004638671875, -0.17938232421875, -0.16315460205078125, -0.1469268798828125, -0.13069915771484375, -0.114471435546875, -0.09824371337890625, -0.0820159912109375, -0.06578826904296875, -0.049560546875, -0.03333282470703125, -0.0171051025390625, -0.00087738037109375, 0.015350341796875, 0.03157806396484375, 0.0478057861328125, 0.06403350830078125, 0.08026123046875, 0.09648895263671875, 0.1127166748046875, 0.12894439697265625, 0.145172119140625, 0.16139984130859375, 0.1776275634765625, 0.19385528564453125, 0.2100830078125, 0.22631072998046875, 0.2425384521484375, 0.25876617431640625, 0.274993896484375, 0.29122161865234375, 0.3074493408203125, 0.32367706298828125, 0.33990478515625, 0.35613250732421875, 0.3723602294921875, 0.38858795166015625, 0.404815673828125, 0.42104339599609375, 0.4372711181640625, 0.45349884033203125, 0.4697265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 12.0, 19.0, 20.0, 44.0, 58.0, 130.0, 261.0, 548.0, 1186.0, 2780.0, 7578.0, 30019.0, 193549.0, 606244.0, 168091.0, 26433.0, 6960.0, 2502.0, 1072.0, 457.0, 234.0, 133.0, 75.0, 40.0, 34.0, 21.0, 14.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6040611267089844, -0.5870285034179688, -0.5699958801269531, -0.5529632568359375, -0.5359306335449219, -0.5188980102539062, -0.5018653869628906, -0.484832763671875, -0.4678001403808594, -0.45076751708984375, -0.4337348937988281, -0.4167022705078125, -0.3996696472167969, -0.38263702392578125, -0.3656044006347656, -0.34857177734375, -0.3315391540527344, -0.31450653076171875, -0.2974739074707031, -0.2804412841796875, -0.2634086608886719, -0.24637603759765625, -0.22934341430664062, -0.212310791015625, -0.19527816772460938, -0.17824554443359375, -0.16121292114257812, -0.1441802978515625, -0.12714767456054688, -0.11011505126953125, -0.09308242797851562, -0.0760498046875, -0.059017181396484375, -0.04198455810546875, -0.024951934814453125, -0.0079193115234375, 0.009113311767578125, 0.02614593505859375, 0.043178558349609375, 0.060211181640625, 0.07724380493164062, 0.09427642822265625, 0.11130905151367188, 0.1283416748046875, 0.14537429809570312, 0.16240692138671875, 0.17943954467773438, 0.19647216796875, 0.21350479125976562, 0.23053741455078125, 0.24757003784179688, 0.2646026611328125, 0.2816352844238281, 0.29866790771484375, 0.3157005310058594, 0.332733154296875, 0.3497657775878906, 0.36679840087890625, 0.3838310241699219, 0.4008636474609375, 0.4178962707519531, 0.43492889404296875, 0.4519615173339844, 0.468994140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 13.0, 8.0, 13.0, 23.0, 23.0, 20.0, 27.0, 25.0, 24.0, 38.0, 24.0, 37.0, 39.0, 45.0, 54.0, 46.0, 43.0, 42.0, 54.0, 39.0, 34.0, 37.0, 35.0, 27.0, 29.0, 33.0, 34.0, 24.0, 9.0, 14.0, 11.0, 11.0, 9.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8779296875, -0.8498916625976562, -0.8218536376953125, -0.7938156127929688, -0.765777587890625, -0.7377395629882812, -0.7097015380859375, -0.6816635131835938, -0.65362548828125, -0.6255874633789062, -0.5975494384765625, -0.5695114135742188, -0.541473388671875, -0.5134353637695312, -0.4853973388671875, -0.45735931396484375, -0.4293212890625, -0.40128326416015625, -0.3732452392578125, -0.34520721435546875, -0.317169189453125, -0.28913116455078125, -0.2610931396484375, -0.23305511474609375, -0.20501708984375, -0.17697906494140625, -0.1489410400390625, -0.12090301513671875, -0.092864990234375, -0.06482696533203125, -0.0367889404296875, -0.00875091552734375, 0.019287109375, 0.04732513427734375, 0.0753631591796875, 0.10340118408203125, 0.131439208984375, 0.15947723388671875, 0.1875152587890625, 0.21555328369140625, 0.24359130859375, 0.27162933349609375, 0.2996673583984375, 0.32770538330078125, 0.355743408203125, 0.38378143310546875, 0.4118194580078125, 0.43985748291015625, 0.4678955078125, 0.49593353271484375, 0.5239715576171875, 0.5520095825195312, 0.580047607421875, 0.6080856323242188, 0.6361236572265625, 0.6641616821289062, 0.69219970703125, 0.7202377319335938, 0.7482757568359375, 0.7763137817382812, 0.804351806640625, 0.8323898315429688, 0.8604278564453125, 0.8884658813476562, 0.91650390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 10.0, 11.0, 27.0, 30.0, 29.0, 44.0, 74.0, 120.0, 152.0, 271.0, 457.0, 719.0, 1384.0, 2607.0, 5301.0, 11607.0, 28468.0, 91792.0, 339343.0, 393281.0, 113570.0, 33626.0, 13199.0, 5885.0, 2853.0, 1492.0, 855.0, 489.0, 298.0, 208.0, 101.0, 91.0, 44.0, 29.0, 20.0, 15.0, 18.0, 6.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.09649658203125, -0.09366512298583984, -0.09083366394042969, -0.08800220489501953, -0.08517074584960938, -0.08233928680419922, -0.07950782775878906, -0.0766763687133789, -0.07384490966796875, -0.0710134506225586, -0.06818199157714844, -0.06535053253173828, -0.06251907348632812, -0.05968761444091797, -0.05685615539550781, -0.054024696350097656, -0.0511932373046875, -0.048361778259277344, -0.04553031921386719, -0.04269886016845703, -0.039867401123046875, -0.03703594207763672, -0.03420448303222656, -0.031373023986816406, -0.02854156494140625, -0.025710105895996094, -0.022878646850585938, -0.02004718780517578, -0.017215728759765625, -0.014384269714355469, -0.011552810668945312, -0.008721351623535156, -0.005889892578125, -0.0030584335327148438, -0.0002269744873046875, 0.0026044845581054688, 0.005435943603515625, 0.008267402648925781, 0.011098861694335938, 0.013930320739746094, 0.01676177978515625, 0.019593238830566406, 0.022424697875976562, 0.02525615692138672, 0.028087615966796875, 0.03091907501220703, 0.03375053405761719, 0.036581993103027344, 0.0394134521484375, 0.042244911193847656, 0.04507637023925781, 0.04790782928466797, 0.050739288330078125, 0.05357074737548828, 0.05640220642089844, 0.059233665466308594, 0.06206512451171875, 0.0648965835571289, 0.06772804260253906, 0.07055950164794922, 0.07339096069335938, 0.07622241973876953, 0.07905387878417969, 0.08188533782958984, 0.084716796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 9.0, 14.0, 13.0, 24.0, 33.0, 44.0, 73.0, 104.0, 131.0, 113.0, 115.0, 99.0, 70.0, 45.0, 33.0, 16.0, 18.0, 4.0, 10.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.221366882324219e-05, -5.031470209360123e-05, -4.8415735363960266e-05, -4.6516768634319305e-05, -4.4617801904678345e-05, -4.2718835175037384e-05, -4.081986844539642e-05, -3.892090171575546e-05, -3.70219349861145e-05, -3.512296825647354e-05, -3.322400152683258e-05, -3.132503479719162e-05, -2.942606806755066e-05, -2.75271013379097e-05, -2.5628134608268738e-05, -2.3729167878627777e-05, -2.1830201148986816e-05, -1.9931234419345856e-05, -1.8032267689704895e-05, -1.6133300960063934e-05, -1.4234334230422974e-05, -1.2335367500782013e-05, -1.0436400771141052e-05, -8.537434041500092e-06, -6.638467311859131e-06, -4.73950058221817e-06, -2.8405338525772095e-06, -9.415671229362488e-07, 9.57399606704712e-07, 2.8563663363456726e-06, 4.755333065986633e-06, 6.654299795627594e-06, 8.553266525268555e-06, 1.0452233254909515e-05, 1.2351199984550476e-05, 1.4250166714191437e-05, 1.6149133443832397e-05, 1.8048100173473358e-05, 1.994706690311432e-05, 2.184603363275528e-05, 2.374500036239624e-05, 2.56439670920372e-05, 2.754293382167816e-05, 2.9441900551319122e-05, 3.134086728096008e-05, 3.3239834010601044e-05, 3.5138800740242004e-05, 3.7037767469882965e-05, 3.8936734199523926e-05, 4.0835700929164886e-05, 4.273466765880585e-05, 4.463363438844681e-05, 4.653260111808777e-05, 4.843156784772873e-05, 5.033053457736969e-05, 5.222950130701065e-05, 5.412846803665161e-05, 5.602743476629257e-05, 5.792640149593353e-05, 5.9825368225574493e-05, 6.172433495521545e-05, 6.362330168485641e-05, 6.552226841449738e-05, 6.742123514413834e-05, 6.93202018737793e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 3.0, 10.0, 9.0, 16.0, 15.0, 12.0, 28.0, 30.0, 44.0, 59.0, 82.0, 145.0, 393.0, 2868.0, 109018.0, 920109.0, 14172.0, 943.0, 221.0, 114.0, 64.0, 25.0, 40.0, 25.0, 17.0, 19.0, 17.0, 9.0, 7.0, 9.0, 7.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.3386688232421875, -0.325775146484375, -0.3128814697265625, -0.29998779296875, -0.2870941162109375, -0.274200439453125, -0.2613067626953125, -0.2484130859375, -0.2355194091796875, -0.222625732421875, -0.2097320556640625, -0.19683837890625, -0.1839447021484375, -0.171051025390625, -0.1581573486328125, -0.145263671875, -0.1323699951171875, -0.119476318359375, -0.1065826416015625, -0.09368896484375, -0.0807952880859375, -0.067901611328125, -0.0550079345703125, -0.0421142578125, -0.0292205810546875, -0.016326904296875, -0.0034332275390625, 0.00946044921875, 0.0223541259765625, 0.035247802734375, 0.0481414794921875, 0.06103515625, 0.0739288330078125, 0.086822509765625, 0.0997161865234375, 0.11260986328125, 0.1255035400390625, 0.138397216796875, 0.1512908935546875, 0.1641845703125, 0.1770782470703125, 0.189971923828125, 0.2028656005859375, 0.21575927734375, 0.2286529541015625, 0.241546630859375, 0.2544403076171875, 0.267333984375, 0.2802276611328125, 0.293121337890625, 0.3060150146484375, 0.31890869140625, 0.3318023681640625, 0.344696044921875, 0.3575897216796875, 0.3704833984375, 0.3833770751953125, 0.396270751953125, 0.4091644287109375, 0.42205810546875, 0.4349517822265625, 0.447845458984375, 0.4607391357421875, 0.4736328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 4.0, 9.0, 13.0, 17.0, 26.0, 30.0, 45.0, 47.0, 77.0, 77.0, 81.0, 105.0, 107.0, 75.0, 69.0, 42.0, 43.0, 38.0, 27.0, 16.0, 10.0, 7.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033294677734375, -0.03223228454589844, -0.031169891357421875, -0.030107498168945312, -0.02904510498046875, -0.027982711791992188, -0.026920318603515625, -0.025857925415039062, -0.0247955322265625, -0.023733139038085938, -0.022670745849609375, -0.021608352661132812, -0.02054595947265625, -0.019483566284179688, -0.018421173095703125, -0.017358779907226562, -0.01629638671875, -0.015233993530273438, -0.014171600341796875, -0.013109207153320312, -0.01204681396484375, -0.010984420776367188, -0.009922027587890625, -0.008859634399414062, -0.0077972412109375, -0.0067348480224609375, -0.005672454833984375, -0.0046100616455078125, -0.00354766845703125, -0.0024852752685546875, -0.001422882080078125, -0.0003604888916015625, 0.000701904296875, 0.0017642974853515625, 0.002826690673828125, 0.0038890838623046875, 0.00495147705078125, 0.0060138702392578125, 0.007076263427734375, 0.008138656616210938, 0.0092010498046875, 0.010263442993164062, 0.011325836181640625, 0.012388229370117188, 0.01345062255859375, 0.014513015747070312, 0.015575408935546875, 0.016637802124023438, 0.0177001953125, 0.018762588500976562, 0.019824981689453125, 0.020887374877929688, 0.02194976806640625, 0.023012161254882812, 0.024074554443359375, 0.025136947631835938, 0.0261993408203125, 0.027261734008789062, 0.028324127197265625, 0.029386520385742188, 0.03044891357421875, 0.03151130676269531, 0.032573699951171875, 0.03363609313964844, 0.034698486328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 14.0, 23.0, 48.0, 59.0, 95.0, 121.0, 122.0, 130.0, 126.0, 82.0, 67.0, 48.0, 20.0, 15.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8252111077308655, -0.7936931252479553, -0.7621752023696899, -0.7306572198867798, -0.6991392374038696, -0.6676212549209595, -0.6361032724380493, -0.6045853495597839, -0.5730673670768738, -0.5415493845939636, -0.5100314617156982, -0.4785134792327881, -0.44699549674987793, -0.4154775142669678, -0.38395956158638, -0.35244160890579224, -0.3209236264228821, -0.2894056439399719, -0.25788769125938416, -0.2263697236776352, -0.19485175609588623, -0.16333378851413727, -0.1318158209323883, -0.10029785335063934, -0.06877988576889038, -0.03726191818714142, -0.005743950605392456, 0.025774016976356506, 0.05729198455810547, 0.08880995213985443, 0.1203279197216034, 0.15184588730335236, 0.1833639144897461, 0.21488188207149506, 0.24639984965324402, 0.2779178023338318, 0.30943578481674194, 0.3409537672996521, 0.37247171998023987, 0.40398967266082764, 0.4355076551437378, 0.46702563762664795, 0.4985435903072357, 0.5300615429878235, 0.5615795254707336, 0.5930975079536438, 0.6246154308319092, 0.6561334133148193, 0.6876513957977295, 0.7191693782806396, 0.7506873607635498, 0.7822052836418152, 0.8137232661247253, 0.8452412486076355, 0.8767591714859009, 0.908277153968811, 0.9397951364517212, 0.9713131189346313, 1.0028311014175415, 1.0343490839004517, 1.0658669471740723, 1.0973849296569824, 1.1289029121398926, 1.1604208946228027, 1.191938877105713]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 10.0, 9.0, 8.0, 17.0, 15.0, 20.0, 21.0, 24.0, 35.0, 35.0, 37.0, 26.0, 45.0, 37.0, 40.0, 50.0, 42.0, 49.0, 39.0, 48.0, 42.0, 42.0, 42.0, 31.0, 38.0, 35.0, 16.0, 32.0, 25.0, 19.0, 19.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.507093608379364, -0.4918804466724396, -0.47666725516319275, -0.4614540934562683, -0.4462409019470215, -0.43102774024009705, -0.4158145785331726, -0.4006013870239258, -0.38538819551467896, -0.3701750338077545, -0.3549618422985077, -0.33974868059158325, -0.3245354890823364, -0.309322327375412, -0.29410916566848755, -0.2788959741592407, -0.2636828124523163, -0.24846963584423065, -0.23325645923614502, -0.21804329752922058, -0.20283010601997375, -0.18761694431304932, -0.17240376770496368, -0.15719059109687805, -0.14197741448879242, -0.1267642378807068, -0.11155106127262115, -0.09633789211511612, -0.08112471550703049, -0.06591153889894485, -0.05069836974143982, -0.03548519313335419, -0.020272016525268555, -0.005058841779828072, 0.010154332965612411, 0.025367505848407745, 0.04058068245649338, 0.05579385906457901, 0.07100702822208405, 0.08622020483016968, 0.10143338143825531, 0.11664655804634094, 0.13185973465442657, 0.1470729112625122, 0.16228607296943665, 0.17749926447868347, 0.1927124261856079, 0.20792560279369354, 0.22313877940177917, 0.2383519560098648, 0.25356513261795044, 0.2687782943248749, 0.2839914858341217, 0.29920464754104614, 0.31441783905029297, 0.3296310007572174, 0.34484416246414185, 0.3600573241710663, 0.3752705156803131, 0.39048367738723755, 0.4056968688964844, 0.4209100306034088, 0.43612319231033325, 0.4513363838195801, 0.4665495753288269]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 10.0, 16.0, 24.0, 33.0, 34.0, 48.0, 87.0, 93.0, 157.0, 233.0, 373.0, 643.0, 1114.0, 1991.0, 3648.0, 7407.0, 14453.0, 30218.0, 69800.0, 205582.0, 404208.0, 186942.0, 64137.0, 28265.0, 13862.0, 6895.0, 3636.0, 1873.0, 1056.0, 587.0, 385.0, 231.0, 165.0, 81.0, 84.0, 52.0, 38.0, 20.0, 20.0, 14.0, 6.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2992973327636719, -0.28878021240234375, -0.2782630920410156, -0.2677459716796875, -0.2572288513183594, -0.24671173095703125, -0.23619461059570312, -0.225677490234375, -0.21516036987304688, -0.20464324951171875, -0.19412612915039062, -0.1836090087890625, -0.17309188842773438, -0.16257476806640625, -0.15205764770507812, -0.14154052734375, -0.13102340698242188, -0.12050628662109375, -0.10998916625976562, -0.0994720458984375, -0.08895492553710938, -0.07843780517578125, -0.06792068481445312, -0.057403564453125, -0.046886444091796875, -0.03636932373046875, -0.025852203369140625, -0.0153350830078125, -0.004817962646484375, 0.00569915771484375, 0.016216278076171875, 0.0267333984375, 0.037250518798828125, 0.04776763916015625, 0.058284759521484375, 0.0688018798828125, 0.07931900024414062, 0.08983612060546875, 0.10035324096679688, 0.110870361328125, 0.12138748168945312, 0.13190460205078125, 0.14242172241210938, 0.1529388427734375, 0.16345596313476562, 0.17397308349609375, 0.18449020385742188, 0.19500732421875, 0.20552444458007812, 0.21604156494140625, 0.22655868530273438, 0.2370758056640625, 0.24759292602539062, 0.25811004638671875, 0.2686271667480469, 0.279144287109375, 0.2896614074707031, 0.30017852783203125, 0.3106956481933594, 0.3212127685546875, 0.3317298889160156, 0.34224700927734375, 0.3527641296386719, 0.36328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 12.0, 13.0, 16.0, 14.0, 29.0, 20.0, 31.0, 22.0, 27.0, 32.0, 39.0, 38.0, 44.0, 57.0, 47.0, 47.0, 44.0, 46.0, 57.0, 36.0, 31.0, 43.0, 43.0, 38.0, 26.0, 19.0, 26.0, 21.0, 10.0, 11.0, 11.0, 3.0, 10.0, 3.0, 4.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.259765625, -2.1963653564453125, -2.132965087890625, -2.0695648193359375, -2.00616455078125, -1.9427642822265625, -1.879364013671875, -1.8159637451171875, -1.7525634765625, -1.6891632080078125, -1.625762939453125, -1.5623626708984375, -1.49896240234375, -1.4355621337890625, -1.372161865234375, -1.3087615966796875, -1.245361328125, -1.1819610595703125, -1.118560791015625, -1.0551605224609375, -0.99176025390625, -0.9283599853515625, -0.864959716796875, -0.8015594482421875, -0.7381591796875, -0.6747589111328125, -0.611358642578125, -0.5479583740234375, -0.48455810546875, -0.4211578369140625, -0.357757568359375, -0.2943572998046875, -0.23095703125, -0.1675567626953125, -0.104156494140625, -0.0407562255859375, 0.02264404296875, 0.0860443115234375, 0.149444580078125, 0.2128448486328125, 0.2762451171875, 0.3396453857421875, 0.403045654296875, 0.4664459228515625, 0.52984619140625, 0.5932464599609375, 0.656646728515625, 0.7200469970703125, 0.783447265625, 0.8468475341796875, 0.910247802734375, 0.9736480712890625, 1.03704833984375, 1.1004486083984375, 1.163848876953125, 1.2272491455078125, 1.2906494140625, 1.3540496826171875, 1.417449951171875, 1.4808502197265625, 1.54425048828125, 1.6076507568359375, 1.671051025390625, 1.7344512939453125, 1.7978515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 10.0, 7.0, 15.0, 17.0, 26.0, 30.0, 47.0, 35.0, 46.0, 80.0, 138.0, 485.0, 1037233.0, 9708.0, 267.0, 100.0, 52.0, 47.0, 40.0, 46.0, 27.0, 20.0, 15.0, 11.0, 8.0, 8.0, 10.0, 7.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.6171875, -10.34375, -10.0703125, -9.796875, -9.5234375, -9.25, -8.9765625, -8.703125, -8.4296875, -8.15625, -7.8828125, -7.609375, -7.3359375, -7.0625, -6.7890625, -6.515625, -6.2421875, -5.96875, -5.6953125, -5.421875, -5.1484375, -4.875, -4.6015625, -4.328125, -4.0546875, -3.78125, -3.5078125, -3.234375, -2.9609375, -2.6875, -2.4140625, -2.140625, -1.8671875, -1.59375, -1.3203125, -1.046875, -0.7734375, -0.5, -0.2265625, 0.046875, 0.3203125, 0.59375, 0.8671875, 1.140625, 1.4140625, 1.6875, 1.9609375, 2.234375, 2.5078125, 2.78125, 3.0546875, 3.328125, 3.6015625, 3.875, 4.1484375, 4.421875, 4.6953125, 4.96875, 5.2421875, 5.515625, 5.7890625, 6.0625, 6.3359375, 6.609375, 6.8828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 11.0, 7.0, 15.0, 15.0, 29.0, 34.0, 41.0, 34.0, 45.0, 61.0, 66.0, 83.0, 90.0, 64.0, 50.0, 52.0, 52.0, 42.0, 40.0, 41.0, 28.0, 21.0, 16.0, 11.0, 9.0, 9.0, 9.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.26171875, -4.151885986328125, -4.04205322265625, -3.932220458984375, -3.8223876953125, -3.712554931640625, -3.60272216796875, -3.492889404296875, -3.383056640625, -3.273223876953125, -3.16339111328125, -3.053558349609375, -2.9437255859375, -2.833892822265625, -2.72406005859375, -2.614227294921875, -2.50439453125, -2.394561767578125, -2.28472900390625, -2.174896240234375, -2.0650634765625, -1.955230712890625, -1.84539794921875, -1.735565185546875, -1.625732421875, -1.515899658203125, -1.40606689453125, -1.296234130859375, -1.1864013671875, -1.076568603515625, -0.96673583984375, -0.856903076171875, -0.7470703125, -0.637237548828125, -0.52740478515625, -0.417572021484375, -0.3077392578125, -0.197906494140625, -0.08807373046875, 0.021759033203125, 0.131591796875, 0.241424560546875, 0.35125732421875, 0.461090087890625, 0.5709228515625, 0.680755615234375, 0.79058837890625, 0.900421142578125, 1.01025390625, 1.120086669921875, 1.22991943359375, 1.339752197265625, 1.4495849609375, 1.559417724609375, 1.66925048828125, 1.779083251953125, 1.888916015625, 1.998748779296875, 2.10858154296875, 2.218414306640625, 2.3282470703125, 2.438079833984375, 2.54791259765625, 2.657745361328125, 2.767578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 12.0, 2.0, 17.0, 17.0, 21.0, 36.0, 52.0, 80.0, 134.0, 330.0, 1094.0, 6663.0, 110974.0, 884135.0, 40155.0, 3506.0, 672.0, 254.0, 115.0, 72.0, 39.0, 34.0, 30.0, 19.0, 21.0, 10.0, 6.0, 3.0, 3.0, 6.0, 7.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.468505859375, -0.4568939208984375, -0.445281982421875, -0.4336700439453125, -0.42205810546875, -0.4104461669921875, -0.398834228515625, -0.3872222900390625, -0.3756103515625, -0.3639984130859375, -0.352386474609375, -0.3407745361328125, -0.32916259765625, -0.3175506591796875, -0.305938720703125, -0.2943267822265625, -0.28271484375, -0.2711029052734375, -0.259490966796875, -0.2478790283203125, -0.23626708984375, -0.2246551513671875, -0.213043212890625, -0.2014312744140625, -0.1898193359375, -0.1782073974609375, -0.166595458984375, -0.1549835205078125, -0.14337158203125, -0.1317596435546875, -0.120147705078125, -0.1085357666015625, -0.096923828125, -0.0853118896484375, -0.073699951171875, -0.0620880126953125, -0.05047607421875, -0.0388641357421875, -0.027252197265625, -0.0156402587890625, -0.0040283203125, 0.0075836181640625, 0.019195556640625, 0.0308074951171875, 0.04241943359375, 0.0540313720703125, 0.065643310546875, 0.0772552490234375, 0.0888671875, 0.1004791259765625, 0.112091064453125, 0.1237030029296875, 0.13531494140625, 0.1469268798828125, 0.158538818359375, 0.1701507568359375, 0.1817626953125, 0.1933746337890625, 0.204986572265625, 0.2165985107421875, 0.22821044921875, 0.2398223876953125, 0.251434326171875, 0.2630462646484375, 0.274658203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 6.0, 7.0, 13.0, 22.0, 39.0, 63.0, 111.0, 176.0, 192.0, 130.0, 86.0, 53.0, 33.0, 21.0, 11.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.035234451293945e-05, -3.909878432750702e-05, -3.7845224142074585e-05, -3.659166395664215e-05, -3.533810377120972e-05, -3.408454358577728e-05, -3.283098340034485e-05, -3.1577423214912415e-05, -3.032386302947998e-05, -2.9070302844047546e-05, -2.7816742658615112e-05, -2.6563182473182678e-05, -2.5309622287750244e-05, -2.405606210231781e-05, -2.2802501916885376e-05, -2.1548941731452942e-05, -2.0295381546020508e-05, -1.9041821360588074e-05, -1.778826117515564e-05, -1.6534700989723206e-05, -1.528114080429077e-05, -1.4027580618858337e-05, -1.2774020433425903e-05, -1.152046024799347e-05, -1.0266900062561035e-05, -9.013339877128601e-06, -7.759779691696167e-06, -6.506219506263733e-06, -5.252659320831299e-06, -3.999099135398865e-06, -2.7455389499664307e-06, -1.4919787645339966e-06, -2.384185791015625e-07, 1.0151416063308716e-06, 2.2687017917633057e-06, 3.5222619771957397e-06, 4.775822162628174e-06, 6.029382348060608e-06, 7.282942533493042e-06, 8.536502718925476e-06, 9.79006290435791e-06, 1.1043623089790344e-05, 1.2297183275222778e-05, 1.3550743460655212e-05, 1.4804303646087646e-05, 1.605786383152008e-05, 1.7311424016952515e-05, 1.856498420238495e-05, 1.9818544387817383e-05, 2.1072104573249817e-05, 2.232566475868225e-05, 2.3579224944114685e-05, 2.483278512954712e-05, 2.6086345314979553e-05, 2.7339905500411987e-05, 2.859346568584442e-05, 2.9847025871276855e-05, 3.110058605670929e-05, 3.2354146242141724e-05, 3.360770642757416e-05, 3.486126661300659e-05, 3.6114826798439026e-05, 3.736838698387146e-05, 3.8621947169303894e-05, 3.987550735473633e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 7.0, 8.0, 25.0, 19.0, 27.0, 53.0, 114.0, 334.0, 1705.0, 46802.0, 977262.0, 20562.0, 1105.0, 236.0, 105.0, 55.0, 31.0, 27.0, 16.0, 9.0, 11.0, 3.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5108261108398438, -0.4928436279296875, -0.47486114501953125, -0.456878662109375, -0.43889617919921875, -0.4209136962890625, -0.40293121337890625, -0.38494873046875, -0.36696624755859375, -0.3489837646484375, -0.33100128173828125, -0.313018798828125, -0.29503631591796875, -0.2770538330078125, -0.25907135009765625, -0.2410888671875, -0.22310638427734375, -0.2051239013671875, -0.18714141845703125, -0.169158935546875, -0.15117645263671875, -0.1331939697265625, -0.11521148681640625, -0.09722900390625, -0.07924652099609375, -0.0612640380859375, -0.04328155517578125, -0.025299072265625, -0.00731658935546875, 0.0106658935546875, 0.02864837646484375, 0.046630859375, 0.06461334228515625, 0.0825958251953125, 0.10057830810546875, 0.118560791015625, 0.13654327392578125, 0.1545257568359375, 0.17250823974609375, 0.19049072265625, 0.20847320556640625, 0.2264556884765625, 0.24443817138671875, 0.262420654296875, 0.28040313720703125, 0.2983856201171875, 0.31636810302734375, 0.3343505859375, 0.35233306884765625, 0.3703155517578125, 0.38829803466796875, 0.406280517578125, 0.42426300048828125, 0.4422454833984375, 0.46022796630859375, 0.47821044921875, 0.49619293212890625, 0.5141754150390625, 0.5321578979492188, 0.550140380859375, 0.5681228637695312, 0.5861053466796875, 0.6040878295898438, 0.6220703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 13.0, 12.0, 14.0, 24.0, 27.0, 38.0, 65.0, 78.0, 118.0, 120.0, 131.0, 109.0, 72.0, 49.0, 30.0, 23.0, 23.0, 7.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08966064453125, -0.08701324462890625, -0.0843658447265625, -0.08171844482421875, -0.079071044921875, -0.07642364501953125, -0.0737762451171875, -0.07112884521484375, -0.0684814453125, -0.06583404541015625, -0.0631866455078125, -0.06053924560546875, -0.057891845703125, -0.05524444580078125, -0.0525970458984375, -0.04994964599609375, -0.04730224609375, -0.04465484619140625, -0.0420074462890625, -0.03936004638671875, -0.036712646484375, -0.03406524658203125, -0.0314178466796875, -0.02877044677734375, -0.026123046875, -0.02347564697265625, -0.0208282470703125, -0.01818084716796875, -0.015533447265625, -0.01288604736328125, -0.0102386474609375, -0.00759124755859375, -0.00494384765625, -0.00229644775390625, 0.0003509521484375, 0.00299835205078125, 0.005645751953125, 0.00829315185546875, 0.0109405517578125, 0.01358795166015625, 0.0162353515625, 0.01888275146484375, 0.0215301513671875, 0.02417755126953125, 0.026824951171875, 0.02947235107421875, 0.0321197509765625, 0.03476715087890625, 0.03741455078125, 0.04006195068359375, 0.0427093505859375, 0.04535675048828125, 0.048004150390625, 0.05065155029296875, 0.0532989501953125, 0.05594635009765625, 0.05859375, 0.06124114990234375, 0.0638885498046875, 0.06653594970703125, 0.069183349609375, 0.07183074951171875, 0.0744781494140625, 0.07712554931640625, 0.07977294921875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 43.0, 316.0, 512.0, 131.0, 18.0, 0.0, 2.0], "bins": [-15.802494049072266, -15.535966873168945, -15.269438743591309, -15.002910614013672, -14.736383438110352, -14.469856262207031, -14.203328132629395, -13.936800003051758, -13.670272827148438, -13.403745651245117, -13.13721752166748, -12.870689392089844, -12.604162216186523, -12.337635040283203, -12.071106910705566, -11.80457878112793, -11.53805160522461, -11.271524429321289, -11.004996299743652, -10.738468170166016, -10.471940994262695, -10.205413818359375, -9.938885688781738, -9.672357559204102, -9.405830383300781, -9.139303207397461, -8.872775077819824, -8.606246948242188, -8.339719772338867, -8.073192596435547, -7.80666446685791, -7.540136814117432, -7.273609161376953, -7.007081508636475, -6.740553855895996, -6.474026203155518, -6.207498550415039, -5.9409708976745605, -5.674443244934082, -5.4079155921936035, -5.141387939453125, -4.8748602867126465, -4.608332633972168, -4.3418049812316895, -4.075277328491211, -3.8087496757507324, -3.542222023010254, -3.2756943702697754, -3.009166717529297, -2.7426390647888184, -2.47611141204834, -2.2095837593078613, -1.9430561065673828, -1.6765284538269043, -1.4100008010864258, -1.1434731483459473, -0.8769453763961792, -0.6104177236557007, -0.34389007091522217, -0.07736241817474365, 0.18916523456573486, 0.4556928873062134, 0.7222205400466919, 0.9887481927871704, 1.255275845527649]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 6.0, 3.0, 6.0, 10.0, 17.0, 23.0, 10.0, 24.0, 21.0, 25.0, 24.0, 31.0, 26.0, 22.0, 25.0, 41.0, 49.0, 58.0, 49.0, 53.0, 42.0, 47.0, 39.0, 39.0, 37.0, 43.0, 23.0, 30.0, 22.0, 25.0, 23.0, 15.0, 18.0, 10.0, 16.0, 11.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.842506170272827, -2.753528356552124, -2.664550542831421, -2.5755727291107178, -2.4865949153900146, -2.3976171016693115, -2.3086390495300293, -2.219661235809326, -2.130683422088623, -2.04170560836792, -1.9527277946472168, -1.8637499809265137, -1.7747721672058105, -1.6857943534851074, -1.5968164205551147, -1.5078386068344116, -1.418860912322998, -1.329883098602295, -1.2409052848815918, -1.1519274711608887, -1.0629496574401855, -0.9739717841148376, -0.8849939107894897, -0.7960160970687866, -0.7070382833480835, -0.6180604696273804, -0.5290826559066772, -0.44010478258132935, -0.3511269688606262, -0.2621491551399231, -0.1731712818145752, -0.08419346809387207, 0.004784345626831055, 0.09376217424869537, 0.1827400028705597, 0.2717178463935852, 0.36069566011428833, 0.44967347383499146, 0.5386513471603394, 0.6276291608810425, 0.7166069746017456, 0.8055847883224487, 0.8945626020431519, 0.9835404753684998, 1.0725183486938477, 1.1614961624145508, 1.250473976135254, 1.339451789855957, 1.4284296035766602, 1.5174074172973633, 1.6063852310180664, 1.6953630447387695, 1.7843408584594727, 1.8733186721801758, 1.9622966051101685, 2.051274299621582, 2.140252113342285, 2.2292299270629883, 2.3182077407836914, 2.4071855545043945, 2.4961633682250977, 2.585141181945801, 2.674118995666504, 2.763096809387207, 2.8520748615264893]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 5.0, 4.0, 7.0, 10.0, 18.0, 15.0, 18.0, 21.0, 15.0, 25.0, 36.0, 41.0, 64.0, 102.0, 231.0, 678.0, 2838.0, 25137.0, 598526.0, 3148764.0, 394572.0, 19334.0, 2612.0, 600.0, 200.0, 110.0, 54.0, 48.0, 39.0, 24.0, 22.0, 26.0, 20.0, 11.0, 8.0, 9.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.521484375, -1.47149658203125, -1.4215087890625, -1.37152099609375, -1.321533203125, -1.27154541015625, -1.2215576171875, -1.17156982421875, -1.12158203125, -1.07159423828125, -1.0216064453125, -0.97161865234375, -0.921630859375, -0.87164306640625, -0.8216552734375, -0.77166748046875, -0.7216796875, -0.67169189453125, -0.6217041015625, -0.57171630859375, -0.521728515625, -0.47174072265625, -0.4217529296875, -0.37176513671875, -0.32177734375, -0.27178955078125, -0.2218017578125, -0.17181396484375, -0.121826171875, -0.07183837890625, -0.0218505859375, 0.02813720703125, 0.078125, 0.12811279296875, 0.1781005859375, 0.22808837890625, 0.278076171875, 0.32806396484375, 0.3780517578125, 0.42803955078125, 0.47802734375, 0.52801513671875, 0.5780029296875, 0.62799072265625, 0.677978515625, 0.72796630859375, 0.7779541015625, 0.82794189453125, 0.8779296875, 0.92791748046875, 0.9779052734375, 1.02789306640625, 1.077880859375, 1.12786865234375, 1.1778564453125, 1.22784423828125, 1.27783203125, 1.32781982421875, 1.3778076171875, 1.42779541015625, 1.477783203125, 1.52777099609375, 1.5777587890625, 1.62774658203125, 1.677734375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 11.0, 5.0, 9.0, 10.0, 10.0, 14.0, 21.0, 15.0, 20.0, 30.0, 34.0, 44.0, 43.0, 55.0, 45.0, 42.0, 55.0, 50.0, 54.0, 40.0, 57.0, 42.0, 41.0, 37.0, 34.0, 28.0, 35.0, 26.0, 19.0, 16.0, 17.0, 17.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6865234375, -0.6667327880859375, -0.646942138671875, -0.6271514892578125, -0.60736083984375, -0.5875701904296875, -0.567779541015625, -0.5479888916015625, -0.5281982421875, -0.5084075927734375, -0.488616943359375, -0.4688262939453125, -0.44903564453125, -0.4292449951171875, -0.409454345703125, -0.3896636962890625, -0.369873046875, -0.3500823974609375, -0.330291748046875, -0.3105010986328125, -0.29071044921875, -0.2709197998046875, -0.251129150390625, -0.2313385009765625, -0.2115478515625, -0.1917572021484375, -0.171966552734375, -0.1521759033203125, -0.13238525390625, -0.1125946044921875, -0.092803955078125, -0.0730133056640625, -0.05322265625, -0.0334320068359375, -0.013641357421875, 0.0061492919921875, 0.02593994140625, 0.0457305908203125, 0.065521240234375, 0.0853118896484375, 0.1051025390625, 0.1248931884765625, 0.144683837890625, 0.1644744873046875, 0.18426513671875, 0.2040557861328125, 0.223846435546875, 0.2436370849609375, 0.263427734375, 0.2832183837890625, 0.303009033203125, 0.3227996826171875, 0.34259033203125, 0.3623809814453125, 0.382171630859375, 0.4019622802734375, 0.4217529296875, 0.4415435791015625, 0.461334228515625, 0.4811248779296875, 0.50091552734375, 0.5207061767578125, 0.540496826171875, 0.5602874755859375, 0.580078125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 2.0, 9.0, 10.0, 28.0, 52.0, 89.0, 153.0, 335.0, 1050.0, 4145846.0, 45639.0, 546.0, 259.0, 120.0, 69.0, 26.0, 16.0, 10.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.7740478515625, -11.485595703125, -11.1971435546875, -10.90869140625, -10.6202392578125, -10.331787109375, -10.0433349609375, -9.7548828125, -9.4664306640625, -9.177978515625, -8.8895263671875, -8.60107421875, -8.3126220703125, -8.024169921875, -7.7357177734375, -7.447265625, -7.1588134765625, -6.870361328125, -6.5819091796875, -6.29345703125, -6.0050048828125, -5.716552734375, -5.4281005859375, -5.1396484375, -4.8511962890625, -4.562744140625, -4.2742919921875, -3.98583984375, -3.6973876953125, -3.408935546875, -3.1204833984375, -2.83203125, -2.5435791015625, -2.255126953125, -1.9666748046875, -1.67822265625, -1.3897705078125, -1.101318359375, -0.8128662109375, -0.5244140625, -0.2359619140625, 0.052490234375, 0.3409423828125, 0.62939453125, 0.9178466796875, 1.206298828125, 1.4947509765625, 1.783203125, 2.0716552734375, 2.360107421875, 2.6485595703125, 2.93701171875, 3.2254638671875, 3.513916015625, 3.8023681640625, 4.0908203125, 4.3792724609375, 4.667724609375, 4.9561767578125, 5.24462890625, 5.5330810546875, 5.821533203125, 6.1099853515625, 6.3984375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 14.0, 15.0, 13.0, 25.0, 35.0, 50.0, 72.0, 121.0, 143.0, 259.0, 380.0, 505.0, 568.0, 538.0, 419.0, 278.0, 195.0, 128.0, 87.0, 62.0, 48.0, 30.0, 25.0, 20.0, 8.0, 3.0, 9.0, 2.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.305908203125, -0.2962608337402344, -0.28661346435546875, -0.2769660949707031, -0.2673187255859375, -0.2576713562011719, -0.24802398681640625, -0.23837661743164062, -0.228729248046875, -0.21908187866210938, -0.20943450927734375, -0.19978713989257812, -0.1901397705078125, -0.18049240112304688, -0.17084503173828125, -0.16119766235351562, -0.15155029296875, -0.14190292358398438, -0.13225555419921875, -0.12260818481445312, -0.1129608154296875, -0.10331344604492188, -0.09366607666015625, -0.08401870727539062, -0.074371337890625, -0.06472396850585938, -0.05507659912109375, -0.045429229736328125, -0.0357818603515625, -0.026134490966796875, -0.01648712158203125, -0.006839752197265625, 0.0028076171875, 0.012454986572265625, 0.02210235595703125, 0.031749725341796875, 0.0413970947265625, 0.051044464111328125, 0.06069183349609375, 0.07033920288085938, 0.079986572265625, 0.08963394165039062, 0.09928131103515625, 0.10892868041992188, 0.1185760498046875, 0.12822341918945312, 0.13787078857421875, 0.14751815795898438, 0.15716552734375, 0.16681289672851562, 0.17646026611328125, 0.18610763549804688, 0.1957550048828125, 0.20540237426757812, 0.21504974365234375, 0.22469711303710938, 0.234344482421875, 0.24399185180664062, 0.25363922119140625, 0.2632865905761719, 0.2729339599609375, 0.2825813293457031, 0.29222869873046875, 0.3018760681152344, 0.3115234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 2.0, 14.0, 19.0, 28.0, 52.0, 65.0, 51.0, 79.0, 86.0, 89.0, 75.0, 80.0, 75.0, 67.0, 58.0, 38.0, 42.0, 14.0, 21.0, 9.0, 8.0, 6.0, 7.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0861214399337769, -1.0553040504455566, -1.024486780166626, -0.9936694502830505, -0.9628521203994751, -0.9320347905158997, -0.9012174606323242, -0.870400071144104, -0.8395828008651733, -0.8087654709815979, -0.7779481410980225, -0.747130811214447, -0.7163134813308716, -0.6854961514472961, -0.6546788215637207, -0.6238614320755005, -0.593044102191925, -0.5622267723083496, -0.5314094424247742, -0.5005921125411987, -0.4697747826576233, -0.43895745277404785, -0.40814009308815, -0.3773227632045746, -0.34650543332099915, -0.3156881034374237, -0.28487077355384827, -0.25405341386795044, -0.2232360988855362, -0.19241876900196075, -0.16160142421722412, -0.13078409433364868, -0.09996670484542847, -0.06914937496185303, -0.03833203762769699, -0.007514700293540955, 0.023302629590034485, 0.054119959473609924, 0.08493730425834656, 0.115754634141922, 0.14657196402549744, 0.17738929390907288, 0.20820662379264832, 0.23902396857738495, 0.2698413133621216, 0.300658643245697, 0.33147597312927246, 0.3622933030128479, 0.39311063289642334, 0.4239279627799988, 0.4547452926635742, 0.48556262254714966, 0.5163799524307251, 0.5471972823143005, 0.578014612197876, 0.6088320016860962, 0.6396492719650269, 0.6704666018486023, 0.7012839317321777, 0.7321012616157532, 0.7629185914993286, 0.793735921382904, 0.8245532512664795, 0.8553706407546997, 0.8861879706382751]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 9.0, 11.0, 23.0, 25.0, 28.0, 23.0, 29.0, 27.0, 28.0, 38.0, 52.0, 47.0, 46.0, 44.0, 49.0, 42.0, 47.0, 48.0, 42.0, 42.0, 28.0, 39.0, 23.0, 41.0, 24.0, 25.0, 16.0, 25.0, 19.0, 14.0, 8.0, 5.0, 4.0, 4.0, 0.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.725472629070282, -0.705382227897644, -0.6852918267250061, -0.6652014255523682, -0.6451110243797302, -0.6250206232070923, -0.6049302220344543, -0.5848398208618164, -0.5647494792938232, -0.5446590781211853, -0.5245686769485474, -0.5044782757759094, -0.4843878746032715, -0.46429747343063354, -0.444207102060318, -0.42411670088768005, -0.4040262699127197, -0.3839358687400818, -0.36384546756744385, -0.3437550663948059, -0.32366466522216797, -0.30357426404953003, -0.2834838926792145, -0.26339349150657654, -0.2433030903339386, -0.22321268916130066, -0.20312228798866272, -0.18303190171718597, -0.16294150054454803, -0.1428510993719101, -0.12276070564985275, -0.10267031192779541, -0.08257997035980225, -0.062489572912454605, -0.042399175465106964, -0.022308778017759323, -0.002218380570411682, 0.017872020602226257, 0.0379624143242836, 0.05805280804634094, 0.07814320921897888, 0.09823361039161682, 0.11832400411367416, 0.1384143978357315, 0.15850479900836945, 0.17859520018100739, 0.19868558645248413, 0.21877598762512207, 0.23886638879776, 0.25895678997039795, 0.2790471911430359, 0.29913759231567383, 0.31922799348831177, 0.3393183946609497, 0.35940876603126526, 0.3794991672039032, 0.39958956837654114, 0.4196799695491791, 0.439770370721817, 0.45986077189445496, 0.4799511432647705, 0.5000415444374084, 0.5201319456100464, 0.5402223467826843, 0.5603127479553223]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 9.0, 11.0, 11.0, 13.0, 19.0, 28.0, 29.0, 66.0, 114.0, 177.0, 300.0, 548.0, 961.0, 1890.0, 3819.0, 8370.0, 19682.0, 51665.0, 140191.0, 317595.0, 298876.0, 125295.0, 46035.0, 18017.0, 7467.0, 3517.0, 1747.0, 875.0, 488.0, 302.0, 160.0, 102.0, 75.0, 28.0, 25.0, 18.0, 9.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.28271484375, -0.2756366729736328, -0.2685585021972656, -0.26148033142089844, -0.25440216064453125, -0.24732398986816406, -0.24024581909179688, -0.2331676483154297, -0.2260894775390625, -0.2190113067626953, -0.21193313598632812, -0.20485496520996094, -0.19777679443359375, -0.19069862365722656, -0.18362045288085938, -0.1765422821044922, -0.169464111328125, -0.1623859405517578, -0.15530776977539062, -0.14822959899902344, -0.14115142822265625, -0.13407325744628906, -0.12699508666992188, -0.11991691589355469, -0.1128387451171875, -0.10576057434082031, -0.09868240356445312, -0.09160423278808594, -0.08452606201171875, -0.07744789123535156, -0.07036972045898438, -0.06329154968261719, -0.05621337890625, -0.04913520812988281, -0.042057037353515625, -0.03497886657714844, -0.02790069580078125, -0.020822525024414062, -0.013744354248046875, -0.0066661834716796875, 0.0004119873046875, 0.0074901580810546875, 0.014568328857421875, 0.021646499633789062, 0.02872467041015625, 0.03580284118652344, 0.042881011962890625, 0.04995918273925781, 0.057037353515625, 0.06411552429199219, 0.07119369506835938, 0.07827186584472656, 0.08535003662109375, 0.09242820739746094, 0.09950637817382812, 0.10658454895019531, 0.1136627197265625, 0.12074089050292969, 0.12781906127929688, 0.13489723205566406, 0.14197540283203125, 0.14905357360839844, 0.15613174438476562, 0.1632099151611328, 0.1702880859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 11.0, 12.0, 23.0, 21.0, 16.0, 22.0, 26.0, 37.0, 37.0, 31.0, 50.0, 42.0, 43.0, 53.0, 37.0, 47.0, 46.0, 44.0, 42.0, 37.0, 34.0, 40.0, 30.0, 26.0, 31.0, 29.0, 21.0, 27.0, 12.0, 13.0, 8.0, 11.0, 7.0, 2.0, 6.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.387939453125, -0.3764190673828125, -0.364898681640625, -0.3533782958984375, -0.34185791015625, -0.3303375244140625, -0.318817138671875, -0.3072967529296875, -0.2957763671875, -0.2842559814453125, -0.272735595703125, -0.2612152099609375, -0.24969482421875, -0.2381744384765625, -0.226654052734375, -0.2151336669921875, -0.20361328125, -0.1920928955078125, -0.180572509765625, -0.1690521240234375, -0.15753173828125, -0.1460113525390625, -0.134490966796875, -0.1229705810546875, -0.1114501953125, -0.0999298095703125, -0.088409423828125, -0.0768890380859375, -0.06536865234375, -0.0538482666015625, -0.042327880859375, -0.0308074951171875, -0.019287109375, -0.0077667236328125, 0.003753662109375, 0.0152740478515625, 0.02679443359375, 0.0383148193359375, 0.049835205078125, 0.0613555908203125, 0.0728759765625, 0.0843963623046875, 0.095916748046875, 0.1074371337890625, 0.11895751953125, 0.1304779052734375, 0.141998291015625, 0.1535186767578125, 0.1650390625, 0.1765594482421875, 0.188079833984375, 0.1996002197265625, 0.21112060546875, 0.2226409912109375, 0.234161376953125, 0.2456817626953125, 0.2572021484375, 0.2687225341796875, 0.280242919921875, 0.2917633056640625, 0.30328369140625, 0.3148040771484375, 0.326324462890625, 0.3378448486328125, 0.349365234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 9.0, 4.0, 8.0, 12.0, 16.0, 35.0, 45.0, 67.0, 93.0, 180.0, 324.0, 581.0, 1175.0, 2407.0, 5571.0, 15068.0, 46844.0, 157455.0, 377656.0, 293917.0, 99495.0, 29814.0, 10099.0, 3852.0, 1830.0, 846.0, 452.0, 271.0, 158.0, 85.0, 55.0, 33.0, 31.0, 14.0, 12.0, 7.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2344970703125, -0.2268848419189453, -0.21927261352539062, -0.21166038513183594, -0.20404815673828125, -0.19643592834472656, -0.18882369995117188, -0.1812114715576172, -0.1735992431640625, -0.1659870147705078, -0.15837478637695312, -0.15076255798339844, -0.14315032958984375, -0.13553810119628906, -0.12792587280273438, -0.12031364440917969, -0.112701416015625, -0.10508918762207031, -0.09747695922851562, -0.08986473083496094, -0.08225250244140625, -0.07464027404785156, -0.06702804565429688, -0.05941581726074219, -0.0518035888671875, -0.04419136047363281, -0.036579132080078125, -0.028966903686523438, -0.02135467529296875, -0.013742446899414062, -0.006130218505859375, 0.0014820098876953125, 0.00909423828125, 0.016706466674804688, 0.024318695068359375, 0.03193092346191406, 0.03954315185546875, 0.04715538024902344, 0.054767608642578125, 0.06237983703613281, 0.0699920654296875, 0.07760429382324219, 0.08521652221679688, 0.09282875061035156, 0.10044097900390625, 0.10805320739746094, 0.11566543579101562, 0.12327766418457031, 0.130889892578125, 0.1385021209716797, 0.14611434936523438, 0.15372657775878906, 0.16133880615234375, 0.16895103454589844, 0.17656326293945312, 0.1841754913330078, 0.1917877197265625, 0.1993999481201172, 0.20701217651367188, 0.21462440490722656, 0.22223663330078125, 0.22984886169433594, 0.23746109008789062, 0.2450733184814453, 0.252685546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 14.0, 9.0, 16.0, 12.0, 17.0, 20.0, 28.0, 20.0, 23.0, 30.0, 24.0, 44.0, 36.0, 42.0, 47.0, 52.0, 48.0, 44.0, 45.0, 39.0, 43.0, 35.0, 36.0, 29.0, 36.0, 24.0, 24.0, 23.0, 22.0, 20.0, 17.0, 16.0, 7.0, 11.0, 9.0, 5.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.62890625, -0.6099395751953125, -0.590972900390625, -0.5720062255859375, -0.55303955078125, -0.5340728759765625, -0.515106201171875, -0.4961395263671875, -0.4771728515625, -0.4582061767578125, -0.439239501953125, -0.4202728271484375, -0.40130615234375, -0.3823394775390625, -0.363372802734375, -0.3444061279296875, -0.325439453125, -0.3064727783203125, -0.287506103515625, -0.2685394287109375, -0.24957275390625, -0.2306060791015625, -0.211639404296875, -0.1926727294921875, -0.1737060546875, -0.1547393798828125, -0.135772705078125, -0.1168060302734375, -0.09783935546875, -0.0788726806640625, -0.059906005859375, -0.0409393310546875, -0.02197265625, -0.0030059814453125, 0.015960693359375, 0.0349273681640625, 0.05389404296875, 0.0728607177734375, 0.091827392578125, 0.1107940673828125, 0.1297607421875, 0.1487274169921875, 0.167694091796875, 0.1866607666015625, 0.20562744140625, 0.2245941162109375, 0.243560791015625, 0.2625274658203125, 0.281494140625, 0.3004608154296875, 0.319427490234375, 0.3383941650390625, 0.35736083984375, 0.3763275146484375, 0.395294189453125, 0.4142608642578125, 0.4332275390625, 0.4521942138671875, 0.471160888671875, 0.4901275634765625, 0.50909423828125, 0.5280609130859375, 0.547027587890625, 0.5659942626953125, 0.5849609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 12.0, 16.0, 18.0, 18.0, 34.0, 36.0, 66.0, 102.0, 164.0, 214.0, 345.0, 590.0, 992.0, 1792.0, 3734.0, 8140.0, 19763.0, 55430.0, 199331.0, 459286.0, 204764.0, 57146.0, 20055.0, 8165.0, 3753.0, 1858.0, 1024.0, 553.0, 362.0, 240.0, 160.0, 104.0, 75.0, 56.0, 34.0, 30.0, 29.0, 16.0, 4.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.094482421875, -0.09148406982421875, -0.0884857177734375, -0.08548736572265625, -0.082489013671875, -0.07949066162109375, -0.0764923095703125, -0.07349395751953125, -0.07049560546875, -0.06749725341796875, -0.0644989013671875, -0.06150054931640625, -0.058502197265625, -0.05550384521484375, -0.0525054931640625, -0.04950714111328125, -0.0465087890625, -0.04351043701171875, -0.0405120849609375, -0.03751373291015625, -0.034515380859375, -0.03151702880859375, -0.0285186767578125, -0.02552032470703125, -0.02252197265625, -0.01952362060546875, -0.0165252685546875, -0.01352691650390625, -0.010528564453125, -0.00753021240234375, -0.0045318603515625, -0.00153350830078125, 0.00146484375, 0.00446319580078125, 0.0074615478515625, 0.01045989990234375, 0.013458251953125, 0.01645660400390625, 0.0194549560546875, 0.02245330810546875, 0.02545166015625, 0.02845001220703125, 0.0314483642578125, 0.03444671630859375, 0.037445068359375, 0.04044342041015625, 0.0434417724609375, 0.04644012451171875, 0.0494384765625, 0.05243682861328125, 0.0554351806640625, 0.05843353271484375, 0.061431884765625, 0.06443023681640625, 0.0674285888671875, 0.07042694091796875, 0.07342529296875, 0.07642364501953125, 0.0794219970703125, 0.08242034912109375, 0.085418701171875, 0.08841705322265625, 0.0914154052734375, 0.09441375732421875, 0.097412109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 16.0, 26.0, 47.0, 58.0, 115.0, 163.0, 176.0, 145.0, 110.0, 54.0, 20.0, 25.0, 11.0, 8.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.870529174804688e-05, -9.58368182182312e-05, -9.296834468841553e-05, -9.009987115859985e-05, -8.723139762878418e-05, -8.43629240989685e-05, -8.149445056915283e-05, -7.862597703933716e-05, -7.575750350952148e-05, -7.288902997970581e-05, -7.002055644989014e-05, -6.715208292007446e-05, -6.428360939025879e-05, -6.141513586044312e-05, -5.854666233062744e-05, -5.567818880081177e-05, -5.2809715270996094e-05, -4.994124174118042e-05, -4.7072768211364746e-05, -4.420429468154907e-05, -4.13358211517334e-05, -3.8467347621917725e-05, -3.559887409210205e-05, -3.273040056228638e-05, -2.9861927032470703e-05, -2.699345350265503e-05, -2.4124979972839355e-05, -2.125650644302368e-05, -1.8388032913208008e-05, -1.5519559383392334e-05, -1.265108585357666e-05, -9.782612323760986e-06, -6.9141387939453125e-06, -4.045665264129639e-06, -1.1771917343139648e-06, 1.691281795501709e-06, 4.559755325317383e-06, 7.428228855133057e-06, 1.029670238494873e-05, 1.3165175914764404e-05, 1.6033649444580078e-05, 1.8902122974395752e-05, 2.1770596504211426e-05, 2.46390700340271e-05, 2.7507543563842773e-05, 3.0376017093658447e-05, 3.324449062347412e-05, 3.6112964153289795e-05, 3.898143768310547e-05, 4.184991121292114e-05, 4.4718384742736816e-05, 4.758685827255249e-05, 5.0455331802368164e-05, 5.332380533218384e-05, 5.619227886199951e-05, 5.9060752391815186e-05, 6.192922592163086e-05, 6.479769945144653e-05, 6.766617298126221e-05, 7.053464651107788e-05, 7.340312004089355e-05, 7.627159357070923e-05, 7.91400671005249e-05, 8.200854063034058e-05, 8.487701416015625e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 14.0, 17.0, 25.0, 25.0, 35.0, 56.0, 107.0, 332.0, 1284.0, 6415.0, 55218.0, 682159.0, 277762.0, 20898.0, 3080.0, 638.0, 221.0, 81.0, 54.0, 36.0, 21.0, 21.0, 12.0, 6.0, 8.0, 1.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.26171875, -0.2547931671142578, -0.24786758422851562, -0.24094200134277344, -0.23401641845703125, -0.22709083557128906, -0.22016525268554688, -0.2132396697998047, -0.2063140869140625, -0.1993885040283203, -0.19246292114257812, -0.18553733825683594, -0.17861175537109375, -0.17168617248535156, -0.16476058959960938, -0.1578350067138672, -0.150909423828125, -0.1439838409423828, -0.13705825805664062, -0.13013267517089844, -0.12320709228515625, -0.11628150939941406, -0.10935592651367188, -0.10243034362792969, -0.0955047607421875, -0.08857917785644531, -0.08165359497070312, -0.07472801208496094, -0.06780242919921875, -0.06087684631347656, -0.053951263427734375, -0.04702568054199219, -0.04010009765625, -0.03317451477050781, -0.026248931884765625, -0.019323348999023438, -0.01239776611328125, -0.0054721832275390625, 0.001453399658203125, 0.008378982543945312, 0.0153045654296875, 0.022230148315429688, 0.029155731201171875, 0.03608131408691406, 0.04300689697265625, 0.04993247985839844, 0.056858062744140625, 0.06378364562988281, 0.070709228515625, 0.07763481140136719, 0.08456039428710938, 0.09148597717285156, 0.09841156005859375, 0.10533714294433594, 0.11226272583007812, 0.11918830871582031, 0.1261138916015625, 0.1330394744873047, 0.13996505737304688, 0.14689064025878906, 0.15381622314453125, 0.16074180603027344, 0.16766738891601562, 0.1745929718017578, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 8.0, 8.0, 14.0, 14.0, 17.0, 25.0, 28.0, 39.0, 47.0, 67.0, 70.0, 102.0, 96.0, 97.0, 81.0, 59.0, 57.0, 39.0, 30.0, 21.0, 18.0, 11.0, 7.0, 11.0, 8.0, 3.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0279083251953125, -0.027075767517089844, -0.026243209838867188, -0.02541065216064453, -0.024578094482421875, -0.02374553680419922, -0.022912979125976562, -0.022080421447753906, -0.02124786376953125, -0.020415306091308594, -0.019582748413085938, -0.01875019073486328, -0.017917633056640625, -0.01708507537841797, -0.016252517700195312, -0.015419960021972656, -0.01458740234375, -0.013754844665527344, -0.012922286987304688, -0.012089729309082031, -0.011257171630859375, -0.010424613952636719, -0.009592056274414062, -0.008759498596191406, -0.00792694091796875, -0.007094383239746094, -0.0062618255615234375, -0.005429267883300781, -0.004596710205078125, -0.0037641525268554688, -0.0029315948486328125, -0.0020990371704101562, -0.0012664794921875, -0.00043392181396484375, 0.0003986358642578125, 0.0012311935424804688, 0.002063751220703125, 0.0028963088989257812, 0.0037288665771484375, 0.004561424255371094, 0.00539398193359375, 0.006226539611816406, 0.0070590972900390625, 0.007891654968261719, 0.008724212646484375, 0.009556770324707031, 0.010389328002929688, 0.011221885681152344, 0.012054443359375, 0.012887001037597656, 0.013719558715820312, 0.014552116394042969, 0.015384674072265625, 0.01621723175048828, 0.017049789428710938, 0.017882347106933594, 0.01871490478515625, 0.019547462463378906, 0.020380020141601562, 0.02121257781982422, 0.022045135498046875, 0.02287769317626953, 0.023710250854492188, 0.024542808532714844, 0.0253753662109375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 13.0, 21.0, 35.0, 68.0, 76.0, 88.0, 105.0, 128.0, 106.0, 102.0, 84.0, 62.0, 30.0, 30.0, 15.0, 7.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.8337269425392151, -0.8109800219535828, -0.7882330417633057, -0.7654861211776733, -0.742739200592041, -0.7199922800064087, -0.6972452998161316, -0.6744983792304993, -0.6517513990402222, -0.6290044784545898, -0.6062574982643127, -0.5835105776786804, -0.5607636570930481, -0.538016676902771, -0.5152697563171387, -0.49252283573150635, -0.469775915145874, -0.4470289647579193, -0.424282044172287, -0.4015350937843323, -0.37878817319869995, -0.35604122281074524, -0.3332942724227905, -0.3105473518371582, -0.2878004014492035, -0.2650534510612488, -0.24230653047561646, -0.21955958008766174, -0.19681264460086823, -0.1740657091140747, -0.15131875872612, -0.12857182323932648, -0.10582482814788818, -0.08307789266109467, -0.06033094972372055, -0.037584006786346436, -0.014837071299552917, 0.0079098641872406, 0.030656814575195312, 0.05340375006198883, 0.07615068554878235, 0.09889762103557587, 0.12164456397294998, 0.1443915069103241, 0.16713844239711761, 0.18988537788391113, 0.21263232827186584, 0.23537926375865936, 0.2581261992454529, 0.2808731496334076, 0.3036200702190399, 0.32636702060699463, 0.34911394119262695, 0.37186089158058167, 0.3946078419685364, 0.4173547625541687, 0.4401017129421234, 0.4628486633300781, 0.48559558391571045, 0.5083425045013428, 0.5310894846916199, 0.5538364052772522, 0.5765833854675293, 0.5993303060531616, 0.622077226638794]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 0.0, 9.0, 9.0, 7.0, 6.0, 19.0, 18.0, 31.0, 27.0, 28.0, 31.0, 37.0, 40.0, 59.0, 48.0, 62.0, 47.0, 49.0, 52.0, 64.0, 42.0, 42.0, 37.0, 33.0, 33.0, 35.0, 29.0, 25.0, 19.0, 15.0, 17.0, 11.0, 8.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.46792328357696533, -0.45511922240257263, -0.4423151910305023, -0.4295111298561096, -0.4167070686817169, -0.4039030075073242, -0.3910989761352539, -0.3782949149608612, -0.3654908537864685, -0.3526867926120758, -0.3398827612400055, -0.3270787000656128, -0.3142746388912201, -0.3014705777168274, -0.2886665463447571, -0.2758624851703644, -0.26305845379829407, -0.25025439262390137, -0.23745034635066986, -0.22464630007743835, -0.21184223890304565, -0.19903819262981415, -0.18623414635658264, -0.17343008518218994, -0.16062603890895844, -0.14782199263572693, -0.13501793146133423, -0.12221388518810272, -0.10940983146429062, -0.09660577774047852, -0.08380173146724701, -0.0709976777434349, -0.0581936240196228, -0.0453895702958107, -0.032585520297288895, -0.01978147029876709, -0.006977416574954987, 0.005826637148857117, 0.018630683422088623, 0.031434737145900726, 0.04423879086971283, 0.05704284459352493, 0.06984689831733704, 0.08265094459056854, 0.09545499831438065, 0.10825905203819275, 0.12106309831142426, 0.13386714458465576, 0.14667120575904846, 0.15947525203227997, 0.17227931320667267, 0.18508335947990417, 0.19788742065429688, 0.21069146692752838, 0.2234955132007599, 0.2362995743751526, 0.2491036206483841, 0.2619076669216156, 0.2747117280960083, 0.2875157594680786, 0.3003198206424713, 0.313123881816864, 0.3259279131889343, 0.338731974363327, 0.3515360355377197]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 10.0, 18.0, 17.0, 24.0, 21.0, 55.0, 77.0, 109.0, 147.0, 234.0, 356.0, 598.0, 996.0, 1712.0, 3063.0, 5814.0, 11207.0, 23625.0, 51881.0, 117196.0, 245047.0, 291655.0, 160183.0, 71163.0, 31863.0, 14933.0, 7439.0, 3802.0, 2108.0, 1194.0, 736.0, 419.0, 278.0, 179.0, 133.0, 90.0, 53.0, 36.0, 31.0, 15.0, 6.0, 12.0, 3.0, 3.0, 8.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24245834350585938, -0.23442840576171875, -0.22639846801757812, -0.2183685302734375, -0.21033859252929688, -0.20230865478515625, -0.19427871704101562, -0.186248779296875, -0.17821884155273438, -0.17018890380859375, -0.16215896606445312, -0.1541290283203125, -0.14609909057617188, -0.13806915283203125, -0.13003921508789062, -0.12200927734375, -0.11397933959960938, -0.10594940185546875, -0.09791946411132812, -0.0898895263671875, -0.08185958862304688, -0.07382965087890625, -0.06579971313476562, -0.057769775390625, -0.049739837646484375, -0.04170989990234375, -0.033679962158203125, -0.0256500244140625, -0.017620086669921875, -0.00959014892578125, -0.001560211181640625, 0.0064697265625, 0.014499664306640625, 0.02252960205078125, 0.030559539794921875, 0.0385894775390625, 0.046619415283203125, 0.05464935302734375, 0.06267929077148438, 0.070709228515625, 0.07873916625976562, 0.08676910400390625, 0.09479904174804688, 0.1028289794921875, 0.11085891723632812, 0.11888885498046875, 0.12691879272460938, 0.13494873046875, 0.14297866821289062, 0.15100860595703125, 0.15903854370117188, 0.1670684814453125, 0.17509841918945312, 0.18312835693359375, 0.19115829467773438, 0.199188232421875, 0.20721817016601562, 0.21524810791015625, 0.22327804565429688, 0.2313079833984375, 0.23933792114257812, 0.24736785888671875, 0.2553977966308594, 0.263427734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 7.0, 4.0, 9.0, 16.0, 12.0, 13.0, 25.0, 34.0, 31.0, 27.0, 51.0, 45.0, 51.0, 44.0, 46.0, 55.0, 47.0, 47.0, 60.0, 56.0, 33.0, 42.0, 36.0, 38.0, 32.0, 30.0, 24.0, 21.0, 12.0, 8.0, 11.0, 9.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96044921875, -0.931854248046875, -0.90325927734375, -0.874664306640625, -0.8460693359375, -0.817474365234375, -0.78887939453125, -0.760284423828125, -0.731689453125, -0.703094482421875, -0.67449951171875, -0.645904541015625, -0.6173095703125, -0.588714599609375, -0.56011962890625, -0.531524658203125, -0.5029296875, -0.474334716796875, -0.44573974609375, -0.417144775390625, -0.3885498046875, -0.359954833984375, -0.33135986328125, -0.302764892578125, -0.274169921875, -0.245574951171875, -0.21697998046875, -0.188385009765625, -0.1597900390625, -0.131195068359375, -0.10260009765625, -0.074005126953125, -0.04541015625, -0.016815185546875, 0.01177978515625, 0.040374755859375, 0.0689697265625, 0.097564697265625, 0.12615966796875, 0.154754638671875, 0.183349609375, 0.211944580078125, 0.24053955078125, 0.269134521484375, 0.2977294921875, 0.326324462890625, 0.35491943359375, 0.383514404296875, 0.412109375, 0.440704345703125, 0.46929931640625, 0.497894287109375, 0.5264892578125, 0.555084228515625, 0.58367919921875, 0.612274169921875, 0.640869140625, 0.669464111328125, 0.69805908203125, 0.726654052734375, 0.7552490234375, 0.783843994140625, 0.81243896484375, 0.841033935546875, 0.86962890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 6.0, 12.0, 14.0, 12.0, 11.0, 10.0, 13.0, 21.0, 19.0, 27.0, 30.0, 31.0, 29.0, 37.0, 46.0, 41.0, 92.0, 243.0, 2969.0, 1035870.0, 8231.0, 298.0, 100.0, 57.0, 32.0, 39.0, 40.0, 29.0, 25.0, 25.0, 29.0, 19.0, 11.0, 13.0, 8.0, 8.0, 8.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.32421875, -3.2252197265625, -3.126220703125, -3.0272216796875, -2.92822265625, -2.8292236328125, -2.730224609375, -2.6312255859375, -2.5322265625, -2.4332275390625, -2.334228515625, -2.2352294921875, -2.13623046875, -2.0372314453125, -1.938232421875, -1.8392333984375, -1.740234375, -1.6412353515625, -1.542236328125, -1.4432373046875, -1.34423828125, -1.2452392578125, -1.146240234375, -1.0472412109375, -0.9482421875, -0.8492431640625, -0.750244140625, -0.6512451171875, -0.55224609375, -0.4532470703125, -0.354248046875, -0.2552490234375, -0.15625, -0.0572509765625, 0.041748046875, 0.1407470703125, 0.23974609375, 0.3387451171875, 0.437744140625, 0.5367431640625, 0.6357421875, 0.7347412109375, 0.833740234375, 0.9327392578125, 1.03173828125, 1.1307373046875, 1.229736328125, 1.3287353515625, 1.427734375, 1.5267333984375, 1.625732421875, 1.7247314453125, 1.82373046875, 1.9227294921875, 2.021728515625, 2.1207275390625, 2.2197265625, 2.3187255859375, 2.417724609375, 2.5167236328125, 2.61572265625, 2.7147216796875, 2.813720703125, 2.9127197265625, 3.01171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 9.0, 7.0, 8.0, 8.0, 14.0, 13.0, 16.0, 11.0, 17.0, 19.0, 35.0, 22.0, 26.0, 38.0, 25.0, 34.0, 28.0, 43.0, 41.0, 42.0, 45.0, 39.0, 38.0, 42.0, 34.0, 36.0, 34.0, 36.0, 24.0, 32.0, 28.0, 25.0, 21.0, 18.0, 16.0, 12.0, 6.0, 9.0, 11.0, 8.0, 10.0, 2.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.806640625, -0.7836532592773438, -0.7606658935546875, -0.7376785278320312, -0.714691162109375, -0.6917037963867188, -0.6687164306640625, -0.6457290649414062, -0.62274169921875, -0.5997543334960938, -0.5767669677734375, -0.5537796020507812, -0.530792236328125, -0.5078048706054688, -0.4848175048828125, -0.46183013916015625, -0.4388427734375, -0.41585540771484375, -0.3928680419921875, -0.36988067626953125, -0.346893310546875, -0.32390594482421875, -0.3009185791015625, -0.27793121337890625, -0.25494384765625, -0.23195648193359375, -0.2089691162109375, -0.18598175048828125, -0.162994384765625, -0.14000701904296875, -0.1170196533203125, -0.09403228759765625, -0.071044921875, -0.04805755615234375, -0.0250701904296875, -0.00208282470703125, 0.020904541015625, 0.04389190673828125, 0.0668792724609375, 0.08986663818359375, 0.11285400390625, 0.13584136962890625, 0.1588287353515625, 0.18181610107421875, 0.204803466796875, 0.22779083251953125, 0.2507781982421875, 0.27376556396484375, 0.2967529296875, 0.31974029541015625, 0.3427276611328125, 0.36571502685546875, 0.388702392578125, 0.41168975830078125, 0.4346771240234375, 0.45766448974609375, 0.48065185546875, 0.5036392211914062, 0.5266265869140625, 0.5496139526367188, 0.572601318359375, 0.5955886840820312, 0.6185760498046875, 0.6415634155273438, 0.66455078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 13.0, 13.0, 14.0, 20.0, 31.0, 34.0, 49.0, 84.0, 157.0, 318.0, 594.0, 1344.0, 3820.0, 13727.0, 83078.0, 722226.0, 190224.0, 23544.0, 5618.0, 1940.0, 778.0, 368.0, 195.0, 108.0, 83.0, 41.0, 30.0, 24.0, 16.0, 11.0, 2.0, 8.0, 8.0, 8.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.283203125, -0.274261474609375, -0.26531982421875, -0.256378173828125, -0.2474365234375, -0.238494873046875, -0.22955322265625, -0.220611572265625, -0.211669921875, -0.202728271484375, -0.19378662109375, -0.184844970703125, -0.1759033203125, -0.166961669921875, -0.15802001953125, -0.149078369140625, -0.14013671875, -0.131195068359375, -0.12225341796875, -0.113311767578125, -0.1043701171875, -0.095428466796875, -0.08648681640625, -0.077545166015625, -0.068603515625, -0.059661865234375, -0.05072021484375, -0.041778564453125, -0.0328369140625, -0.023895263671875, -0.01495361328125, -0.006011962890625, 0.0029296875, 0.011871337890625, 0.02081298828125, 0.029754638671875, 0.0386962890625, 0.047637939453125, 0.05657958984375, 0.065521240234375, 0.074462890625, 0.083404541015625, 0.09234619140625, 0.101287841796875, 0.1102294921875, 0.119171142578125, 0.12811279296875, 0.137054443359375, 0.14599609375, 0.154937744140625, 0.16387939453125, 0.172821044921875, 0.1817626953125, 0.190704345703125, 0.19964599609375, 0.208587646484375, 0.217529296875, 0.226470947265625, 0.23541259765625, 0.244354248046875, 0.2532958984375, 0.262237548828125, 0.27117919921875, 0.280120849609375, 0.2890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 11.0, 10.0, 31.0, 28.0, 49.0, 69.0, 103.0, 166.0, 159.0, 107.0, 75.0, 56.0, 34.0, 18.0, 17.0, 20.0, 10.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.629922866821289e-05, -3.505125641822815e-05, -3.380328416824341e-05, -3.255531191825867e-05, -3.1307339668273926e-05, -3.0059367418289185e-05, -2.8811395168304443e-05, -2.7563422918319702e-05, -2.631545066833496e-05, -2.506747841835022e-05, -2.381950616836548e-05, -2.2571533918380737e-05, -2.1323561668395996e-05, -2.0075589418411255e-05, -1.8827617168426514e-05, -1.7579644918441772e-05, -1.633167266845703e-05, -1.508370041847229e-05, -1.3835728168487549e-05, -1.2587755918502808e-05, -1.1339783668518066e-05, -1.0091811418533325e-05, -8.843839168548584e-06, -7.595866918563843e-06, -6.3478946685791016e-06, -5.09992241859436e-06, -3.851950168609619e-06, -2.603977918624878e-06, -1.3560056686401367e-06, -1.0803341865539551e-07, 1.1399388313293457e-06, 2.387911081314087e-06, 3.635883331298828e-06, 4.883855581283569e-06, 6.1318278312683105e-06, 7.379800081253052e-06, 8.627772331237793e-06, 9.875744581222534e-06, 1.1123716831207275e-05, 1.2371689081192017e-05, 1.3619661331176758e-05, 1.4867633581161499e-05, 1.611560583114624e-05, 1.736357808113098e-05, 1.8611550331115723e-05, 1.9859522581100464e-05, 2.1107494831085205e-05, 2.2355467081069946e-05, 2.3603439331054688e-05, 2.485141158103943e-05, 2.609938383102417e-05, 2.734735608100891e-05, 2.8595328330993652e-05, 2.9843300580978394e-05, 3.1091272830963135e-05, 3.2339245080947876e-05, 3.358721733093262e-05, 3.483518958091736e-05, 3.60831618309021e-05, 3.733113408088684e-05, 3.857910633087158e-05, 3.982707858085632e-05, 4.1075050830841064e-05, 4.2323023080825806e-05, 4.357099533081055e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 13.0, 15.0, 23.0, 38.0, 63.0, 96.0, 137.0, 193.0, 365.0, 629.0, 1152.0, 2475.0, 5267.0, 14111.0, 47929.0, 239474.0, 568726.0, 121567.0, 28732.0, 9564.0, 3936.0, 1803.0, 892.0, 541.0, 316.0, 165.0, 101.0, 72.0, 45.0, 30.0, 25.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.15089797973632812, -0.14493560791015625, -0.13897323608398438, -0.1330108642578125, -0.12704849243164062, -0.12108612060546875, -0.11512374877929688, -0.109161376953125, -0.10319900512695312, -0.09723663330078125, -0.09127426147460938, -0.0853118896484375, -0.07934951782226562, -0.07338714599609375, -0.06742477416992188, -0.06146240234375, -0.055500030517578125, -0.04953765869140625, -0.043575286865234375, -0.0376129150390625, -0.031650543212890625, -0.02568817138671875, -0.019725799560546875, -0.013763427734375, -0.007801055908203125, -0.00183868408203125, 0.004123687744140625, 0.0100860595703125, 0.016048431396484375, 0.02201080322265625, 0.027973175048828125, 0.033935546875, 0.039897918701171875, 0.04586029052734375, 0.051822662353515625, 0.0577850341796875, 0.06374740600585938, 0.06970977783203125, 0.07567214965820312, 0.081634521484375, 0.08759689331054688, 0.09355926513671875, 0.09952163696289062, 0.1054840087890625, 0.11144638061523438, 0.11740875244140625, 0.12337112426757812, 0.12933349609375, 0.13529586791992188, 0.14125823974609375, 0.14722061157226562, 0.1531829833984375, 0.15914535522460938, 0.16510772705078125, 0.17107009887695312, 0.177032470703125, 0.18299484252929688, 0.18895721435546875, 0.19491958618164062, 0.2008819580078125, 0.20684432983398438, 0.21280670166015625, 0.21876907348632812, 0.2247314453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 4.0, 10.0, 11.0, 17.0, 11.0, 13.0, 20.0, 33.0, 23.0, 36.0, 57.0, 53.0, 61.0, 73.0, 77.0, 88.0, 73.0, 64.0, 63.0, 43.0, 31.0, 18.0, 23.0, 18.0, 14.0, 6.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057830810546875, -0.05566740036010742, -0.053503990173339844, -0.051340579986572266, -0.04917716979980469, -0.04701375961303711, -0.04485034942626953, -0.04268693923950195, -0.040523529052734375, -0.0383601188659668, -0.03619670867919922, -0.03403329849243164, -0.03186988830566406, -0.029706478118896484, -0.027543067932128906, -0.025379657745361328, -0.02321624755859375, -0.021052837371826172, -0.018889427185058594, -0.016726016998291016, -0.014562606811523438, -0.01239919662475586, -0.010235786437988281, -0.008072376251220703, -0.005908966064453125, -0.003745555877685547, -0.0015821456909179688, 0.0005812644958496094, 0.0027446746826171875, 0.004908084869384766, 0.007071495056152344, 0.009234905242919922, 0.0113983154296875, 0.013561725616455078, 0.015725135803222656, 0.017888545989990234, 0.020051956176757812, 0.02221536636352539, 0.02437877655029297, 0.026542186737060547, 0.028705596923828125, 0.030869007110595703, 0.03303241729736328, 0.03519582748413086, 0.03735923767089844, 0.039522647857666016, 0.041686058044433594, 0.04384946823120117, 0.04601287841796875, 0.04817628860473633, 0.050339698791503906, 0.052503108978271484, 0.05466651916503906, 0.05682992935180664, 0.05899333953857422, 0.0611567497253418, 0.06332015991210938, 0.06548357009887695, 0.06764698028564453, 0.06981039047241211, 0.07197380065917969, 0.07413721084594727, 0.07630062103271484, 0.07846403121948242, 0.08062744140625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 9.0, 33.0, 82.0, 158.0, 222.0, 225.0, 152.0, 84.0, 21.0, 11.0, 10.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0914006233215332, -0.9922460913658142, -0.8930915594100952, -0.7939370274543762, -0.6947824954986572, -0.5956279635429382, -0.49647343158721924, -0.39731889963150024, -0.29816436767578125, -0.19900983572006226, -0.09985530376434326, -0.0007007718086242676, 0.09845376014709473, 0.19760829210281372, 0.2967628240585327, 0.3959173560142517, 0.4950718879699707, 0.5942264199256897, 0.6933809518814087, 0.7925354838371277, 0.8916900157928467, 0.9908445477485657, 1.0899990797042847, 1.1891536712646484, 1.2883081436157227, 1.3874626159667969, 1.4866172075271606, 1.5857717990875244, 1.6849262714385986, 1.7840807437896729, 1.8832353353500366, 1.9823899269104004, 2.0815443992614746, 2.180698871612549, 2.279853343963623, 2.3790080547332764, 2.4781625270843506, 2.577316999435425, 2.676471710205078, 2.7756261825561523, 2.8747806549072266, 2.973935127258301, 3.073089599609375, 3.1722443103790283, 3.2713987827301025, 3.3705532550811768, 3.46970796585083, 3.5688624382019043, 3.6680169105529785, 3.7671713829040527, 3.866325855255127, 3.9654805660247803, 4.064635276794434, 4.163789749145508, 4.262944221496582, 4.362098693847656, 4.4612531661987305, 4.560407638549805, 4.659562110900879, 4.758716583251953, 4.857871055603027, 4.95702600479126, 5.056180477142334, 5.155334949493408, 5.254489421844482]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 2.0, 2.0, 5.0, 4.0, 9.0, 12.0, 13.0, 13.0, 23.0, 17.0, 24.0, 18.0, 36.0, 28.0, 39.0, 43.0, 44.0, 57.0, 39.0, 47.0, 54.0, 42.0, 43.0, 45.0, 47.0, 39.0, 40.0, 33.0, 24.0, 38.0, 25.0, 10.0, 26.0, 15.0, 6.0, 8.0, 7.0, 2.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.376570701599121, -1.3364779949188232, -1.2963852882385254, -1.2562925815582275, -1.2161998748779297, -1.1761071681976318, -1.136014461517334, -1.0959217548370361, -1.0558290481567383, -1.0157363414764404, -0.9756436347961426, -0.9355509281158447, -0.8954582214355469, -0.855365514755249, -0.8152728080749512, -0.7751801013946533, -0.7350874543190002, -0.6949947476387024, -0.6549020409584045, -0.6148093342781067, -0.5747166275978088, -0.534623920917511, -0.4945312440395355, -0.45443853735923767, -0.4143458306789398, -0.37425312399864197, -0.3341604173183441, -0.29406774044036865, -0.2539750337600708, -0.21388231217861176, -0.1737896203994751, -0.13369691371917725, -0.0936042070388794, -0.05351150408387184, -0.013418801128864288, 0.026673898100852966, 0.06676660478115082, 0.10685931146144867, 0.14695200324058533, 0.18704470992088318, 0.22713741660118103, 0.2672301232814789, 0.30732282996177673, 0.3474155068397522, 0.38750821352005005, 0.4276009202003479, 0.46769362688064575, 0.5077863335609436, 0.5478790402412415, 0.5879717469215393, 0.6280644536018372, 0.668157160282135, 0.7082498669624329, 0.7483425736427307, 0.7884352207183838, 0.8285279273986816, 0.8686206340789795, 0.9087133407592773, 0.9488060474395752, 0.988898754119873, 1.028991460800171, 1.0690841674804688, 1.1091768741607666, 1.1492695808410645, 1.1893622875213623]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 10.0, 11.0, 18.0, 26.0, 32.0, 25.0, 53.0, 83.0, 127.0, 182.0, 326.0, 738.0, 1880.0, 6262.0, 30429.0, 206677.0, 1580113.0, 1985799.0, 330026.0, 39180.0, 8188.0, 2263.0, 816.0, 373.0, 191.0, 106.0, 82.0, 57.0, 37.0, 31.0, 22.0, 13.0, 11.0, 16.0, 9.0, 6.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.990234375, -0.9603118896484375, -0.930389404296875, -0.9004669189453125, -0.87054443359375, -0.8406219482421875, -0.810699462890625, -0.7807769775390625, -0.7508544921875, -0.7209320068359375, -0.691009521484375, -0.6610870361328125, -0.63116455078125, -0.6012420654296875, -0.571319580078125, -0.5413970947265625, -0.511474609375, -0.4815521240234375, -0.451629638671875, -0.4217071533203125, -0.39178466796875, -0.3618621826171875, -0.331939697265625, -0.3020172119140625, -0.2720947265625, -0.2421722412109375, -0.212249755859375, -0.1823272705078125, -0.15240478515625, -0.1224822998046875, -0.092559814453125, -0.0626373291015625, -0.03271484375, -0.0027923583984375, 0.027130126953125, 0.0570526123046875, 0.08697509765625, 0.1168975830078125, 0.146820068359375, 0.1767425537109375, 0.2066650390625, 0.2365875244140625, 0.266510009765625, 0.2964324951171875, 0.32635498046875, 0.3562774658203125, 0.386199951171875, 0.4161224365234375, 0.446044921875, 0.4759674072265625, 0.505889892578125, 0.5358123779296875, 0.56573486328125, 0.5956573486328125, 0.625579833984375, 0.6555023193359375, 0.6854248046875, 0.7153472900390625, 0.745269775390625, 0.7751922607421875, 0.80511474609375, 0.8350372314453125, 0.864959716796875, 0.8948822021484375, 0.9248046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 10.0, 8.0, 10.0, 20.0, 14.0, 14.0, 24.0, 31.0, 32.0, 46.0, 42.0, 49.0, 56.0, 72.0, 64.0, 69.0, 47.0, 45.0, 57.0, 54.0, 62.0, 29.0, 39.0, 18.0, 23.0, 22.0, 6.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7705078125, -0.7491607666015625, -0.727813720703125, -0.7064666748046875, -0.68511962890625, -0.6637725830078125, -0.642425537109375, -0.6210784912109375, -0.5997314453125, -0.5783843994140625, -0.557037353515625, -0.5356903076171875, -0.51434326171875, -0.4929962158203125, -0.471649169921875, -0.4503021240234375, -0.428955078125, -0.4076080322265625, -0.386260986328125, -0.3649139404296875, -0.34356689453125, -0.3222198486328125, -0.300872802734375, -0.2795257568359375, -0.2581787109375, -0.2368316650390625, -0.215484619140625, -0.1941375732421875, -0.17279052734375, -0.1514434814453125, -0.130096435546875, -0.1087493896484375, -0.08740234375, -0.0660552978515625, -0.044708251953125, -0.0233612060546875, -0.00201416015625, 0.0193328857421875, 0.040679931640625, 0.0620269775390625, 0.0833740234375, 0.1047210693359375, 0.126068115234375, 0.1474151611328125, 0.16876220703125, 0.1901092529296875, 0.211456298828125, 0.2328033447265625, 0.254150390625, 0.2754974365234375, 0.296844482421875, 0.3181915283203125, 0.33953857421875, 0.3608856201171875, 0.382232666015625, 0.4035797119140625, 0.4249267578125, 0.4462738037109375, 0.467620849609375, 0.4889678955078125, 0.51031494140625, 0.5316619873046875, 0.553009033203125, 0.5743560791015625, 0.595703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 9.0, 8.0, 5.0, 8.0, 18.0, 37.0, 51.0, 138.0, 476.0, 7483.0, 4072915.0, 111332.0, 1347.0, 240.0, 88.0, 53.0, 25.0, 17.0, 17.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45361328125, -3.3291015625, -3.20458984375, -3.080078125, -2.95556640625, -2.8310546875, -2.70654296875, -2.58203125, -2.45751953125, -2.3330078125, -2.20849609375, -2.083984375, -1.95947265625, -1.8349609375, -1.71044921875, -1.5859375, -1.46142578125, -1.3369140625, -1.21240234375, -1.087890625, -0.96337890625, -0.8388671875, -0.71435546875, -0.58984375, -0.46533203125, -0.3408203125, -0.21630859375, -0.091796875, 0.03271484375, 0.1572265625, 0.28173828125, 0.40625, 0.53076171875, 0.6552734375, 0.77978515625, 0.904296875, 1.02880859375, 1.1533203125, 1.27783203125, 1.40234375, 1.52685546875, 1.6513671875, 1.77587890625, 1.900390625, 2.02490234375, 2.1494140625, 2.27392578125, 2.3984375, 2.52294921875, 2.6474609375, 2.77197265625, 2.896484375, 3.02099609375, 3.1455078125, 3.27001953125, 3.39453125, 3.51904296875, 3.6435546875, 3.76806640625, 3.892578125, 4.01708984375, 4.1416015625, 4.26611328125, 4.390625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 19.0, 13.0, 16.0, 21.0, 30.0, 54.0, 85.0, 112.0, 169.0, 256.0, 384.0, 527.0, 598.0, 533.0, 405.0, 271.0, 175.0, 116.0, 83.0, 59.0, 40.0, 27.0, 21.0, 15.0, 14.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30859375, -0.2999114990234375, -0.291229248046875, -0.2825469970703125, -0.27386474609375, -0.2651824951171875, -0.256500244140625, -0.2478179931640625, -0.2391357421875, -0.2304534912109375, -0.221771240234375, -0.2130889892578125, -0.20440673828125, -0.1957244873046875, -0.187042236328125, -0.1783599853515625, -0.169677734375, -0.1609954833984375, -0.152313232421875, -0.1436309814453125, -0.13494873046875, -0.1262664794921875, -0.117584228515625, -0.1089019775390625, -0.1002197265625, -0.0915374755859375, -0.082855224609375, -0.0741729736328125, -0.06549072265625, -0.0568084716796875, -0.048126220703125, -0.0394439697265625, -0.03076171875, -0.0220794677734375, -0.013397216796875, -0.0047149658203125, 0.00396728515625, 0.0126495361328125, 0.021331787109375, 0.0300140380859375, 0.0386962890625, 0.0473785400390625, 0.056060791015625, 0.0647430419921875, 0.07342529296875, 0.0821075439453125, 0.090789794921875, 0.0994720458984375, 0.108154296875, 0.1168365478515625, 0.125518798828125, 0.1342010498046875, 0.14288330078125, 0.1515655517578125, 0.160247802734375, 0.1689300537109375, 0.1776123046875, 0.1862945556640625, 0.194976806640625, 0.2036590576171875, 0.21234130859375, 0.2210235595703125, 0.229705810546875, 0.2383880615234375, 0.2470703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 11.0, 11.0, 22.0, 26.0, 45.0, 58.0, 67.0, 96.0, 104.0, 115.0, 102.0, 95.0, 71.0, 49.0, 45.0, 25.0, 22.0, 12.0, 11.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.981998085975647, -0.9462701678276062, -0.9105421900749207, -0.8748142719268799, -0.8390862941741943, -0.8033583760261536, -0.7676304578781128, -0.7319024801254272, -0.6961745619773865, -0.6604466438293457, -0.6247186660766602, -0.5889907479286194, -0.5532628297805786, -0.5175348520278931, -0.4818069338798523, -0.44607898592948914, -0.410351037979126, -0.3746230900287628, -0.33889514207839966, -0.3031672239303589, -0.2674392759799957, -0.23171132802963257, -0.1959833949804306, -0.16025546193122864, -0.12452751398086548, -0.08879957348108292, -0.053071632981300354, -0.017343692481517792, 0.01838424801826477, 0.05411219596862793, 0.0898401290178299, 0.12556806206703186, 0.16129612922668457, 0.19702407717704773, 0.2327520102262497, 0.26847994327545166, 0.3042078912258148, 0.339935839176178, 0.37566375732421875, 0.4113917052745819, 0.44711965322494507, 0.4828476011753082, 0.5185755491256714, 0.5543034672737122, 0.5900313854217529, 0.6257593631744385, 0.6614872813224792, 0.69721519947052, 0.7329431772232056, 0.7686710953712463, 0.8043990731239319, 0.8401269912719727, 0.8758549690246582, 0.911582887172699, 0.9473108053207397, 0.9830387830734253, 1.0187666416168213, 1.0544946193695068, 1.0902224779129028, 1.1259504556655884, 1.161678433418274, 1.19740629196167, 1.2331342697143555, 1.268862247467041, 1.3045902252197266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 12.0, 8.0, 11.0, 16.0, 22.0, 30.0, 25.0, 29.0, 29.0, 35.0, 46.0, 47.0, 63.0, 57.0, 68.0, 52.0, 39.0, 48.0, 47.0, 42.0, 53.0, 47.0, 27.0, 37.0, 22.0, 16.0, 16.0, 13.0, 11.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.8157256245613098, -0.7943438291549683, -0.7729619741439819, -0.7515801787376404, -0.7301983833312988, -0.7088165283203125, -0.687434732913971, -0.6660529375076294, -0.6446710824966431, -0.6232892870903015, -0.6019074320793152, -0.5805256366729736, -0.5591438412666321, -0.5377619862556458, -0.5163801908493042, -0.49499836564064026, -0.4736165702342987, -0.45223474502563477, -0.4308529496192932, -0.4094711244106293, -0.38808929920196533, -0.3667075037956238, -0.34532567858695984, -0.3239438533782959, -0.30256205797195435, -0.2811802327632904, -0.25979843735694885, -0.2384166121482849, -0.21703478693962097, -0.19565297663211823, -0.17427116632461548, -0.15288934111595154, -0.1315075159072876, -0.11012569814920425, -0.08874388039112091, -0.06736207008361816, -0.04598025232553482, -0.024598434567451477, -0.0032166242599487305, 0.01816520094871521, 0.03954701125621796, 0.0609288290143013, 0.08231064677238464, 0.10369245707988739, 0.12507426738739014, 0.14645609259605408, 0.16783790290355682, 0.18921972811222076, 0.2106015384197235, 0.23198334872722626, 0.253365159034729, 0.27474698424339294, 0.2961288094520569, 0.31751060485839844, 0.3388924300670624, 0.3602742552757263, 0.38165605068206787, 0.4030378758907318, 0.42441967129707336, 0.4458014965057373, 0.46718332171440125, 0.4885651469230652, 0.5099469423294067, 0.5313287973403931, 0.5527105927467346]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 15.0, 24.0, 19.0, 68.0, 133.0, 305.0, 787.0, 2403.0, 9596.0, 61347.0, 582549.0, 347261.0, 34852.0, 6326.0, 1768.0, 606.0, 244.0, 116.0, 54.0, 35.0, 14.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4834480285644531, -0.46958160400390625, -0.4557151794433594, -0.4418487548828125, -0.4279823303222656, -0.41411590576171875, -0.4002494812011719, -0.386383056640625, -0.3725166320800781, -0.35865020751953125, -0.3447837829589844, -0.3309173583984375, -0.3170509338378906, -0.30318450927734375, -0.2893180847167969, -0.27545166015625, -0.2615852355957031, -0.24771881103515625, -0.23385238647460938, -0.2199859619140625, -0.20611953735351562, -0.19225311279296875, -0.17838668823242188, -0.164520263671875, -0.15065383911132812, -0.13678741455078125, -0.12292098999023438, -0.1090545654296875, -0.09518814086914062, -0.08132171630859375, -0.06745529174804688, -0.0535888671875, -0.039722442626953125, -0.02585601806640625, -0.011989593505859375, 0.0018768310546875, 0.015743255615234375, 0.02960968017578125, 0.043476104736328125, 0.057342529296875, 0.07120895385742188, 0.08507537841796875, 0.09894180297851562, 0.1128082275390625, 0.12667465209960938, 0.14054107666015625, 0.15440750122070312, 0.16827392578125, 0.18214035034179688, 0.19600677490234375, 0.20987319946289062, 0.2237396240234375, 0.23760604858398438, 0.25147247314453125, 0.2653388977050781, 0.279205322265625, 0.2930717468261719, 0.30693817138671875, 0.3208045959472656, 0.3346710205078125, 0.3485374450683594, 0.36240386962890625, 0.3762702941894531, 0.39013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 15.0, 19.0, 17.0, 22.0, 28.0, 46.0, 32.0, 39.0, 63.0, 61.0, 68.0, 64.0, 57.0, 68.0, 66.0, 58.0, 50.0, 46.0, 40.0, 29.0, 22.0, 22.0, 22.0, 10.0, 2.0, 2.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490966796875, -0.47652435302734375, -0.4620819091796875, -0.44763946533203125, -0.433197021484375, -0.41875457763671875, -0.4043121337890625, -0.38986968994140625, -0.37542724609375, -0.36098480224609375, -0.3465423583984375, -0.33209991455078125, -0.317657470703125, -0.30321502685546875, -0.2887725830078125, -0.27433013916015625, -0.2598876953125, -0.24544525146484375, -0.2310028076171875, -0.21656036376953125, -0.202117919921875, -0.18767547607421875, -0.1732330322265625, -0.15879058837890625, -0.14434814453125, -0.12990570068359375, -0.1154632568359375, -0.10102081298828125, -0.086578369140625, -0.07213592529296875, -0.0576934814453125, -0.04325103759765625, -0.02880859375, -0.01436614990234375, 7.62939453125e-05, 0.01451873779296875, 0.028961181640625, 0.04340362548828125, 0.0578460693359375, 0.07228851318359375, 0.08673095703125, 0.10117340087890625, 0.1156158447265625, 0.13005828857421875, 0.144500732421875, 0.15894317626953125, 0.1733856201171875, 0.18782806396484375, 0.2022705078125, 0.21671295166015625, 0.2311553955078125, 0.24559783935546875, 0.260040283203125, 0.27448272705078125, 0.2889251708984375, 0.30336761474609375, 0.31781005859375, 0.33225250244140625, 0.3466949462890625, 0.36113739013671875, 0.375579833984375, 0.39002227783203125, 0.4044647216796875, 0.41890716552734375, 0.433349609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 3.0, 5.0, 7.0, 13.0, 17.0, 23.0, 26.0, 30.0, 50.0, 86.0, 115.0, 175.0, 297.0, 486.0, 849.0, 1623.0, 3064.0, 6310.0, 14380.0, 34951.0, 95938.0, 269365.0, 365552.0, 159840.0, 55882.0, 21398.0, 9084.0, 4138.0, 2113.0, 1084.0, 637.0, 343.0, 206.0, 157.0, 85.0, 46.0, 41.0, 28.0, 26.0, 19.0, 14.0, 13.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.178466796875, -0.1730976104736328, -0.16772842407226562, -0.16235923767089844, -0.15699005126953125, -0.15162086486816406, -0.14625167846679688, -0.1408824920654297, -0.1355133056640625, -0.1301441192626953, -0.12477493286132812, -0.11940574645996094, -0.11403656005859375, -0.10866737365722656, -0.10329818725585938, -0.09792900085449219, -0.092559814453125, -0.08719062805175781, -0.08182144165039062, -0.07645225524902344, -0.07108306884765625, -0.06571388244628906, -0.060344696044921875, -0.05497550964355469, -0.0496063232421875, -0.04423713684082031, -0.038867950439453125, -0.03349876403808594, -0.02812957763671875, -0.022760391235351562, -0.017391204833984375, -0.012022018432617188, -0.00665283203125, -0.0012836456298828125, 0.004085540771484375, 0.009454727172851562, 0.01482391357421875, 0.020193099975585938, 0.025562286376953125, 0.030931472778320312, 0.0363006591796875, 0.04166984558105469, 0.047039031982421875, 0.05240821838378906, 0.05777740478515625, 0.06314659118652344, 0.06851577758789062, 0.07388496398925781, 0.079254150390625, 0.08462333679199219, 0.08999252319335938, 0.09536170959472656, 0.10073089599609375, 0.10610008239746094, 0.11146926879882812, 0.11683845520019531, 0.1222076416015625, 0.1275768280029297, 0.13294601440429688, 0.13831520080566406, 0.14368438720703125, 0.14905357360839844, 0.15442276000976562, 0.1597919464111328, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 8.0, 16.0, 14.0, 17.0, 34.0, 15.0, 19.0, 27.0, 24.0, 41.0, 39.0, 41.0, 49.0, 41.0, 44.0, 42.0, 32.0, 43.0, 38.0, 37.0, 43.0, 32.0, 28.0, 31.0, 43.0, 26.0, 26.0, 23.0, 16.0, 21.0, 6.0, 14.0, 12.0, 12.0, 6.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.513916015625, -0.49560546875, -0.477294921875, -0.458984375, -0.440673828125, -0.42236328125, -0.404052734375, -0.3857421875, -0.367431640625, -0.34912109375, -0.330810546875, -0.3125, -0.294189453125, -0.27587890625, -0.257568359375, -0.2392578125, -0.220947265625, -0.20263671875, -0.184326171875, -0.166015625, -0.147705078125, -0.12939453125, -0.111083984375, -0.0927734375, -0.074462890625, -0.05615234375, -0.037841796875, -0.01953125, -0.001220703125, 0.01708984375, 0.035400390625, 0.0537109375, 0.072021484375, 0.09033203125, 0.108642578125, 0.126953125, 0.145263671875, 0.16357421875, 0.181884765625, 0.2001953125, 0.218505859375, 0.23681640625, 0.255126953125, 0.2734375, 0.291748046875, 0.31005859375, 0.328369140625, 0.3466796875, 0.364990234375, 0.38330078125, 0.401611328125, 0.419921875, 0.438232421875, 0.45654296875, 0.474853515625, 0.4931640625, 0.511474609375, 0.52978515625, 0.548095703125, 0.56640625, 0.584716796875, 0.60302734375, 0.621337890625, 0.6396484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 15.0, 20.0, 30.0, 43.0, 61.0, 74.0, 98.0, 172.0, 258.0, 421.0, 740.0, 1224.0, 2213.0, 4364.0, 8949.0, 19334.0, 44785.0, 113768.0, 315500.0, 329384.0, 120320.0, 46943.0, 20203.0, 9363.0, 4601.0, 2336.0, 1339.0, 712.0, 474.0, 270.0, 142.0, 135.0, 74.0, 53.0, 28.0, 25.0, 17.0, 13.0, 12.0, 9.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.061676025390625, -0.05986356735229492, -0.058051109313964844, -0.056238651275634766, -0.05442619323730469, -0.05261373519897461, -0.05080127716064453, -0.04898881912231445, -0.047176361083984375, -0.0453639030456543, -0.04355144500732422, -0.04173898696899414, -0.03992652893066406, -0.038114070892333984, -0.036301612854003906, -0.03448915481567383, -0.03267669677734375, -0.030864238739013672, -0.029051780700683594, -0.027239322662353516, -0.025426864624023438, -0.02361440658569336, -0.02180194854736328, -0.019989490509033203, -0.018177032470703125, -0.016364574432373047, -0.014552116394042969, -0.01273965835571289, -0.010927200317382812, -0.009114742279052734, -0.007302284240722656, -0.005489826202392578, -0.0036773681640625, -0.0018649101257324219, -5.245208740234375e-05, 0.0017600059509277344, 0.0035724639892578125, 0.005384922027587891, 0.007197380065917969, 0.009009838104248047, 0.010822296142578125, 0.012634754180908203, 0.014447212219238281, 0.01625967025756836, 0.018072128295898438, 0.019884586334228516, 0.021697044372558594, 0.023509502410888672, 0.02532196044921875, 0.027134418487548828, 0.028946876525878906, 0.030759334564208984, 0.03257179260253906, 0.03438425064086914, 0.03619670867919922, 0.0380091667175293, 0.039821624755859375, 0.04163408279418945, 0.04344654083251953, 0.04525899887084961, 0.04707145690917969, 0.048883914947509766, 0.050696372985839844, 0.05250883102416992, 0.0543212890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 8.0, 5.0, 9.0, 12.0, 17.0, 21.0, 24.0, 36.0, 44.0, 68.0, 92.0, 117.0, 140.0, 109.0, 75.0, 59.0, 52.0, 33.0, 26.0, 20.0, 14.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1021575927734375e-05, -4.9620866775512695e-05, -4.8220157623291016e-05, -4.6819448471069336e-05, -4.5418739318847656e-05, -4.4018030166625977e-05, -4.26173210144043e-05, -4.121661186218262e-05, -3.981590270996094e-05, -3.841519355773926e-05, -3.701448440551758e-05, -3.56137752532959e-05, -3.421306610107422e-05, -3.281235694885254e-05, -3.141164779663086e-05, -3.001093864440918e-05, -2.86102294921875e-05, -2.720952033996582e-05, -2.580881118774414e-05, -2.440810203552246e-05, -2.300739288330078e-05, -2.16066837310791e-05, -2.0205974578857422e-05, -1.8805265426635742e-05, -1.7404556274414062e-05, -1.6003847122192383e-05, -1.4603137969970703e-05, -1.3202428817749023e-05, -1.1801719665527344e-05, -1.0401010513305664e-05, -9.000301361083984e-06, -7.599592208862305e-06, -6.198883056640625e-06, -4.798173904418945e-06, -3.3974647521972656e-06, -1.996755599975586e-06, -5.960464477539062e-07, 8.046627044677734e-07, 2.205371856689453e-06, 3.606081008911133e-06, 5.0067901611328125e-06, 6.407499313354492e-06, 7.808208465576172e-06, 9.208917617797852e-06, 1.0609626770019531e-05, 1.2010335922241211e-05, 1.341104507446289e-05, 1.481175422668457e-05, 1.621246337890625e-05, 1.761317253112793e-05, 1.901388168334961e-05, 2.041459083557129e-05, 2.181529998779297e-05, 2.321600914001465e-05, 2.4616718292236328e-05, 2.6017427444458008e-05, 2.7418136596679688e-05, 2.8818845748901367e-05, 3.0219554901123047e-05, 3.1620264053344727e-05, 3.3020973205566406e-05, 3.4421682357788086e-05, 3.5822391510009766e-05, 3.7223100662231445e-05, 3.8623809814453125e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 10.0, 12.0, 20.0, 20.0, 21.0, 34.0, 59.0, 74.0, 196.0, 506.0, 1583.0, 6123.0, 27407.0, 166828.0, 658876.0, 153225.0, 25229.0, 5775.0, 1583.0, 494.0, 199.0, 76.0, 49.0, 32.0, 24.0, 14.0, 13.0, 11.0, 15.0, 6.0, 3.0, 6.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13232421875, -0.1282501220703125, -0.124176025390625, -0.1201019287109375, -0.11602783203125, -0.1119537353515625, -0.107879638671875, -0.1038055419921875, -0.0997314453125, -0.0956573486328125, -0.091583251953125, -0.0875091552734375, -0.08343505859375, -0.0793609619140625, -0.075286865234375, -0.0712127685546875, -0.067138671875, -0.0630645751953125, -0.058990478515625, -0.0549163818359375, -0.05084228515625, -0.0467681884765625, -0.042694091796875, -0.0386199951171875, -0.0345458984375, -0.0304718017578125, -0.026397705078125, -0.0223236083984375, -0.01824951171875, -0.0141754150390625, -0.010101318359375, -0.0060272216796875, -0.001953125, 0.0021209716796875, 0.006195068359375, 0.0102691650390625, 0.01434326171875, 0.0184173583984375, 0.022491455078125, 0.0265655517578125, 0.0306396484375, 0.0347137451171875, 0.038787841796875, 0.0428619384765625, 0.04693603515625, 0.0510101318359375, 0.055084228515625, 0.0591583251953125, 0.063232421875, 0.0673065185546875, 0.071380615234375, 0.0754547119140625, 0.07952880859375, 0.0836029052734375, 0.087677001953125, 0.0917510986328125, 0.0958251953125, 0.0998992919921875, 0.103973388671875, 0.1080474853515625, 0.11212158203125, 0.1161956787109375, 0.120269775390625, 0.1243438720703125, 0.12841796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 3.0, 4.0, 7.0, 9.0, 7.0, 9.0, 13.0, 7.0, 19.0, 23.0, 30.0, 39.0, 49.0, 61.0, 54.0, 89.0, 81.0, 87.0, 79.0, 72.0, 51.0, 47.0, 32.0, 23.0, 17.0, 18.0, 10.0, 16.0, 8.0, 6.0, 6.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0197601318359375, -0.019194602966308594, -0.018629074096679688, -0.01806354522705078, -0.017498016357421875, -0.01693248748779297, -0.016366958618164062, -0.015801429748535156, -0.01523590087890625, -0.014670372009277344, -0.014104843139648438, -0.013539314270019531, -0.012973785400390625, -0.012408256530761719, -0.011842727661132812, -0.011277198791503906, -0.010711669921875, -0.010146141052246094, -0.009580612182617188, -0.009015083312988281, -0.008449554443359375, -0.007884025573730469, -0.0073184967041015625, -0.006752967834472656, -0.00618743896484375, -0.005621910095214844, -0.0050563812255859375, -0.004490852355957031, -0.003925323486328125, -0.0033597946166992188, -0.0027942657470703125, -0.0022287368774414062, -0.0016632080078125, -0.0010976791381835938, -0.0005321502685546875, 3.337860107421875e-05, 0.000598907470703125, 0.0011644363403320312, 0.0017299652099609375, 0.0022954940795898438, 0.00286102294921875, 0.0034265518188476562, 0.0039920806884765625, 0.004557609558105469, 0.005123138427734375, 0.005688667297363281, 0.0062541961669921875, 0.006819725036621094, 0.00738525390625, 0.007950782775878906, 0.008516311645507812, 0.009081840515136719, 0.009647369384765625, 0.010212898254394531, 0.010778427124023438, 0.011343955993652344, 0.01190948486328125, 0.012475013732910156, 0.013040542602539062, 0.013606071472167969, 0.014171600341796875, 0.014737129211425781, 0.015302658081054688, 0.015868186950683594, 0.0164337158203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 12.0, 14.0, 23.0, 40.0, 64.0, 111.0, 125.0, 157.0, 151.0, 113.0, 77.0, 46.0, 26.0, 15.0, 13.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7934081554412842, -0.7666274309158325, -0.7398466467857361, -0.7130659222602844, -0.6862851977348328, -0.6595044136047363, -0.6327236890792847, -0.605942964553833, -0.5791621804237366, -0.5523814558982849, -0.5256006717681885, -0.4988199472427368, -0.47203919291496277, -0.4452584385871887, -0.41847771406173706, -0.391696959733963, -0.36491623520851135, -0.3381354808807373, -0.31135475635528564, -0.2845740020275116, -0.25779324769973755, -0.2310125082731247, -0.20423176884651184, -0.1774510145187378, -0.15067027509212494, -0.12388952821493149, -0.09710878133773804, -0.07032804191112518, -0.04354729503393173, -0.01676654815673828, 0.010014191269874573, 0.03679494559764862, 0.06357568502426147, 0.09035643190145493, 0.11713717877864838, 0.14391791820526123, 0.17069867253303528, 0.19747941195964813, 0.224260151386261, 0.25104090571403503, 0.2778216600418091, 0.30460241436958313, 0.3313831388950348, 0.35816389322280884, 0.3849446475505829, 0.41172540187835693, 0.4385061264038086, 0.46528688073158264, 0.4920676052570343, 0.5188483595848083, 0.54562908411026, 0.5724098682403564, 0.5991905927658081, 0.6259713172912598, 0.6527520418167114, 0.6795328259468079, 0.7063135504722595, 0.7330942749977112, 0.7598750591278076, 0.7866557836532593, 0.8134365081787109, 0.8402172923088074, 0.866998016834259, 0.8937788009643555, 0.9205595254898071]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 12.0, 8.0, 21.0, 23.0, 25.0, 27.0, 35.0, 35.0, 50.0, 56.0, 69.0, 73.0, 65.0, 70.0, 53.0, 59.0, 59.0, 57.0, 47.0, 26.0, 31.0, 25.0, 18.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5352803468704224, -0.5211170315742493, -0.5069537162780762, -0.4927903711795807, -0.4786270260810852, -0.4644637107849121, -0.450300395488739, -0.43613705039024353, -0.42197373509407043, -0.40781041979789734, -0.39364707469940186, -0.37948375940322876, -0.3653204143047333, -0.3511570990085602, -0.3369937539100647, -0.3228304386138916, -0.3086671233177185, -0.2945038080215454, -0.2803404629230499, -0.26617714762687683, -0.25201380252838135, -0.23785048723220825, -0.22368715703487396, -0.20952382683753967, -0.1953604817390442, -0.1811971515417099, -0.1670338213443756, -0.15287050604820251, -0.13870717585086823, -0.12454384565353394, -0.11038051545619965, -0.09621719270944595, -0.08205386996269226, -0.06789053976535797, -0.05372721701860428, -0.03956388682126999, -0.025400560349225998, -0.011237233877182007, 0.0029260963201522827, 0.017089419066905975, 0.031252749264240265, 0.045416075736284256, 0.05957940220832825, 0.07374273240566254, 0.08790606260299683, 0.10206938534975052, 0.11623271554708481, 0.1303960382938385, 0.1445593684911728, 0.15872269868850708, 0.17288602888584137, 0.18704935908317566, 0.20121267437934875, 0.21537600457668304, 0.22953933477401733, 0.24370265007019043, 0.2578659951686859, 0.272029310464859, 0.2861926555633545, 0.3003559708595276, 0.31451931595802307, 0.32868263125419617, 0.34284597635269165, 0.35700929164886475, 0.37117260694503784]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 14.0, 20.0, 28.0, 46.0, 115.0, 221.0, 469.0, 1016.0, 2217.0, 5295.0, 14487.0, 58932.0, 319425.0, 492555.0, 116650.0, 23922.0, 7526.0, 2987.0, 1342.0, 642.0, 295.0, 164.0, 85.0, 44.0, 26.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.5692901611328125, -0.552642822265625, -0.5359954833984375, -0.51934814453125, -0.5027008056640625, -0.486053466796875, -0.4694061279296875, -0.4527587890625, -0.4361114501953125, -0.419464111328125, -0.4028167724609375, -0.38616943359375, -0.3695220947265625, -0.352874755859375, -0.3362274169921875, -0.319580078125, -0.3029327392578125, -0.286285400390625, -0.2696380615234375, -0.25299072265625, -0.2363433837890625, -0.219696044921875, -0.2030487060546875, -0.1864013671875, -0.1697540283203125, -0.153106689453125, -0.1364593505859375, -0.11981201171875, -0.1031646728515625, -0.086517333984375, -0.0698699951171875, -0.05322265625, -0.0365753173828125, -0.019927978515625, -0.0032806396484375, 0.01336669921875, 0.0300140380859375, 0.046661376953125, 0.0633087158203125, 0.0799560546875, 0.0966033935546875, 0.113250732421875, 0.1298980712890625, 0.14654541015625, 0.1631927490234375, 0.179840087890625, 0.1964874267578125, 0.213134765625, 0.2297821044921875, 0.246429443359375, 0.2630767822265625, 0.27972412109375, 0.2963714599609375, 0.313018798828125, 0.3296661376953125, 0.3463134765625, 0.3629608154296875, 0.379608154296875, 0.3962554931640625, 0.41290283203125, 0.4295501708984375, 0.446197509765625, 0.4628448486328125, 0.4794921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 8.0, 6.0, 5.0, 10.0, 10.0, 15.0, 12.0, 36.0, 25.0, 33.0, 32.0, 49.0, 47.0, 48.0, 79.0, 53.0, 50.0, 58.0, 66.0, 62.0, 56.0, 53.0, 40.0, 38.0, 21.0, 34.0, 9.0, 13.0, 8.0, 8.0, 9.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.17578125, -1.1461410522460938, -1.1165008544921875, -1.0868606567382812, -1.057220458984375, -1.0275802612304688, -0.9979400634765625, -0.9682998657226562, -0.93865966796875, -0.9090194702148438, -0.8793792724609375, -0.8497390747070312, -0.820098876953125, -0.7904586791992188, -0.7608184814453125, -0.7311782836914062, -0.7015380859375, -0.6718978881835938, -0.6422576904296875, -0.6126174926757812, -0.582977294921875, -0.5533370971679688, -0.5236968994140625, -0.49405670166015625, -0.46441650390625, -0.43477630615234375, -0.4051361083984375, -0.37549591064453125, -0.345855712890625, -0.31621551513671875, -0.2865753173828125, -0.25693511962890625, -0.227294921875, -0.19765472412109375, -0.1680145263671875, -0.13837432861328125, -0.108734130859375, -0.07909393310546875, -0.0494537353515625, -0.01981353759765625, 0.00982666015625, 0.03946685791015625, 0.0691070556640625, 0.09874725341796875, 0.128387451171875, 0.15802764892578125, 0.1876678466796875, 0.21730804443359375, 0.2469482421875, 0.27658843994140625, 0.3062286376953125, 0.33586883544921875, 0.365509033203125, 0.39514923095703125, 0.4247894287109375, 0.45442962646484375, 0.48406982421875, 0.5137100219726562, 0.5433502197265625, 0.5729904174804688, 0.602630615234375, 0.6322708129882812, 0.6619110107421875, 0.6915512084960938, 0.72119140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 6.0, 5.0, 6.0, 9.0, 17.0, 19.0, 13.0, 17.0, 24.0, 38.0, 35.0, 47.0, 58.0, 83.0, 158.0, 356.0, 1908.0, 102731.0, 934510.0, 7205.0, 588.0, 233.0, 115.0, 67.0, 58.0, 31.0, 31.0, 28.0, 25.0, 24.0, 14.0, 11.0, 16.0, 8.0, 11.0, 2.0, 8.0, 5.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.977264404296875, -1.90960693359375, -1.841949462890625, -1.7742919921875, -1.706634521484375, -1.63897705078125, -1.571319580078125, -1.503662109375, -1.436004638671875, -1.36834716796875, -1.300689697265625, -1.2330322265625, -1.165374755859375, -1.09771728515625, -1.030059814453125, -0.96240234375, -0.894744873046875, -0.82708740234375, -0.759429931640625, -0.6917724609375, -0.624114990234375, -0.55645751953125, -0.488800048828125, -0.421142578125, -0.353485107421875, -0.28582763671875, -0.218170166015625, -0.1505126953125, -0.082855224609375, -0.01519775390625, 0.052459716796875, 0.1201171875, 0.187774658203125, 0.25543212890625, 0.323089599609375, 0.3907470703125, 0.458404541015625, 0.52606201171875, 0.593719482421875, 0.661376953125, 0.729034423828125, 0.79669189453125, 0.864349365234375, 0.9320068359375, 0.999664306640625, 1.06732177734375, 1.134979248046875, 1.20263671875, 1.270294189453125, 1.33795166015625, 1.405609130859375, 1.4732666015625, 1.540924072265625, 1.60858154296875, 1.676239013671875, 1.743896484375, 1.811553955078125, 1.87921142578125, 1.946868896484375, 2.0145263671875, 2.082183837890625, 2.14984130859375, 2.217498779296875, 2.28515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 0.0, 4.0, 4.0, 8.0, 7.0, 2.0, 7.0, 8.0, 15.0, 16.0, 19.0, 25.0, 18.0, 33.0, 31.0, 45.0, 35.0, 42.0, 31.0, 35.0, 56.0, 49.0, 50.0, 48.0, 50.0, 31.0, 47.0, 38.0, 33.0, 31.0, 26.0, 23.0, 21.0, 27.0, 21.0, 12.0, 4.0, 11.0, 9.0, 9.0, 4.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.56829833984375, -0.5457763671875, -0.52325439453125, -0.500732421875, -0.47821044921875, -0.4556884765625, -0.43316650390625, -0.41064453125, -0.38812255859375, -0.3656005859375, -0.34307861328125, -0.320556640625, -0.29803466796875, -0.2755126953125, -0.25299072265625, -0.23046875, -0.20794677734375, -0.1854248046875, -0.16290283203125, -0.140380859375, -0.11785888671875, -0.0953369140625, -0.07281494140625, -0.05029296875, -0.02777099609375, -0.0052490234375, 0.01727294921875, 0.039794921875, 0.06231689453125, 0.0848388671875, 0.10736083984375, 0.1298828125, 0.15240478515625, 0.1749267578125, 0.19744873046875, 0.219970703125, 0.24249267578125, 0.2650146484375, 0.28753662109375, 0.31005859375, 0.33258056640625, 0.3551025390625, 0.37762451171875, 0.400146484375, 0.42266845703125, 0.4451904296875, 0.46771240234375, 0.490234375, 0.51275634765625, 0.5352783203125, 0.55780029296875, 0.580322265625, 0.60284423828125, 0.6253662109375, 0.64788818359375, 0.67041015625, 0.69293212890625, 0.7154541015625, 0.73797607421875, 0.760498046875, 0.78302001953125, 0.8055419921875, 0.82806396484375, 0.8505859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 11.0, 11.0, 6.0, 22.0, 27.0, 40.0, 75.0, 153.0, 233.0, 566.0, 1494.0, 6152.0, 40330.0, 421303.0, 516974.0, 50753.0, 7358.0, 1833.0, 570.0, 253.0, 139.0, 76.0, 60.0, 21.0, 23.0, 13.0, 17.0, 14.0, 6.0, 2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.20017623901367188, -0.19393157958984375, -0.18768692016601562, -0.1814422607421875, -0.17519760131835938, -0.16895294189453125, -0.16270828247070312, -0.156463623046875, -0.15021896362304688, -0.14397430419921875, -0.13772964477539062, -0.1314849853515625, -0.12524032592773438, -0.11899566650390625, -0.11275100708007812, -0.10650634765625, -0.10026168823242188, -0.09401702880859375, -0.08777236938476562, -0.0815277099609375, -0.07528305053710938, -0.06903839111328125, -0.06279373168945312, -0.056549072265625, -0.050304412841796875, -0.04405975341796875, -0.037815093994140625, -0.0315704345703125, -0.025325775146484375, -0.01908111572265625, -0.012836456298828125, -0.006591796875, -0.000347137451171875, 0.00589752197265625, 0.012142181396484375, 0.0183868408203125, 0.024631500244140625, 0.03087615966796875, 0.037120819091796875, 0.043365478515625, 0.049610137939453125, 0.05585479736328125, 0.062099456787109375, 0.0683441162109375, 0.07458877563476562, 0.08083343505859375, 0.08707809448242188, 0.09332275390625, 0.09956741333007812, 0.10581207275390625, 0.11205673217773438, 0.1183013916015625, 0.12454605102539062, 0.13079071044921875, 0.13703536987304688, 0.143280029296875, 0.14952468872070312, 0.15576934814453125, 0.16201400756835938, 0.1682586669921875, 0.17450332641601562, 0.18074798583984375, 0.18699264526367188, 0.1932373046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 3.0, 7.0, 13.0, 18.0, 13.0, 32.0, 25.0, 35.0, 63.0, 58.0, 76.0, 90.0, 87.0, 93.0, 75.0, 65.0, 55.0, 44.0, 38.0, 26.0, 10.0, 13.0, 14.0, 7.0, 10.0, 2.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6178004443645477e-05, -1.55474990606308e-05, -1.491699367761612e-05, -1.428648829460144e-05, -1.3655982911586761e-05, -1.3025477528572083e-05, -1.2394972145557404e-05, -1.1764466762542725e-05, -1.1133961379528046e-05, -1.0503455996513367e-05, -9.872950613498688e-06, -9.242445230484009e-06, -8.61193984746933e-06, -7.981434464454651e-06, -7.350929081439972e-06, -6.720423698425293e-06, -6.089918315410614e-06, -5.459412932395935e-06, -4.828907549381256e-06, -4.198402166366577e-06, -3.567896783351898e-06, -2.9373914003372192e-06, -2.3068860173225403e-06, -1.6763806343078613e-06, -1.0458752512931824e-06, -4.153698682785034e-07, 2.1513551473617554e-07, 8.456408977508545e-07, 1.4761462807655334e-06, 2.1066516637802124e-06, 2.7371570467948914e-06, 3.3676624298095703e-06, 3.998167812824249e-06, 4.628673195838928e-06, 5.259178578853607e-06, 5.889683961868286e-06, 6.520189344882965e-06, 7.150694727897644e-06, 7.781200110912323e-06, 8.411705493927002e-06, 9.042210876941681e-06, 9.67271625995636e-06, 1.0303221642971039e-05, 1.0933727025985718e-05, 1.1564232409000397e-05, 1.2194737792015076e-05, 1.2825243175029755e-05, 1.3455748558044434e-05, 1.4086253941059113e-05, 1.4716759324073792e-05, 1.534726470708847e-05, 1.597777009010315e-05, 1.660827547311783e-05, 1.7238780856132507e-05, 1.7869286239147186e-05, 1.8499791622161865e-05, 1.9130297005176544e-05, 1.9760802388191223e-05, 2.0391307771205902e-05, 2.102181315422058e-05, 2.165231853723526e-05, 2.228282392024994e-05, 2.2913329303264618e-05, 2.3543834686279297e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 0.0, 1.0, 3.0, 7.0, 13.0, 19.0, 30.0, 30.0, 54.0, 120.0, 213.0, 375.0, 844.0, 2124.0, 6845.0, 32125.0, 235833.0, 621913.0, 121637.0, 18707.0, 4674.0, 1550.0, 663.0, 353.0, 168.0, 84.0, 62.0, 23.0, 30.0, 13.0, 6.0, 9.0, 4.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1787109375, -0.1731853485107422, -0.16765975952148438, -0.16213417053222656, -0.15660858154296875, -0.15108299255371094, -0.14555740356445312, -0.1400318145751953, -0.1345062255859375, -0.1289806365966797, -0.12345504760742188, -0.11792945861816406, -0.11240386962890625, -0.10687828063964844, -0.10135269165039062, -0.09582710266113281, -0.090301513671875, -0.08477592468261719, -0.07925033569335938, -0.07372474670410156, -0.06819915771484375, -0.06267356872558594, -0.057147979736328125, -0.05162239074707031, -0.0460968017578125, -0.04057121276855469, -0.035045623779296875, -0.029520034790039062, -0.02399444580078125, -0.018468856811523438, -0.012943267822265625, -0.0074176788330078125, -0.00189208984375, 0.0036334991455078125, 0.009159088134765625, 0.014684677124023438, 0.02021026611328125, 0.025735855102539062, 0.031261444091796875, 0.03678703308105469, 0.0423126220703125, 0.04783821105957031, 0.053363800048828125, 0.05888938903808594, 0.06441497802734375, 0.06994056701660156, 0.07546615600585938, 0.08099174499511719, 0.086517333984375, 0.09204292297363281, 0.09756851196289062, 0.10309410095214844, 0.10861968994140625, 0.11414527893066406, 0.11967086791992188, 0.1251964569091797, 0.1307220458984375, 0.1362476348876953, 0.14177322387695312, 0.14729881286621094, 0.15282440185546875, 0.15834999084472656, 0.16387557983398438, 0.1694011688232422, 0.1749267578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 12.0, 2.0, 10.0, 11.0, 15.0, 16.0, 33.0, 34.0, 45.0, 70.0, 72.0, 91.0, 75.0, 80.0, 84.0, 69.0, 52.0, 61.0, 43.0, 28.0, 26.0, 13.0, 13.0, 7.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043853759765625, -0.042017459869384766, -0.04018115997314453, -0.0383448600769043, -0.03650856018066406, -0.03467226028442383, -0.032835960388183594, -0.03099966049194336, -0.029163360595703125, -0.02732706069946289, -0.025490760803222656, -0.023654460906982422, -0.021818161010742188, -0.019981861114501953, -0.01814556121826172, -0.016309261322021484, -0.01447296142578125, -0.012636661529541016, -0.010800361633300781, -0.008964061737060547, -0.0071277618408203125, -0.005291461944580078, -0.0034551620483398438, -0.0016188621520996094, 0.000217437744140625, 0.0020537376403808594, 0.0038900375366210938, 0.005726337432861328, 0.0075626373291015625, 0.009398937225341797, 0.011235237121582031, 0.013071537017822266, 0.0149078369140625, 0.016744136810302734, 0.01858043670654297, 0.020416736602783203, 0.022253036499023438, 0.024089336395263672, 0.025925636291503906, 0.02776193618774414, 0.029598236083984375, 0.03143453598022461, 0.033270835876464844, 0.03510713577270508, 0.03694343566894531, 0.03877973556518555, 0.04061603546142578, 0.042452335357666016, 0.04428863525390625, 0.046124935150146484, 0.04796123504638672, 0.04979753494262695, 0.05163383483886719, 0.05347013473510742, 0.055306434631347656, 0.05714273452758789, 0.058979034423828125, 0.06081533432006836, 0.0626516342163086, 0.06448793411254883, 0.06632423400878906, 0.0681605339050293, 0.06999683380126953, 0.07183313369750977, 0.07366943359375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 17.0, 68.0, 283.0, 443.0, 158.0, 37.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.233718752861023, -1.0636543035507202, -0.8935897350311279, -0.7235252857208252, -0.5534607768058777, -0.3833962678909302, -0.21333181858062744, -0.043267250061035156, 0.12679719924926758, 0.2968617081642151, 0.4669261872768402, 0.6369906663894653, 0.8070551753044128, 0.9771196842193604, 1.147184133529663, 1.3172487020492554, 1.487313151359558, 1.6573776006698608, 1.8274421691894531, 1.9975066184997559, 2.1675710678100586, 2.3376355171203613, 2.507699966430664, 2.677764654159546, 2.8478291034698486, 3.0178935527801514, 3.187958002090454, 3.358022689819336, 3.5280871391296387, 3.6981515884399414, 3.868216037750244, 4.038280487060547, 4.20834493637085, 4.378409385681152, 4.548473834991455, 4.718538284301758, 4.8886027336120605, 5.058667182922363, 5.228732109069824, 5.398796558380127, 5.56886100769043, 5.738925457000732, 5.908989906311035, 6.079054355621338, 6.249118804931641, 6.419183731079102, 6.589247703552246, 6.759312629699707, 6.929376602172852, 7.099441051483154, 7.269505500793457, 7.43956995010376, 7.6096343994140625, 7.779699325561523, 7.949763298034668, 8.119828224182129, 8.28989315032959, 8.45995807647705, 8.630022048950195, 8.800086975097656, 8.9701509475708, 9.140215873718262, 9.310279846191406, 9.480344772338867, 9.650408744812012]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 4.0, 13.0, 8.0, 15.0, 8.0, 15.0, 20.0, 15.0, 17.0, 18.0, 21.0, 26.0, 34.0, 32.0, 34.0, 49.0, 41.0, 42.0, 50.0, 52.0, 34.0, 40.0, 50.0, 43.0, 37.0, 32.0, 31.0, 29.0, 21.0, 29.0, 18.0, 23.0, 18.0, 16.0, 17.0, 7.0, 5.0, 7.0, 3.0, 5.0, 8.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1883381605148315, -1.1523001194000244, -1.1162620782852173, -1.0802240371704102, -1.044185996055603, -1.008147954940796, -0.9721099138259888, -0.9360718727111816, -0.9000338315963745, -0.8639957904815674, -0.8279577493667603, -0.7919197082519531, -0.755881667137146, -0.7198436260223389, -0.6838055849075317, -0.6477675437927246, -0.6117295026779175, -0.5756914615631104, -0.5396534204483032, -0.5036153793334961, -0.46757733821868896, -0.43153929710388184, -0.3955012559890747, -0.3594632148742676, -0.32342517375946045, -0.2873871326446533, -0.2513490915298462, -0.21531105041503906, -0.17927300930023193, -0.1432349681854248, -0.10719692707061768, -0.07115888595581055, -0.03512084484100342, 0.0009171962738037109, 0.03695523738861084, 0.07299327850341797, 0.1090313196182251, 0.14506936073303223, 0.18110740184783936, 0.21714544296264648, 0.2531834840774536, 0.28922152519226074, 0.32525956630706787, 0.361297607421875, 0.39733564853668213, 0.43337368965148926, 0.4694117307662964, 0.5054497718811035, 0.5414878129959106, 0.5775258541107178, 0.6135638952255249, 0.649601936340332, 0.6856399774551392, 0.7216780185699463, 0.7577160596847534, 0.7937541007995605, 0.8297921419143677, 0.8658301830291748, 0.9018682241439819, 0.9379062652587891, 0.9739443063735962, 1.0099823474884033, 1.0460203886032104, 1.0820584297180176, 1.1180964708328247]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 14.0, 8.0, 27.0, 39.0, 59.0, 118.0, 196.0, 382.0, 733.0, 1719.0, 4458.0, 15463.0, 76874.0, 580417.0, 2328468.0, 1015790.0, 136126.0, 23294.0, 6122.0, 2162.0, 874.0, 404.0, 247.0, 133.0, 64.0, 39.0, 22.0, 15.0, 10.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.958984375, -0.9335098266601562, -0.9080352783203125, -0.8825607299804688, -0.857086181640625, -0.8316116333007812, -0.8061370849609375, -0.7806625366210938, -0.75518798828125, -0.7297134399414062, -0.7042388916015625, -0.6787643432617188, -0.653289794921875, -0.6278152465820312, -0.6023406982421875, -0.5768661499023438, -0.5513916015625, -0.5259170532226562, -0.5004425048828125, -0.47496795654296875, -0.449493408203125, -0.42401885986328125, -0.3985443115234375, -0.37306976318359375, -0.34759521484375, -0.32212066650390625, -0.2966461181640625, -0.27117156982421875, -0.245697021484375, -0.22022247314453125, -0.1947479248046875, -0.16927337646484375, -0.143798828125, -0.11832427978515625, -0.0928497314453125, -0.06737518310546875, -0.041900634765625, -0.01642608642578125, 0.0090484619140625, 0.03452301025390625, 0.05999755859375, 0.08547210693359375, 0.1109466552734375, 0.13642120361328125, 0.161895751953125, 0.18737030029296875, 0.2128448486328125, 0.23831939697265625, 0.2637939453125, 0.28926849365234375, 0.3147430419921875, 0.34021759033203125, 0.365692138671875, 0.39116668701171875, 0.4166412353515625, 0.44211578369140625, 0.46759033203125, 0.49306488037109375, 0.5185394287109375, 0.5440139770507812, 0.569488525390625, 0.5949630737304688, 0.6204376220703125, 0.6459121704101562, 0.67138671875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 9.0, 11.0, 14.0, 16.0, 19.0, 26.0, 29.0, 44.0, 33.0, 46.0, 62.0, 57.0, 55.0, 69.0, 59.0, 60.0, 70.0, 50.0, 39.0, 40.0, 33.0, 31.0, 32.0, 25.0, 20.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6259765625, -0.6056747436523438, -0.5853729248046875, -0.5650711059570312, -0.544769287109375, -0.5244674682617188, -0.5041656494140625, -0.48386383056640625, -0.46356201171875, -0.44326019287109375, -0.4229583740234375, -0.40265655517578125, -0.382354736328125, -0.36205291748046875, -0.3417510986328125, -0.32144927978515625, -0.3011474609375, -0.28084564208984375, -0.2605438232421875, -0.24024200439453125, -0.219940185546875, -0.19963836669921875, -0.1793365478515625, -0.15903472900390625, -0.13873291015625, -0.11843109130859375, -0.0981292724609375, -0.07782745361328125, -0.057525634765625, -0.03722381591796875, -0.0169219970703125, 0.00337982177734375, 0.023681640625, 0.04398345947265625, 0.0642852783203125, 0.08458709716796875, 0.104888916015625, 0.12519073486328125, 0.1454925537109375, 0.16579437255859375, 0.18609619140625, 0.20639801025390625, 0.2266998291015625, 0.24700164794921875, 0.267303466796875, 0.28760528564453125, 0.3079071044921875, 0.32820892333984375, 0.3485107421875, 0.36881256103515625, 0.3891143798828125, 0.40941619873046875, 0.429718017578125, 0.45001983642578125, 0.4703216552734375, 0.49062347412109375, 0.51092529296875, 0.5312271118164062, 0.5515289306640625, 0.5718307495117188, 0.592132568359375, 0.6124343872070312, 0.6327362060546875, 0.6530380249023438, 0.67333984375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 3.0, 9.0, 12.0, 7.0, 18.0, 25.0, 35.0, 35.0, 54.0, 83.0, 152.0, 363.0, 2123.0, 177834.0, 4001585.0, 10610.0, 760.0, 214.0, 106.0, 74.0, 42.0, 33.0, 19.0, 19.0, 18.0, 8.0, 9.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.90625, -2.81884765625, -2.7314453125, -2.64404296875, -2.556640625, -2.46923828125, -2.3818359375, -2.29443359375, -2.20703125, -2.11962890625, -2.0322265625, -1.94482421875, -1.857421875, -1.77001953125, -1.6826171875, -1.59521484375, -1.5078125, -1.42041015625, -1.3330078125, -1.24560546875, -1.158203125, -1.07080078125, -0.9833984375, -0.89599609375, -0.80859375, -0.72119140625, -0.6337890625, -0.54638671875, -0.458984375, -0.37158203125, -0.2841796875, -0.19677734375, -0.109375, -0.02197265625, 0.0654296875, 0.15283203125, 0.240234375, 0.32763671875, 0.4150390625, 0.50244140625, 0.58984375, 0.67724609375, 0.7646484375, 0.85205078125, 0.939453125, 1.02685546875, 1.1142578125, 1.20166015625, 1.2890625, 1.37646484375, 1.4638671875, 1.55126953125, 1.638671875, 1.72607421875, 1.8134765625, 1.90087890625, 1.98828125, 2.07568359375, 2.1630859375, 2.25048828125, 2.337890625, 2.42529296875, 2.5126953125, 2.60009765625, 2.6875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 0.0, 8.0, 7.0, 8.0, 12.0, 17.0, 31.0, 36.0, 47.0, 70.0, 118.0, 133.0, 236.0, 297.0, 423.0, 534.0, 486.0, 465.0, 348.0, 247.0, 174.0, 124.0, 67.0, 59.0, 34.0, 27.0, 11.0, 8.0, 11.0, 8.0, 5.0, 9.0, 3.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.2257232666015625, -0.218902587890625, -0.2120819091796875, -0.20526123046875, -0.1984405517578125, -0.191619873046875, -0.1847991943359375, -0.177978515625, -0.1711578369140625, -0.164337158203125, -0.1575164794921875, -0.15069580078125, -0.1438751220703125, -0.137054443359375, -0.1302337646484375, -0.1234130859375, -0.1165924072265625, -0.109771728515625, -0.1029510498046875, -0.09613037109375, -0.0893096923828125, -0.082489013671875, -0.0756683349609375, -0.06884765625, -0.0620269775390625, -0.055206298828125, -0.0483856201171875, -0.04156494140625, -0.0347442626953125, -0.027923583984375, -0.0211029052734375, -0.0142822265625, -0.0074615478515625, -0.000640869140625, 0.0061798095703125, 0.01300048828125, 0.0198211669921875, 0.026641845703125, 0.0334625244140625, 0.040283203125, 0.0471038818359375, 0.053924560546875, 0.0607452392578125, 0.06756591796875, 0.0743865966796875, 0.081207275390625, 0.0880279541015625, 0.0948486328125, 0.1016693115234375, 0.108489990234375, 0.1153106689453125, 0.12213134765625, 0.1289520263671875, 0.135772705078125, 0.1425933837890625, 0.1494140625, 0.1562347412109375, 0.163055419921875, 0.1698760986328125, 0.17669677734375, 0.1835174560546875, 0.190338134765625, 0.1971588134765625, 0.2039794921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 10.0, 11.0, 28.0, 36.0, 45.0, 64.0, 80.0, 101.0, 115.0, 122.0, 119.0, 83.0, 54.0, 45.0, 28.0, 29.0, 13.0, 11.0, 1.0, 2.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1090688705444336, -1.0733213424682617, -1.0375738143920898, -1.001826286315918, -0.9660787582397461, -0.9303312301635742, -0.8945836424827576, -0.8588361144065857, -0.8230885863304138, -0.7873410582542419, -0.7515935301780701, -0.7158460021018982, -0.6800984144210815, -0.6443508863449097, -0.6086033582687378, -0.5728558301925659, -0.537108302116394, -0.5013607740402222, -0.4656132459640503, -0.42986568808555603, -0.39411816000938416, -0.3583706319332123, -0.322623074054718, -0.28687554597854614, -0.25112801790237427, -0.2153804898262024, -0.17963294684886932, -0.14388540387153625, -0.10813787579536438, -0.0723903477191925, -0.036642804741859436, -0.0008952617645263672, 0.03485226631164551, 0.07059980183839798, 0.10634733736515045, 0.14209488034248352, 0.1778424084186554, 0.21358993649482727, 0.24933747947216034, 0.2850850224494934, 0.3208325505256653, 0.35658007860183716, 0.39232760667800903, 0.4280751645565033, 0.46382269263267517, 0.49957022070884705, 0.5353177785873413, 0.5710653066635132, 0.6068128347396851, 0.6425603628158569, 0.6783078908920288, 0.7140554189682007, 0.7498029470443726, 0.7855504751205444, 0.8212980628013611, 0.857045590877533, 0.8927931189537048, 0.9285406470298767, 0.9642881751060486, 1.0000357627868652, 1.035783290863037, 1.071530818939209, 1.1072783470153809, 1.1430258750915527, 1.1787734031677246]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 14.0, 13.0, 10.0, 16.0, 16.0, 19.0, 30.0, 26.0, 47.0, 31.0, 32.0, 43.0, 41.0, 55.0, 58.0, 43.0, 58.0, 38.0, 50.0, 59.0, 42.0, 29.0, 25.0, 30.0, 24.0, 18.0, 37.0, 16.0, 18.0, 13.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6355324983596802, -0.6174811720848083, -0.5994298458099365, -0.5813785791397095, -0.5633272528648376, -0.5452759265899658, -0.5272246599197388, -0.5091733336448669, -0.4911220073699951, -0.4730706810951233, -0.45501938462257385, -0.4369680881500244, -0.4189167618751526, -0.40086543560028076, -0.3828141391277313, -0.3647628426551819, -0.34671151638031006, -0.32866019010543823, -0.3106088936328888, -0.29255759716033936, -0.27450627088546753, -0.2564549446105957, -0.23840364813804626, -0.22035233676433563, -0.202301025390625, -0.18424971401691437, -0.16619840264320374, -0.1481470912694931, -0.13009577989578247, -0.11204446852207184, -0.0939931571483612, -0.07594184577465057, -0.057890474796295166, -0.039839163422584534, -0.0217878520488739, -0.003736540675163269, 0.014314770698547363, 0.032366082072257996, 0.05041739344596863, 0.06846870481967926, 0.08652001619338989, 0.10457132756710052, 0.12262263894081116, 0.1406739503145218, 0.15872526168823242, 0.17677657306194305, 0.1948278844356537, 0.21287919580936432, 0.23093050718307495, 0.24898181855678558, 0.2670331299304962, 0.28508442640304565, 0.3031357526779175, 0.3211870789527893, 0.33923837542533875, 0.3572896718978882, 0.37534099817276, 0.39339232444763184, 0.4114436209201813, 0.4294949173927307, 0.44754624366760254, 0.46559756994247437, 0.4836488664150238, 0.5017001628875732, 0.5197514891624451]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 11.0, 6.0, 24.0, 19.0, 27.0, 34.0, 60.0, 63.0, 116.0, 197.0, 341.0, 546.0, 1174.0, 2585.0, 6449.0, 18416.0, 65016.0, 257636.0, 462787.0, 168062.0, 43021.0, 13057.0, 4752.0, 1970.0, 951.0, 470.0, 260.0, 141.0, 125.0, 67.0, 54.0, 30.0, 25.0, 22.0, 8.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 3.0, 3.0, 5.0, 1.0], "bins": [-0.1885986328125, -0.1835479736328125, -0.178497314453125, -0.1734466552734375, -0.16839599609375, -0.1633453369140625, -0.158294677734375, -0.1532440185546875, -0.148193359375, -0.1431427001953125, -0.138092041015625, -0.1330413818359375, -0.12799072265625, -0.1229400634765625, -0.117889404296875, -0.1128387451171875, -0.1077880859375, -0.1027374267578125, -0.097686767578125, -0.0926361083984375, -0.08758544921875, -0.0825347900390625, -0.077484130859375, -0.0724334716796875, -0.0673828125, -0.0623321533203125, -0.057281494140625, -0.0522308349609375, -0.04718017578125, -0.0421295166015625, -0.037078857421875, -0.0320281982421875, -0.0269775390625, -0.0219268798828125, -0.016876220703125, -0.0118255615234375, -0.00677490234375, -0.0017242431640625, 0.003326416015625, 0.0083770751953125, 0.013427734375, 0.0184783935546875, 0.023529052734375, 0.0285797119140625, 0.03363037109375, 0.0386810302734375, 0.043731689453125, 0.0487823486328125, 0.0538330078125, 0.0588836669921875, 0.063934326171875, 0.0689849853515625, 0.07403564453125, 0.0790863037109375, 0.084136962890625, 0.0891876220703125, 0.09423828125, 0.0992889404296875, 0.104339599609375, 0.1093902587890625, 0.11444091796875, 0.1194915771484375, 0.124542236328125, 0.1295928955078125, 0.1346435546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 9.0, 12.0, 14.0, 16.0, 25.0, 22.0, 24.0, 33.0, 33.0, 37.0, 56.0, 43.0, 62.0, 50.0, 52.0, 65.0, 46.0, 67.0, 50.0, 42.0, 39.0, 33.0, 30.0, 28.0, 27.0, 23.0, 9.0, 9.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.38916015625, -0.3768501281738281, -0.36454010009765625, -0.3522300720214844, -0.3399200439453125, -0.3276100158691406, -0.31529998779296875, -0.3029899597167969, -0.290679931640625, -0.2783699035644531, -0.26605987548828125, -0.2537498474121094, -0.2414398193359375, -0.22912979125976562, -0.21681976318359375, -0.20450973510742188, -0.19219970703125, -0.17988967895507812, -0.16757965087890625, -0.15526962280273438, -0.1429595947265625, -0.13064956665039062, -0.11833953857421875, -0.10602951049804688, -0.093719482421875, -0.08140945434570312, -0.06909942626953125, -0.056789398193359375, -0.0444793701171875, -0.032169342041015625, -0.01985931396484375, -0.007549285888671875, 0.0047607421875, 0.017070770263671875, 0.02938079833984375, 0.041690826416015625, 0.0540008544921875, 0.06631088256835938, 0.07862091064453125, 0.09093093872070312, 0.103240966796875, 0.11555099487304688, 0.12786102294921875, 0.14017105102539062, 0.1524810791015625, 0.16479110717773438, 0.17710113525390625, 0.18941116333007812, 0.20172119140625, 0.21403121948242188, 0.22634124755859375, 0.23865127563476562, 0.2509613037109375, 0.2632713317871094, 0.27558135986328125, 0.2878913879394531, 0.300201416015625, 0.3125114440917969, 0.32482147216796875, 0.3371315002441406, 0.3494415283203125, 0.3617515563964844, 0.37406158447265625, 0.3863716125488281, 0.398681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 9.0, 6.0, 9.0, 12.0, 23.0, 22.0, 29.0, 39.0, 43.0, 95.0, 108.0, 143.0, 192.0, 380.0, 642.0, 1145.0, 2000.0, 4206.0, 8986.0, 21603.0, 56059.0, 150252.0, 314938.0, 285798.0, 122677.0, 45729.0, 17854.0, 7539.0, 3578.0, 1806.0, 993.0, 556.0, 341.0, 213.0, 145.0, 98.0, 71.0, 63.0, 28.0, 32.0, 23.0, 14.0, 10.0, 9.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.11444091796875, -0.11085319519042969, -0.10726547241210938, -0.10367774963378906, -0.10009002685546875, -0.09650230407714844, -0.09291458129882812, -0.08932685852050781, -0.0857391357421875, -0.08215141296386719, -0.07856369018554688, -0.07497596740722656, -0.07138824462890625, -0.06780052185058594, -0.06421279907226562, -0.06062507629394531, -0.057037353515625, -0.05344963073730469, -0.049861907958984375, -0.04627418518066406, -0.04268646240234375, -0.03909873962402344, -0.035511016845703125, -0.03192329406738281, -0.0283355712890625, -0.024747848510742188, -0.021160125732421875, -0.017572402954101562, -0.01398468017578125, -0.010396957397460938, -0.006809234619140625, -0.0032215118408203125, 0.0003662109375, 0.0039539337158203125, 0.007541656494140625, 0.011129379272460938, 0.01471710205078125, 0.018304824829101562, 0.021892547607421875, 0.025480270385742188, 0.0290679931640625, 0.03265571594238281, 0.036243438720703125, 0.03983116149902344, 0.04341888427734375, 0.04700660705566406, 0.050594329833984375, 0.05418205261230469, 0.057769775390625, 0.06135749816894531, 0.06494522094726562, 0.06853294372558594, 0.07212066650390625, 0.07570838928222656, 0.07929611206054688, 0.08288383483886719, 0.0864715576171875, 0.09005928039550781, 0.09364700317382812, 0.09723472595214844, 0.10082244873046875, 0.10441017150878906, 0.10799789428710938, 0.11158561706542969, 0.11517333984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 5.0, 9.0, 7.0, 14.0, 14.0, 22.0, 19.0, 21.0, 25.0, 28.0, 42.0, 40.0, 38.0, 47.0, 45.0, 37.0, 50.0, 53.0, 50.0, 48.0, 47.0, 42.0, 35.0, 39.0, 28.0, 27.0, 24.0, 23.0, 24.0, 9.0, 12.0, 18.0, 6.0, 12.0, 3.0, 12.0, 7.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.630859375, -0.6099090576171875, -0.588958740234375, -0.5680084228515625, -0.54705810546875, -0.5261077880859375, -0.505157470703125, -0.4842071533203125, -0.4632568359375, -0.4423065185546875, -0.421356201171875, -0.4004058837890625, -0.37945556640625, -0.3585052490234375, -0.337554931640625, -0.3166046142578125, -0.295654296875, -0.2747039794921875, -0.253753662109375, -0.2328033447265625, -0.21185302734375, -0.1909027099609375, -0.169952392578125, -0.1490020751953125, -0.1280517578125, -0.1071014404296875, -0.086151123046875, -0.0652008056640625, -0.04425048828125, -0.0233001708984375, -0.002349853515625, 0.0186004638671875, 0.03955078125, 0.0605010986328125, 0.081451416015625, 0.1024017333984375, 0.12335205078125, 0.1443023681640625, 0.165252685546875, 0.1862030029296875, 0.2071533203125, 0.2281036376953125, 0.249053955078125, 0.2700042724609375, 0.29095458984375, 0.3119049072265625, 0.332855224609375, 0.3538055419921875, 0.374755859375, 0.3957061767578125, 0.416656494140625, 0.4376068115234375, 0.45855712890625, 0.4795074462890625, 0.500457763671875, 0.5214080810546875, 0.5423583984375, 0.5633087158203125, 0.584259033203125, 0.6052093505859375, 0.62615966796875, 0.6471099853515625, 0.668060302734375, 0.6890106201171875, 0.7099609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 11.0, 9.0, 13.0, 27.0, 43.0, 57.0, 94.0, 166.0, 424.0, 910.0, 2366.0, 7639.0, 38418.0, 319165.0, 576528.0, 82924.0, 13562.0, 3761.0, 1291.0, 537.0, 284.0, 124.0, 73.0, 51.0, 19.0, 16.0, 16.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.06475162506103516, -0.06218147277832031, -0.05961132049560547, -0.057041168212890625, -0.05447101593017578, -0.05190086364746094, -0.049330711364746094, -0.04676055908203125, -0.044190406799316406, -0.04162025451660156, -0.03905010223388672, -0.036479949951171875, -0.03390979766845703, -0.03133964538574219, -0.028769493103027344, -0.0261993408203125, -0.023629188537597656, -0.021059036254882812, -0.01848888397216797, -0.015918731689453125, -0.013348579406738281, -0.010778427124023438, -0.008208274841308594, -0.00563812255859375, -0.0030679702758789062, -0.0004978179931640625, 0.0020723342895507812, 0.004642486572265625, 0.007212638854980469, 0.009782791137695312, 0.012352943420410156, 0.014923095703125, 0.017493247985839844, 0.020063400268554688, 0.02263355255126953, 0.025203704833984375, 0.02777385711669922, 0.030344009399414062, 0.032914161682128906, 0.03548431396484375, 0.038054466247558594, 0.04062461853027344, 0.04319477081298828, 0.045764923095703125, 0.04833507537841797, 0.05090522766113281, 0.053475379943847656, 0.0560455322265625, 0.058615684509277344, 0.06118583679199219, 0.06375598907470703, 0.06632614135742188, 0.06889629364013672, 0.07146644592285156, 0.0740365982055664, 0.07660675048828125, 0.0791769027709961, 0.08174705505371094, 0.08431720733642578, 0.08688735961914062, 0.08945751190185547, 0.09202766418457031, 0.09459781646728516, 0.09716796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 10.0, 32.0, 22.0, 66.0, 85.0, 131.0, 148.0, 151.0, 128.0, 90.0, 56.0, 35.0, 13.0, 9.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8312206268310547e-05, -2.7070753276348114e-05, -2.582930028438568e-05, -2.4587847292423248e-05, -2.3346394300460815e-05, -2.2104941308498383e-05, -2.086348831653595e-05, -1.9622035324573517e-05, -1.8380582332611084e-05, -1.713912934064865e-05, -1.5897676348686218e-05, -1.4656223356723785e-05, -1.3414770364761353e-05, -1.217331737279892e-05, -1.0931864380836487e-05, -9.690411388874054e-06, -8.448958396911621e-06, -7.207505404949188e-06, -5.966052412986755e-06, -4.7245994210243225e-06, -3.4831464290618896e-06, -2.2416934370994568e-06, -1.000240445137024e-06, 2.4121254682540894e-07, 1.4826655387878418e-06, 2.7241185307502747e-06, 3.9655715227127075e-06, 5.20702451467514e-06, 6.448477506637573e-06, 7.689930498600006e-06, 8.931383490562439e-06, 1.0172836482524872e-05, 1.1414289474487305e-05, 1.2655742466449738e-05, 1.389719545841217e-05, 1.5138648450374603e-05, 1.6380101442337036e-05, 1.762155443429947e-05, 1.8863007426261902e-05, 2.0104460418224335e-05, 2.1345913410186768e-05, 2.25873664021492e-05, 2.3828819394111633e-05, 2.5070272386074066e-05, 2.63117253780365e-05, 2.7553178369998932e-05, 2.8794631361961365e-05, 3.0036084353923798e-05, 3.127753734588623e-05, 3.251899033784866e-05, 3.3760443329811096e-05, 3.500189632177353e-05, 3.624334931373596e-05, 3.7484802305698395e-05, 3.872625529766083e-05, 3.996770828962326e-05, 4.120916128158569e-05, 4.2450614273548126e-05, 4.369206726551056e-05, 4.493352025747299e-05, 4.6174973249435425e-05, 4.741642624139786e-05, 4.865787923336029e-05, 4.9899332225322723e-05, 5.1140785217285156e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 10.0, 12.0, 13.0, 17.0, 29.0, 48.0, 72.0, 169.0, 522.0, 1940.0, 10482.0, 98870.0, 737147.0, 178802.0, 16495.0, 2764.0, 686.0, 208.0, 94.0, 44.0, 31.0, 23.0, 15.0, 9.0, 14.0, 4.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.107086181640625, -0.10369873046875, -0.100311279296875, -0.096923828125, -0.093536376953125, -0.09014892578125, -0.086761474609375, -0.0833740234375, -0.079986572265625, -0.07659912109375, -0.073211669921875, -0.06982421875, -0.066436767578125, -0.06304931640625, -0.059661865234375, -0.0562744140625, -0.052886962890625, -0.04949951171875, -0.046112060546875, -0.042724609375, -0.039337158203125, -0.03594970703125, -0.032562255859375, -0.0291748046875, -0.025787353515625, -0.02239990234375, -0.019012451171875, -0.015625, -0.012237548828125, -0.00885009765625, -0.005462646484375, -0.0020751953125, 0.001312255859375, 0.00469970703125, 0.008087158203125, 0.011474609375, 0.014862060546875, 0.01824951171875, 0.021636962890625, 0.0250244140625, 0.028411865234375, 0.03179931640625, 0.035186767578125, 0.03857421875, 0.041961669921875, 0.04534912109375, 0.048736572265625, 0.0521240234375, 0.055511474609375, 0.05889892578125, 0.062286376953125, 0.065673828125, 0.069061279296875, 0.07244873046875, 0.075836181640625, 0.0792236328125, 0.082611083984375, 0.08599853515625, 0.089385986328125, 0.0927734375, 0.096160888671875, 0.09954833984375, 0.102935791015625, 0.1063232421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 9.0, 16.0, 14.0, 10.0, 22.0, 22.0, 30.0, 41.0, 59.0, 85.0, 83.0, 98.0, 69.0, 100.0, 75.0, 60.0, 40.0, 36.0, 33.0, 15.0, 19.0, 12.0, 9.0, 5.0, 12.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.016845703125, -0.016368508338928223, -0.015891313552856445, -0.015414118766784668, -0.01493692398071289, -0.014459729194641113, -0.013982534408569336, -0.013505339622497559, -0.013028144836425781, -0.012550950050354004, -0.012073755264282227, -0.01159656047821045, -0.011119365692138672, -0.010642170906066895, -0.010164976119995117, -0.00968778133392334, -0.009210586547851562, -0.008733391761779785, -0.008256196975708008, -0.0077790021896362305, -0.007301807403564453, -0.006824612617492676, -0.0063474178314208984, -0.005870223045349121, -0.005393028259277344, -0.004915833473205566, -0.004438638687133789, -0.003961443901062012, -0.0034842491149902344, -0.003007054328918457, -0.0025298595428466797, -0.0020526647567749023, -0.001575469970703125, -0.0010982751846313477, -0.0006210803985595703, -0.00014388561248779297, 0.0003333091735839844, 0.0008105039596557617, 0.001287698745727539, 0.0017648935317993164, 0.0022420883178710938, 0.002719283103942871, 0.0031964778900146484, 0.0036736726760864258, 0.004150867462158203, 0.0046280622482299805, 0.005105257034301758, 0.005582451820373535, 0.0060596466064453125, 0.00653684139251709, 0.007014036178588867, 0.0074912309646606445, 0.007968425750732422, 0.0084456205368042, 0.008922815322875977, 0.009400010108947754, 0.009877204895019531, 0.010354399681091309, 0.010831594467163086, 0.011308789253234863, 0.01178598403930664, 0.012263178825378418, 0.012740373611450195, 0.013217568397521973, 0.01369476318359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 23.0, 34.0, 45.0, 82.0, 117.0, 133.0, 178.0, 138.0, 97.0, 55.0, 47.0, 18.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8470771908760071, -0.8199694156646729, -0.7928617000579834, -0.7657539248466492, -0.7386461496353149, -0.7115384340286255, -0.6844306588172913, -0.657322883605957, -0.6302151083946228, -0.6031073331832886, -0.5759996175765991, -0.5488918423652649, -0.5217840671539307, -0.4946763217449188, -0.467568576335907, -0.44046080112457275, -0.4133530557155609, -0.3862453103065491, -0.35913753509521484, -0.332029789686203, -0.3049220144748688, -0.27781426906585693, -0.2507064938545227, -0.22359874844551086, -0.19649098813533783, -0.1693832278251648, -0.14227546751499176, -0.11516771465539932, -0.08805995434522629, -0.06095220148563385, -0.033844441175460815, -0.006736680865287781, 0.020371079444885254, 0.04747883975505829, 0.07458660006523132, 0.10169435292482376, 0.1288021206855774, 0.15590986609458923, 0.18301762640476227, 0.2101253867149353, 0.23723314702510834, 0.26434090733528137, 0.2914486527442932, 0.31855642795562744, 0.3456641733646393, 0.3727719187736511, 0.39987969398498535, 0.4269874691963196, 0.4540952146053314, 0.48120296001434326, 0.5083107352256775, 0.5354185104370117, 0.5625262260437012, 0.5896340012550354, 0.6167417764663696, 0.6438494920730591, 0.6709572672843933, 0.6980650424957275, 0.725172758102417, 0.7522805333137512, 0.7793883085250854, 0.8064960241317749, 0.8336037993431091, 0.8607115745544434, 0.8878193497657776]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 8.0, 4.0, 6.0, 11.0, 16.0, 11.0, 16.0, 19.0, 23.0, 42.0, 37.0, 36.0, 46.0, 51.0, 64.0, 59.0, 67.0, 52.0, 60.0, 52.0, 64.0, 46.0, 28.0, 34.0, 32.0, 34.0, 22.0, 16.0, 20.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43540456891059875, -0.42257726192474365, -0.40974992513656616, -0.39692261815071106, -0.38409531116485596, -0.37126797437667847, -0.35844066739082336, -0.34561336040496826, -0.33278602361679077, -0.31995871663093567, -0.3071313798427582, -0.2943040728569031, -0.2814767360687256, -0.2686494290828705, -0.2558221220970154, -0.24299480020999908, -0.2301674783229828, -0.2173401564359665, -0.2045128345489502, -0.1916855275630951, -0.1788582056760788, -0.1660308837890625, -0.1532035768032074, -0.1403762549161911, -0.1275489330291748, -0.11472161114215851, -0.10189429670572281, -0.08906698226928711, -0.07623966038227081, -0.06341233849525452, -0.05058502405881882, -0.03775770962238312, -0.02493038773536682, -0.012103069573640823, 0.0007242485880851746, 0.013551566749811172, 0.02637888491153717, 0.03920620679855347, 0.052033521234989166, 0.06486083567142487, 0.07768815755844116, 0.09051547944545746, 0.10334279388189316, 0.11617010831832886, 0.12899743020534515, 0.14182475209236145, 0.15465205907821655, 0.16747938096523285, 0.18030670285224915, 0.19313402473926544, 0.20596134662628174, 0.21878865361213684, 0.23161597549915314, 0.24444329738616943, 0.25727060437202454, 0.27009791135787964, 0.28292524814605713, 0.29575255513191223, 0.3085798919200897, 0.3214071989059448, 0.3342345356941223, 0.3470618426799774, 0.3598891496658325, 0.37271648645401, 0.3855437934398651]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 10.0, 13.0, 22.0, 25.0, 52.0, 104.0, 293.0, 1597.0, 27950.0, 920093.0, 94645.0, 3000.0, 455.0, 135.0, 47.0, 33.0, 25.0, 12.0, 12.0, 7.0, 5.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.5420379638671875, -1.501068115234375, -1.4600982666015625, -1.41912841796875, -1.3781585693359375, -1.337188720703125, -1.2962188720703125, -1.2552490234375, -1.2142791748046875, -1.173309326171875, -1.1323394775390625, -1.09136962890625, -1.0503997802734375, -1.009429931640625, -0.9684600830078125, -0.927490234375, -0.8865203857421875, -0.845550537109375, -0.8045806884765625, -0.76361083984375, -0.7226409912109375, -0.681671142578125, -0.6407012939453125, -0.5997314453125, -0.5587615966796875, -0.517791748046875, -0.4768218994140625, -0.43585205078125, -0.3948822021484375, -0.353912353515625, -0.3129425048828125, -0.27197265625, -0.2310028076171875, -0.190032958984375, -0.1490631103515625, -0.10809326171875, -0.0671234130859375, -0.026153564453125, 0.0148162841796875, 0.0557861328125, 0.0967559814453125, 0.137725830078125, 0.1786956787109375, 0.21966552734375, 0.2606353759765625, 0.301605224609375, 0.3425750732421875, 0.383544921875, 0.4245147705078125, 0.465484619140625, 0.5064544677734375, 0.54742431640625, 0.5883941650390625, 0.629364013671875, 0.6703338623046875, 0.7113037109375, 0.7522735595703125, 0.793243408203125, 0.8342132568359375, 0.87518310546875, 0.9161529541015625, 0.957122802734375, 0.9980926513671875, 1.0390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 15.0, 14.0, 12.0, 31.0, 36.0, 54.0, 73.0, 56.0, 94.0, 93.0, 84.0, 94.0, 86.0, 62.0, 66.0, 42.0, 30.0, 25.0, 16.0, 13.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.865234375, -0.824432373046875, -0.78363037109375, -0.742828369140625, -0.7020263671875, -0.661224365234375, -0.62042236328125, -0.579620361328125, -0.538818359375, -0.498016357421875, -0.45721435546875, -0.416412353515625, -0.3756103515625, -0.334808349609375, -0.29400634765625, -0.253204345703125, -0.21240234375, -0.171600341796875, -0.13079833984375, -0.089996337890625, -0.0491943359375, -0.008392333984375, 0.03240966796875, 0.073211669921875, 0.114013671875, 0.154815673828125, 0.19561767578125, 0.236419677734375, 0.2772216796875, 0.318023681640625, 0.35882568359375, 0.399627685546875, 0.4404296875, 0.481231689453125, 0.52203369140625, 0.562835693359375, 0.6036376953125, 0.644439697265625, 0.68524169921875, 0.726043701171875, 0.766845703125, 0.807647705078125, 0.84844970703125, 0.889251708984375, 0.9300537109375, 0.970855712890625, 1.01165771484375, 1.052459716796875, 1.09326171875, 1.134063720703125, 1.17486572265625, 1.215667724609375, 1.2564697265625, 1.297271728515625, 1.33807373046875, 1.378875732421875, 1.419677734375, 1.460479736328125, 1.50128173828125, 1.542083740234375, 1.5828857421875, 1.623687744140625, 1.66448974609375, 1.705291748046875, 1.74609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 9.0, 6.0, 7.0, 11.0, 17.0, 23.0, 33.0, 28.0, 52.0, 37.0, 53.0, 65.0, 101.0, 125.0, 174.0, 196.0, 260.0, 656.0, 3467.0, 55705.0, 853158.0, 126564.0, 5595.0, 869.0, 320.0, 244.0, 153.0, 129.0, 115.0, 64.0, 55.0, 52.0, 38.0, 48.0, 33.0, 19.0, 15.0, 8.0, 9.0, 10.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8043746948242188, -0.7772064208984375, -0.7500381469726562, -0.722869873046875, -0.6957015991210938, -0.6685333251953125, -0.6413650512695312, -0.61419677734375, -0.5870285034179688, -0.5598602294921875, -0.5326919555664062, -0.505523681640625, -0.47835540771484375, -0.4511871337890625, -0.42401885986328125, -0.3968505859375, -0.36968231201171875, -0.3425140380859375, -0.31534576416015625, -0.288177490234375, -0.26100921630859375, -0.2338409423828125, -0.20667266845703125, -0.17950439453125, -0.15233612060546875, -0.1251678466796875, -0.09799957275390625, -0.070831298828125, -0.04366302490234375, -0.0164947509765625, 0.01067352294921875, 0.037841796875, 0.06501007080078125, 0.0921783447265625, 0.11934661865234375, 0.146514892578125, 0.17368316650390625, 0.2008514404296875, 0.22801971435546875, 0.25518798828125, 0.28235626220703125, 0.3095245361328125, 0.33669281005859375, 0.363861083984375, 0.39102935791015625, 0.4181976318359375, 0.44536590576171875, 0.4725341796875, 0.49970245361328125, 0.5268707275390625, 0.5540390014648438, 0.581207275390625, 0.6083755493164062, 0.6355438232421875, 0.6627120971679688, 0.68988037109375, 0.7170486450195312, 0.7442169189453125, 0.7713851928710938, 0.798553466796875, 0.8257217407226562, 0.8528900146484375, 0.8800582885742188, 0.9072265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 4.0, 11.0, 12.0, 10.0, 13.0, 17.0, 14.0, 12.0, 17.0, 24.0, 29.0, 37.0, 26.0, 29.0, 35.0, 44.0, 30.0, 53.0, 40.0, 41.0, 47.0, 36.0, 38.0, 35.0, 37.0, 31.0, 32.0, 25.0, 27.0, 26.0, 18.0, 22.0, 23.0, 25.0, 15.0, 7.0, 10.0, 6.0, 6.0, 8.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6298828125, -0.611358642578125, -0.59283447265625, -0.574310302734375, -0.5557861328125, -0.537261962890625, -0.51873779296875, -0.500213623046875, -0.481689453125, -0.463165283203125, -0.44464111328125, -0.426116943359375, -0.4075927734375, -0.389068603515625, -0.37054443359375, -0.352020263671875, -0.33349609375, -0.314971923828125, -0.29644775390625, -0.277923583984375, -0.2593994140625, -0.240875244140625, -0.22235107421875, -0.203826904296875, -0.185302734375, -0.166778564453125, -0.14825439453125, -0.129730224609375, -0.1112060546875, -0.092681884765625, -0.07415771484375, -0.055633544921875, -0.037109375, -0.018585205078125, -6.103515625e-05, 0.018463134765625, 0.0369873046875, 0.055511474609375, 0.07403564453125, 0.092559814453125, 0.111083984375, 0.129608154296875, 0.14813232421875, 0.166656494140625, 0.1851806640625, 0.203704833984375, 0.22222900390625, 0.240753173828125, 0.25927734375, 0.277801513671875, 0.29632568359375, 0.314849853515625, 0.3333740234375, 0.351898193359375, 0.37042236328125, 0.388946533203125, 0.407470703125, 0.425994873046875, 0.44451904296875, 0.463043212890625, 0.4815673828125, 0.500091552734375, 0.51861572265625, 0.537139892578125, 0.5556640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 15.0, 9.0, 20.0, 33.0, 53.0, 74.0, 144.0, 259.0, 776.0, 3599.0, 35012.0, 592743.0, 391031.0, 20995.0, 2572.0, 617.0, 254.0, 144.0, 64.0, 44.0, 27.0, 15.0, 13.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.22781753540039062, -0.22089385986328125, -0.21397018432617188, -0.2070465087890625, -0.20012283325195312, -0.19319915771484375, -0.18627548217773438, -0.179351806640625, -0.17242813110351562, -0.16550445556640625, -0.15858078002929688, -0.1516571044921875, -0.14473342895507812, -0.13780975341796875, -0.13088607788085938, -0.12396240234375, -0.11703872680664062, -0.11011505126953125, -0.10319137573242188, -0.0962677001953125, -0.08934402465820312, -0.08242034912109375, -0.07549667358398438, -0.068572998046875, -0.061649322509765625, -0.05472564697265625, -0.047801971435546875, -0.0408782958984375, -0.033954620361328125, -0.02703094482421875, -0.020107269287109375, -0.01318359375, -0.006259918212890625, 0.00066375732421875, 0.007587432861328125, 0.0145111083984375, 0.021434783935546875, 0.02835845947265625, 0.035282135009765625, 0.042205810546875, 0.049129486083984375, 0.05605316162109375, 0.06297683715820312, 0.0699005126953125, 0.07682418823242188, 0.08374786376953125, 0.09067153930664062, 0.09759521484375, 0.10451889038085938, 0.11144256591796875, 0.11836624145507812, 0.1252899169921875, 0.13221359252929688, 0.13913726806640625, 0.14606094360351562, 0.152984619140625, 0.15990829467773438, 0.16683197021484375, 0.17375564575195312, 0.1806793212890625, 0.18760299682617188, 0.19452667236328125, 0.20145034790039062, 0.2083740234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 8.0, 17.0, 7.0, 10.0, 17.0, 23.0, 21.0, 19.0, 29.0, 32.0, 41.0, 66.0, 63.0, 76.0, 64.0, 56.0, 72.0, 43.0, 64.0, 47.0, 31.0, 35.0, 30.0, 21.0, 23.0, 16.0, 9.0, 12.0, 9.0, 11.0, 6.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4841556549072266e-05, -1.4406628906726837e-05, -1.3971701264381409e-05, -1.353677362203598e-05, -1.3101845979690552e-05, -1.2666918337345123e-05, -1.2231990694999695e-05, -1.1797063052654266e-05, -1.1362135410308838e-05, -1.092720776796341e-05, -1.0492280125617981e-05, -1.0057352483272552e-05, -9.622424840927124e-06, -9.187497198581696e-06, -8.752569556236267e-06, -8.317641913890839e-06, -7.88271427154541e-06, -7.447786629199982e-06, -7.012858986854553e-06, -6.577931344509125e-06, -6.143003702163696e-06, -5.708076059818268e-06, -5.273148417472839e-06, -4.838220775127411e-06, -4.403293132781982e-06, -3.968365490436554e-06, -3.5334378480911255e-06, -3.098510205745697e-06, -2.6635825634002686e-06, -2.22865492105484e-06, -1.7937272787094116e-06, -1.3587996363639832e-06, -9.238719940185547e-07, -4.889443516731262e-07, -5.4016709327697754e-08, 3.809109330177307e-07, 8.158385753631592e-07, 1.2507662177085876e-06, 1.6856938600540161e-06, 2.1206215023994446e-06, 2.555549144744873e-06, 2.9904767870903015e-06, 3.42540442943573e-06, 3.8603320717811584e-06, 4.295259714126587e-06, 4.730187356472015e-06, 5.165114998817444e-06, 5.600042641162872e-06, 6.034970283508301e-06, 6.469897925853729e-06, 6.904825568199158e-06, 7.339753210544586e-06, 7.774680852890015e-06, 8.209608495235443e-06, 8.644536137580872e-06, 9.0794637799263e-06, 9.514391422271729e-06, 9.949319064617157e-06, 1.0384246706962585e-05, 1.0819174349308014e-05, 1.1254101991653442e-05, 1.1689029633998871e-05, 1.21239572763443e-05, 1.2558884918689728e-05, 1.2993812561035156e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 13.0, 14.0, 23.0, 25.0, 41.0, 62.0, 143.0, 338.0, 817.0, 2856.0, 16202.0, 243909.0, 721382.0, 54264.0, 6138.0, 1424.0, 484.0, 184.0, 100.0, 39.0, 33.0, 24.0, 13.0, 7.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24720382690429688, -0.23976898193359375, -0.23233413696289062, -0.2248992919921875, -0.21746444702148438, -0.21002960205078125, -0.20259475708007812, -0.195159912109375, -0.18772506713867188, -0.18029022216796875, -0.17285537719726562, -0.1654205322265625, -0.15798568725585938, -0.15055084228515625, -0.14311599731445312, -0.13568115234375, -0.12824630737304688, -0.12081146240234375, -0.11337661743164062, -0.1059417724609375, -0.09850692749023438, -0.09107208251953125, -0.08363723754882812, -0.076202392578125, -0.06876754760742188, -0.06133270263671875, -0.053897857666015625, -0.0464630126953125, -0.039028167724609375, -0.03159332275390625, -0.024158477783203125, -0.0167236328125, -0.009288787841796875, -0.00185394287109375, 0.005580902099609375, 0.0130157470703125, 0.020450592041015625, 0.02788543701171875, 0.035320281982421875, 0.042755126953125, 0.050189971923828125, 0.05762481689453125, 0.06505966186523438, 0.0724945068359375, 0.07992935180664062, 0.08736419677734375, 0.09479904174804688, 0.10223388671875, 0.10966873168945312, 0.11710357666015625, 0.12453842163085938, 0.1319732666015625, 0.13940811157226562, 0.14684295654296875, 0.15427780151367188, 0.161712646484375, 0.16914749145507812, 0.17658233642578125, 0.18401718139648438, 0.1914520263671875, 0.19888687133789062, 0.20632171630859375, 0.21375656127929688, 0.22119140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 10.0, 12.0, 14.0, 18.0, 17.0, 23.0, 37.0, 50.0, 60.0, 69.0, 82.0, 93.0, 82.0, 64.0, 79.0, 62.0, 52.0, 42.0, 29.0, 28.0, 17.0, 15.0, 4.0, 6.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0738525390625, -0.0718998908996582, -0.0699472427368164, -0.06799459457397461, -0.06604194641113281, -0.06408929824829102, -0.06213665008544922, -0.06018400192260742, -0.058231353759765625, -0.05627870559692383, -0.05432605743408203, -0.052373409271240234, -0.05042076110839844, -0.04846811294555664, -0.046515464782714844, -0.04456281661987305, -0.04261016845703125, -0.04065752029418945, -0.038704872131347656, -0.03675222396850586, -0.03479957580566406, -0.032846927642822266, -0.03089427947998047, -0.028941631317138672, -0.026988983154296875, -0.025036334991455078, -0.02308368682861328, -0.021131038665771484, -0.019178390502929688, -0.01722574234008789, -0.015273094177246094, -0.013320446014404297, -0.0113677978515625, -0.009415149688720703, -0.007462501525878906, -0.005509853363037109, -0.0035572052001953125, -0.0016045570373535156, 0.00034809112548828125, 0.002300739288330078, 0.004253387451171875, 0.006206035614013672, 0.008158683776855469, 0.010111331939697266, 0.012063980102539062, 0.01401662826538086, 0.015969276428222656, 0.017921924591064453, 0.01987457275390625, 0.021827220916748047, 0.023779869079589844, 0.02573251724243164, 0.027685165405273438, 0.029637813568115234, 0.03159046173095703, 0.03354310989379883, 0.035495758056640625, 0.03744840621948242, 0.03940105438232422, 0.041353702545166016, 0.04330635070800781, 0.04525899887084961, 0.047211647033691406, 0.0491642951965332, 0.051116943359375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 25.0, 47.0, 60.0, 105.0, 146.0, 183.0, 161.0, 122.0, 62.0, 44.0, 24.0, 9.0, 2.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.493903398513794, -1.433180809020996, -1.3724582195281982, -1.3117356300354004, -1.251012921333313, -1.1902903318405151, -1.1295677423477173, -1.0688451528549194, -1.0081225633621216, -0.9473999738693237, -0.8866773247718811, -0.8259547352790833, -0.7652321457862854, -0.7045094966888428, -0.6437869071960449, -0.5830643177032471, -0.5223416686058044, -0.4616190493106842, -0.40089645981788635, -0.3401738405227661, -0.27945125102996826, -0.21872863173484802, -0.15800601243972778, -0.09728342294692993, -0.03656080365180969, 0.02416180446743965, 0.084884412586689, 0.14560702443122864, 0.20632962882518768, 0.26705223321914673, 0.32777485251426697, 0.3884974420070648, 0.44922006130218506, 0.5099426507949829, 0.5706652998924255, 0.6313878893852234, 0.6921104788780212, 0.7528331279754639, 0.8135557174682617, 0.8742783069610596, 0.9350008964538574, 0.9957234859466553, 1.0564460754394531, 1.117168664932251, 1.1778913736343384, 1.2386139631271362, 1.299336552619934, 1.360059142112732, 1.4207818508148193, 1.4815044403076172, 1.542227029800415, 1.602949619293213, 1.6636723279953003, 1.7243949174880981, 1.785117506980896, 1.8458400964736938, 1.9065626859664917, 1.9672852754592896, 2.028007984161377, 2.088730573654175, 2.1494531631469727, 2.2101757526397705, 2.2708983421325684, 2.331620931625366, 2.392343521118164]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 0.0, 6.0, 6.0, 7.0, 12.0, 9.0, 9.0, 14.0, 21.0, 16.0, 20.0, 20.0, 31.0, 29.0, 26.0, 34.0, 26.0, 38.0, 45.0, 46.0, 45.0, 48.0, 36.0, 47.0, 41.0, 33.0, 41.0, 39.0, 35.0, 24.0, 32.0, 24.0, 26.0, 19.0, 27.0, 10.0, 7.0, 8.0, 12.0, 7.0, 4.0, 13.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2503734827041626, -1.2161850929260254, -1.1819968223571777, -1.14780855178833, -1.1136201620101929, -1.0794317722320557, -1.045243501663208, -1.0110552310943604, -0.9768668413162231, -0.9426785111427307, -0.9084901809692383, -0.8743018507957458, -0.8401135206222534, -0.805925190448761, -0.7717368602752686, -0.7375485301017761, -0.7033601999282837, -0.6691718697547913, -0.6349835395812988, -0.6007952094078064, -0.566606879234314, -0.5324185490608215, -0.4982302188873291, -0.46404188871383667, -0.42985355854034424, -0.3956652283668518, -0.3614768981933594, -0.32728856801986694, -0.2931002378463745, -0.2589119076728821, -0.22472357749938965, -0.19053524732589722, -0.15634703636169434, -0.1221587061882019, -0.08797037601470947, -0.05378204584121704, -0.01959371566772461, 0.014594614505767822, 0.048782944679260254, 0.08297127485275269, 0.11715960502624512, 0.15134793519973755, 0.18553626537322998, 0.2197245955467224, 0.25391292572021484, 0.2881012558937073, 0.3222895860671997, 0.35647791624069214, 0.39066624641418457, 0.424854576587677, 0.45904290676116943, 0.49323123693466187, 0.5274195671081543, 0.5616078972816467, 0.5957962274551392, 0.6299845576286316, 0.664172887802124, 0.6983612179756165, 0.7325495481491089, 0.7667378783226013, 0.8009262084960938, 0.8351145386695862, 0.8693028688430786, 0.903491199016571, 0.9376795291900635]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 6.0, 9.0, 12.0, 30.0, 39.0, 69.0, 94.0, 173.0, 320.0, 548.0, 1152.0, 2621.0, 8079.0, 37913.0, 335523.0, 2311756.0, 1326433.0, 141010.0, 19823.0, 5024.0, 1812.0, 870.0, 384.0, 237.0, 143.0, 64.0, 44.0, 42.0, 19.0, 19.0, 8.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6801910400390625, -0.654815673828125, -0.6294403076171875, -0.60406494140625, -0.5786895751953125, -0.553314208984375, -0.5279388427734375, -0.5025634765625, -0.4771881103515625, -0.451812744140625, -0.4264373779296875, -0.40106201171875, -0.3756866455078125, -0.350311279296875, -0.3249359130859375, -0.299560546875, -0.2741851806640625, -0.248809814453125, -0.2234344482421875, -0.19805908203125, -0.1726837158203125, -0.147308349609375, -0.1219329833984375, -0.0965576171875, -0.0711822509765625, -0.045806884765625, -0.0204315185546875, 0.00494384765625, 0.0303192138671875, 0.055694580078125, 0.0810699462890625, 0.1064453125, 0.1318206787109375, 0.157196044921875, 0.1825714111328125, 0.20794677734375, 0.2333221435546875, 0.258697509765625, 0.2840728759765625, 0.3094482421875, 0.3348236083984375, 0.360198974609375, 0.3855743408203125, 0.41094970703125, 0.4363250732421875, 0.461700439453125, 0.4870758056640625, 0.512451171875, 0.5378265380859375, 0.563201904296875, 0.5885772705078125, 0.61395263671875, 0.6393280029296875, 0.664703369140625, 0.6900787353515625, 0.7154541015625, 0.7408294677734375, 0.766204833984375, 0.7915802001953125, 0.81695556640625, 0.8423309326171875, 0.867706298828125, 0.8930816650390625, 0.91845703125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 6.0, 8.0, 8.0, 9.0, 11.0, 15.0, 27.0, 24.0, 22.0, 32.0, 32.0, 49.0, 53.0, 42.0, 52.0, 56.0, 54.0, 48.0, 51.0, 42.0, 43.0, 48.0, 40.0, 36.0, 32.0, 33.0, 20.0, 25.0, 11.0, 14.0, 7.0, 10.0, 12.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5615425109863281, -0.5454483032226562, -0.5293540954589844, -0.5132598876953125, -0.4971656799316406, -0.48107147216796875, -0.4649772644042969, -0.448883056640625, -0.4327888488769531, -0.41669464111328125, -0.4006004333496094, -0.3845062255859375, -0.3684120178222656, -0.35231781005859375, -0.3362236022949219, -0.32012939453125, -0.3040351867675781, -0.28794097900390625, -0.2718467712402344, -0.2557525634765625, -0.23965835571289062, -0.22356414794921875, -0.20746994018554688, -0.191375732421875, -0.17528152465820312, -0.15918731689453125, -0.14309310913085938, -0.1269989013671875, -0.11090469360351562, -0.09481048583984375, -0.07871627807617188, -0.0626220703125, -0.046527862548828125, -0.03043365478515625, -0.014339447021484375, 0.0017547607421875, 0.017848968505859375, 0.03394317626953125, 0.050037384033203125, 0.066131591796875, 0.08222579956054688, 0.09832000732421875, 0.11441421508789062, 0.1305084228515625, 0.14660263061523438, 0.16269683837890625, 0.17879104614257812, 0.19488525390625, 0.21097946166992188, 0.22707366943359375, 0.24316787719726562, 0.2592620849609375, 0.2753562927246094, 0.29145050048828125, 0.3075447082519531, 0.323638916015625, 0.3397331237792969, 0.35582733154296875, 0.3719215393066406, 0.3880157470703125, 0.4041099548339844, 0.42020416259765625, 0.4362983703613281, 0.452392578125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 6.0, 12.0, 25.0, 29.0, 65.0, 122.0, 224.0, 488.0, 1753.0, 15828.0, 3077991.0, 1086151.0, 9436.0, 1309.0, 433.0, 189.0, 83.0, 48.0, 34.0, 15.0, 14.0, 7.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -2.0053253173828125, -1.946197509765625, -1.8870697021484375, -1.82794189453125, -1.7688140869140625, -1.709686279296875, -1.6505584716796875, -1.5914306640625, -1.5323028564453125, -1.473175048828125, -1.4140472412109375, -1.35491943359375, -1.2957916259765625, -1.236663818359375, -1.1775360107421875, -1.118408203125, -1.0592803955078125, -1.000152587890625, -0.9410247802734375, -0.88189697265625, -0.8227691650390625, -0.763641357421875, -0.7045135498046875, -0.6453857421875, -0.5862579345703125, -0.527130126953125, -0.4680023193359375, -0.40887451171875, -0.3497467041015625, -0.290618896484375, -0.2314910888671875, -0.17236328125, -0.1132354736328125, -0.054107666015625, 0.0050201416015625, 0.06414794921875, 0.1232757568359375, 0.182403564453125, 0.2415313720703125, 0.3006591796875, 0.3597869873046875, 0.418914794921875, 0.4780426025390625, 0.53717041015625, 0.5962982177734375, 0.655426025390625, 0.7145538330078125, 0.773681640625, 0.8328094482421875, 0.891937255859375, 0.9510650634765625, 1.01019287109375, 1.0693206787109375, 1.128448486328125, 1.1875762939453125, 1.2467041015625, 1.3058319091796875, 1.364959716796875, 1.4240875244140625, 1.48321533203125, 1.5423431396484375, 1.601470947265625, 1.6605987548828125, 1.7197265625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 18.0, 9.0, 18.0, 27.0, 27.0, 56.0, 68.0, 123.0, 137.0, 208.0, 334.0, 408.0, 542.0, 509.0, 508.0, 312.0, 243.0, 146.0, 96.0, 68.0, 54.0, 47.0, 25.0, 23.0, 10.0, 14.0, 5.0, 5.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.18045997619628906, -0.17403030395507812, -0.1676006317138672, -0.16117095947265625, -0.1547412872314453, -0.14831161499023438, -0.14188194274902344, -0.1354522705078125, -0.12902259826660156, -0.12259292602539062, -0.11616325378417969, -0.10973358154296875, -0.10330390930175781, -0.09687423706054688, -0.09044456481933594, -0.084014892578125, -0.07758522033691406, -0.07115554809570312, -0.06472587585449219, -0.05829620361328125, -0.05186653137207031, -0.045436859130859375, -0.03900718688964844, -0.0325775146484375, -0.026147842407226562, -0.019718170166015625, -0.013288497924804688, -0.00685882568359375, -0.0004291534423828125, 0.006000518798828125, 0.012430191040039062, 0.01885986328125, 0.025289535522460938, 0.031719207763671875, 0.03814888000488281, 0.04457855224609375, 0.05100822448730469, 0.057437896728515625, 0.06386756896972656, 0.0702972412109375, 0.07672691345214844, 0.08315658569335938, 0.08958625793457031, 0.09601593017578125, 0.10244560241699219, 0.10887527465820312, 0.11530494689941406, 0.121734619140625, 0.12816429138183594, 0.13459396362304688, 0.1410236358642578, 0.14745330810546875, 0.1538829803466797, 0.16031265258789062, 0.16674232482910156, 0.1731719970703125, 0.17960166931152344, 0.18603134155273438, 0.1924610137939453, 0.19889068603515625, 0.2053203582763672, 0.21175003051757812, 0.21817970275878906, 0.224609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 28.0, 29.0, 42.0, 84.0, 101.0, 140.0, 141.0, 145.0, 110.0, 66.0, 40.0, 31.0, 16.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2180324792861938, -1.1779228448867798, -1.1378130912780762, -1.097703456878662, -1.057593822479248, -1.0174840688705444, -0.9773744344711304, -0.9372647404670715, -0.8971550464630127, -0.8570453524589539, -0.816935658454895, -0.776826024055481, -0.7367163300514221, -0.6966066360473633, -0.6564970016479492, -0.6163873076438904, -0.5762776136398315, -0.5361679196357727, -0.49605825543403625, -0.4559485912322998, -0.41583889722824097, -0.37572920322418213, -0.3356195390224457, -0.29550987482070923, -0.2554001808166504, -0.21529050171375275, -0.1751808226108551, -0.13507114350795746, -0.09496146440505981, -0.05485178530216217, -0.014742106199264526, 0.025367558002471924, 0.06547713279724121, 0.10558681190013885, 0.1456964910030365, 0.18580617010593414, 0.2259158492088318, 0.2660255432128906, 0.3061352074146271, 0.3462448716163635, 0.38635456562042236, 0.4264642596244812, 0.46657392382621765, 0.5066835880279541, 0.5467932820320129, 0.5869029760360718, 0.6270126104354858, 0.6671223044395447, 0.7072319984436035, 0.7473416924476624, 0.7874513864517212, 0.8275610208511353, 0.8676707148551941, 0.9077804088592529, 0.947890043258667, 0.9879997372627258, 1.0281094312667847, 1.0682190656661987, 1.1083288192749023, 1.1484384536743164, 1.1885480880737305, 1.228657841682434, 1.2687674760818481, 1.3088772296905518, 1.3489868640899658]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 3.0, 5.0, 6.0, 15.0, 16.0, 17.0, 14.0, 26.0, 25.0, 20.0, 31.0, 29.0, 39.0, 45.0, 43.0, 24.0, 39.0, 48.0, 32.0, 35.0, 52.0, 52.0, 45.0, 38.0, 33.0, 34.0, 27.0, 41.0, 20.0, 27.0, 18.0, 20.0, 14.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.5226255059242249, -0.5073807239532471, -0.4921358823776245, -0.47689107060432434, -0.46164625883102417, -0.446401447057724, -0.43115663528442383, -0.41591182351112366, -0.4006670117378235, -0.3854221999645233, -0.37017738819122314, -0.354932576417923, -0.3396877646446228, -0.32444295287132263, -0.30919814109802246, -0.2939533293247223, -0.2787085175514221, -0.26346370577812195, -0.24821889400482178, -0.2329740822315216, -0.21772927045822144, -0.20248445868492126, -0.1872396469116211, -0.17199483513832092, -0.15675002336502075, -0.14150521159172058, -0.1262603998184204, -0.11101558804512024, -0.09577077627182007, -0.0805259644985199, -0.06528115272521973, -0.050036340951919556, -0.03479155898094177, -0.0195467472076416, -0.004301935434341431, 0.01094287633895874, 0.02618768811225891, 0.04143249988555908, 0.05667731165885925, 0.07192212343215942, 0.0871669352054596, 0.10241174697875977, 0.11765655875205994, 0.1329013705253601, 0.14814618229866028, 0.16339099407196045, 0.17863580584526062, 0.1938806176185608, 0.20912542939186096, 0.22437024116516113, 0.2396150529384613, 0.2548598647117615, 0.27010467648506165, 0.2853494882583618, 0.300594300031662, 0.31583911180496216, 0.33108392357826233, 0.3463287353515625, 0.36157354712486267, 0.37681835889816284, 0.392063170671463, 0.4073079824447632, 0.42255279421806335, 0.4377976059913635, 0.4530424177646637]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 11.0, 21.0, 16.0, 43.0, 67.0, 149.0, 313.0, 650.0, 1472.0, 3542.0, 8990.0, 23964.0, 83845.0, 472235.0, 358114.0, 62776.0, 19649.0, 7422.0, 2911.0, 1196.0, 504.0, 293.0, 149.0, 67.0, 33.0, 31.0, 11.0, 10.0, 8.0, 2.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.196044921875, -0.19008636474609375, -0.1841278076171875, -0.17816925048828125, -0.172210693359375, -0.16625213623046875, -0.1602935791015625, -0.15433502197265625, -0.14837646484375, -0.14241790771484375, -0.1364593505859375, -0.13050079345703125, -0.124542236328125, -0.11858367919921875, -0.1126251220703125, -0.10666656494140625, -0.1007080078125, -0.09474945068359375, -0.0887908935546875, -0.08283233642578125, -0.076873779296875, -0.07091522216796875, -0.0649566650390625, -0.05899810791015625, -0.05303955078125, -0.04708099365234375, -0.0411224365234375, -0.03516387939453125, -0.029205322265625, -0.02324676513671875, -0.0172882080078125, -0.01132965087890625, -0.00537109375, 0.00058746337890625, 0.0065460205078125, 0.01250457763671875, 0.018463134765625, 0.02442169189453125, 0.0303802490234375, 0.03633880615234375, 0.04229736328125, 0.04825592041015625, 0.0542144775390625, 0.06017303466796875, 0.066131591796875, 0.07209014892578125, 0.0780487060546875, 0.08400726318359375, 0.0899658203125, 0.09592437744140625, 0.1018829345703125, 0.10784149169921875, 0.113800048828125, 0.11975860595703125, 0.1257171630859375, 0.13167572021484375, 0.13763427734375, 0.14359283447265625, 0.1495513916015625, 0.15550994873046875, 0.161468505859375, 0.16742706298828125, 0.1733856201171875, 0.17934417724609375, 0.185302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 9.0, 8.0, 21.0, 23.0, 24.0, 30.0, 34.0, 38.0, 41.0, 52.0, 48.0, 48.0, 56.0, 55.0, 54.0, 51.0, 81.0, 50.0, 57.0, 44.0, 26.0, 33.0, 15.0, 25.0, 13.0, 15.0, 10.0, 7.0, 1.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3729438781738281, -0.35990142822265625, -0.3468589782714844, -0.3338165283203125, -0.3207740783691406, -0.30773162841796875, -0.2946891784667969, -0.281646728515625, -0.2686042785644531, -0.25556182861328125, -0.24251937866210938, -0.2294769287109375, -0.21643447875976562, -0.20339202880859375, -0.19034957885742188, -0.17730712890625, -0.16426467895507812, -0.15122222900390625, -0.13817977905273438, -0.1251373291015625, -0.11209487915039062, -0.09905242919921875, -0.08600997924804688, -0.072967529296875, -0.059925079345703125, -0.04688262939453125, -0.033840179443359375, -0.0207977294921875, -0.007755279541015625, 0.00528717041015625, 0.018329620361328125, 0.0313720703125, 0.044414520263671875, 0.05745697021484375, 0.07049942016601562, 0.0835418701171875, 0.09658432006835938, 0.10962677001953125, 0.12266921997070312, 0.135711669921875, 0.14875411987304688, 0.16179656982421875, 0.17483901977539062, 0.1878814697265625, 0.20092391967773438, 0.21396636962890625, 0.22700881958007812, 0.24005126953125, 0.2530937194824219, 0.26613616943359375, 0.2791786193847656, 0.2922210693359375, 0.3052635192871094, 0.31830596923828125, 0.3313484191894531, 0.344390869140625, 0.3574333190917969, 0.37047576904296875, 0.3835182189941406, 0.3965606689453125, 0.4096031188964844, 0.42264556884765625, 0.4356880187988281, 0.44873046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 15.0, 19.0, 22.0, 44.0, 42.0, 62.0, 112.0, 180.0, 268.0, 490.0, 1003.0, 1835.0, 3959.0, 8644.0, 19983.0, 56887.0, 229298.0, 477861.0, 171379.0, 44790.0, 16822.0, 7523.0, 3504.0, 1708.0, 858.0, 449.0, 256.0, 158.0, 113.0, 61.0, 55.0, 30.0, 18.0, 20.0, 17.0, 7.0, 8.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.151611328125, -0.14707183837890625, -0.1425323486328125, -0.13799285888671875, -0.133453369140625, -0.12891387939453125, -0.1243743896484375, -0.11983489990234375, -0.11529541015625, -0.11075592041015625, -0.1062164306640625, -0.10167694091796875, -0.097137451171875, -0.09259796142578125, -0.0880584716796875, -0.08351898193359375, -0.0789794921875, -0.07444000244140625, -0.0699005126953125, -0.06536102294921875, -0.060821533203125, -0.05628204345703125, -0.0517425537109375, -0.04720306396484375, -0.04266357421875, -0.03812408447265625, -0.0335845947265625, -0.02904510498046875, -0.024505615234375, -0.01996612548828125, -0.0154266357421875, -0.01088714599609375, -0.00634765625, -0.00180816650390625, 0.0027313232421875, 0.00727081298828125, 0.011810302734375, 0.01634979248046875, 0.0208892822265625, 0.02542877197265625, 0.02996826171875, 0.03450775146484375, 0.0390472412109375, 0.04358673095703125, 0.048126220703125, 0.05266571044921875, 0.0572052001953125, 0.06174468994140625, 0.0662841796875, 0.07082366943359375, 0.0753631591796875, 0.07990264892578125, 0.084442138671875, 0.08898162841796875, 0.0935211181640625, 0.09806060791015625, 0.10260009765625, 0.10713958740234375, 0.1116790771484375, 0.11621856689453125, 0.120758056640625, 0.12529754638671875, 0.1298370361328125, 0.13437652587890625, 0.138916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 12.0, 12.0, 17.0, 20.0, 20.0, 16.0, 26.0, 22.0, 35.0, 27.0, 41.0, 38.0, 41.0, 50.0, 49.0, 49.0, 46.0, 54.0, 50.0, 42.0, 49.0, 40.0, 25.0, 35.0, 30.0, 23.0, 21.0, 15.0, 15.0, 13.0, 14.0, 9.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.5891571044921875, -0.566497802734375, -0.5438385009765625, -0.52117919921875, -0.4985198974609375, -0.475860595703125, -0.4532012939453125, -0.4305419921875, -0.4078826904296875, -0.385223388671875, -0.3625640869140625, -0.33990478515625, -0.3172454833984375, -0.294586181640625, -0.2719268798828125, -0.249267578125, -0.2266082763671875, -0.203948974609375, -0.1812896728515625, -0.15863037109375, -0.1359710693359375, -0.113311767578125, -0.0906524658203125, -0.0679931640625, -0.0453338623046875, -0.022674560546875, -1.52587890625e-05, 0.02264404296875, 0.0453033447265625, 0.067962646484375, 0.0906219482421875, 0.11328125, 0.1359405517578125, 0.158599853515625, 0.1812591552734375, 0.20391845703125, 0.2265777587890625, 0.249237060546875, 0.2718963623046875, 0.2945556640625, 0.3172149658203125, 0.339874267578125, 0.3625335693359375, 0.38519287109375, 0.4078521728515625, 0.430511474609375, 0.4531707763671875, 0.475830078125, 0.4984893798828125, 0.521148681640625, 0.5438079833984375, 0.56646728515625, 0.5891265869140625, 0.611785888671875, 0.6344451904296875, 0.6571044921875, 0.6797637939453125, 0.702423095703125, 0.7250823974609375, 0.74774169921875, 0.7704010009765625, 0.793060302734375, 0.8157196044921875, 0.83837890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 6.0, 10.0, 16.0, 17.0, 22.0, 38.0, 63.0, 94.0, 127.0, 215.0, 325.0, 523.0, 945.0, 1789.0, 3586.0, 7236.0, 15860.0, 38304.0, 104849.0, 296732.0, 351221.0, 139068.0, 49068.0, 20059.0, 8935.0, 4299.0, 2182.0, 1151.0, 660.0, 415.0, 222.0, 159.0, 106.0, 58.0, 46.0, 39.0, 32.0, 15.0, 12.0, 15.0, 9.0, 10.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.04058837890625, -0.039399147033691406, -0.03820991516113281, -0.03702068328857422, -0.035831451416015625, -0.03464221954345703, -0.03345298767089844, -0.032263755798339844, -0.03107452392578125, -0.029885292053222656, -0.028696060180664062, -0.02750682830810547, -0.026317596435546875, -0.02512836456298828, -0.023939132690429688, -0.022749900817871094, -0.0215606689453125, -0.020371437072753906, -0.019182205200195312, -0.01799297332763672, -0.016803741455078125, -0.015614509582519531, -0.014425277709960938, -0.013236045837402344, -0.01204681396484375, -0.010857582092285156, -0.009668350219726562, -0.008479118347167969, -0.007289886474609375, -0.006100654602050781, -0.0049114227294921875, -0.0037221908569335938, -0.002532958984375, -0.0013437271118164062, -0.0001544952392578125, 0.0010347366333007812, 0.002223968505859375, 0.0034132003784179688, 0.0046024322509765625, 0.005791664123535156, 0.00698089599609375, 0.008170127868652344, 0.009359359741210938, 0.010548591613769531, 0.011737823486328125, 0.012927055358886719, 0.014116287231445312, 0.015305519104003906, 0.0164947509765625, 0.017683982849121094, 0.018873214721679688, 0.02006244659423828, 0.021251678466796875, 0.02244091033935547, 0.023630142211914062, 0.024819374084472656, 0.02600860595703125, 0.027197837829589844, 0.028387069702148438, 0.02957630157470703, 0.030765533447265625, 0.03195476531982422, 0.03314399719238281, 0.034333229064941406, 0.0355224609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 3.0, 4.0, 9.0, 9.0, 19.0, 26.0, 35.0, 43.0, 67.0, 71.0, 86.0, 98.0, 95.0, 108.0, 77.0, 64.0, 49.0, 37.0, 28.0, 18.0, 12.0, 4.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0159950256347656e-05, -2.9391609132289886e-05, -2.8623268008232117e-05, -2.7854926884174347e-05, -2.7086585760116577e-05, -2.6318244636058807e-05, -2.5549903512001038e-05, -2.4781562387943268e-05, -2.4013221263885498e-05, -2.3244880139827728e-05, -2.247653901576996e-05, -2.170819789171219e-05, -2.093985676765442e-05, -2.017151564359665e-05, -1.940317451953888e-05, -1.863483339548111e-05, -1.786649227142334e-05, -1.709815114736557e-05, -1.63298100233078e-05, -1.556146889925003e-05, -1.479312777519226e-05, -1.4024786651134491e-05, -1.3256445527076721e-05, -1.2488104403018951e-05, -1.1719763278961182e-05, -1.0951422154903412e-05, -1.0183081030845642e-05, -9.414739906787872e-06, -8.646398782730103e-06, -7.878057658672333e-06, -7.109716534614563e-06, -6.341375410556793e-06, -5.5730342864990234e-06, -4.804693162441254e-06, -4.036352038383484e-06, -3.268010914325714e-06, -2.4996697902679443e-06, -1.7313286662101746e-06, -9.629875421524048e-07, -1.94646418094635e-07, 5.736947059631348e-07, 1.3420358300209045e-06, 2.1103769540786743e-06, 2.878718078136444e-06, 3.647059202194214e-06, 4.415400326251984e-06, 5.183741450309753e-06, 5.952082574367523e-06, 6.720423698425293e-06, 7.488764822483063e-06, 8.257105946540833e-06, 9.025447070598602e-06, 9.793788194656372e-06, 1.0562129318714142e-05, 1.1330470442771912e-05, 1.2098811566829681e-05, 1.2867152690887451e-05, 1.3635493814945221e-05, 1.440383493900299e-05, 1.517217606306076e-05, 1.594051718711853e-05, 1.67088583111763e-05, 1.747719943523407e-05, 1.824554055929184e-05, 1.901388168334961e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 4.0, 11.0, 14.0, 8.0, 11.0, 8.0, 24.0, 28.0, 38.0, 60.0, 98.0, 196.0, 432.0, 1058.0, 3116.0, 10144.0, 38120.0, 214215.0, 612425.0, 130252.0, 26821.0, 7490.0, 2354.0, 828.0, 331.0, 165.0, 89.0, 45.0, 36.0, 23.0, 28.0, 10.0, 8.0, 10.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.0799560546875, -0.0777578353881836, -0.07555961608886719, -0.07336139678955078, -0.07116317749023438, -0.06896495819091797, -0.06676673889160156, -0.06456851959228516, -0.06237030029296875, -0.060172080993652344, -0.05797386169433594, -0.05577564239501953, -0.053577423095703125, -0.05137920379638672, -0.04918098449707031, -0.046982765197753906, -0.0447845458984375, -0.042586326599121094, -0.04038810729980469, -0.03818988800048828, -0.035991668701171875, -0.03379344940185547, -0.03159523010253906, -0.029397010803222656, -0.02719879150390625, -0.025000572204589844, -0.022802352905273438, -0.02060413360595703, -0.018405914306640625, -0.01620769500732422, -0.014009475708007812, -0.011811256408691406, -0.009613037109375, -0.007414817810058594, -0.0052165985107421875, -0.0030183792114257812, -0.000820159912109375, 0.0013780593872070312, 0.0035762786865234375, 0.005774497985839844, 0.00797271728515625, 0.010170936584472656, 0.012369155883789062, 0.014567375183105469, 0.016765594482421875, 0.01896381378173828, 0.021162033081054688, 0.023360252380371094, 0.0255584716796875, 0.027756690979003906, 0.029954910278320312, 0.03215312957763672, 0.034351348876953125, 0.03654956817626953, 0.03874778747558594, 0.040946006774902344, 0.04314422607421875, 0.045342445373535156, 0.04754066467285156, 0.04973888397216797, 0.051937103271484375, 0.05413532257080078, 0.05633354187011719, 0.058531761169433594, 0.06072998046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 8.0, 9.0, 8.0, 13.0, 12.0, 13.0, 18.0, 22.0, 20.0, 43.0, 50.0, 49.0, 64.0, 62.0, 58.0, 76.0, 72.0, 64.0, 50.0, 52.0, 45.0, 36.0, 25.0, 18.0, 19.0, 13.0, 10.0, 11.0, 8.0, 9.0, 4.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0112152099609375, -0.010865092277526855, -0.010514974594116211, -0.010164856910705566, -0.009814739227294922, -0.009464621543884277, -0.009114503860473633, -0.008764386177062988, -0.008414268493652344, -0.0080641508102417, -0.007714033126831055, -0.00736391544342041, -0.007013797760009766, -0.006663680076599121, -0.0063135623931884766, -0.005963444709777832, -0.0056133270263671875, -0.005263209342956543, -0.0049130916595458984, -0.004562973976135254, -0.004212856292724609, -0.003862738609313965, -0.0035126209259033203, -0.0031625032424926758, -0.0028123855590820312, -0.0024622678756713867, -0.002112150192260742, -0.0017620325088500977, -0.0014119148254394531, -0.0010617971420288086, -0.0007116794586181641, -0.00036156177520751953, -1.1444091796875e-05, 0.00033867359161376953, 0.0006887912750244141, 0.0010389089584350586, 0.0013890266418457031, 0.0017391443252563477, 0.002089262008666992, 0.0024393796920776367, 0.0027894973754882812, 0.0031396150588989258, 0.0034897327423095703, 0.003839850425720215, 0.004189968109130859, 0.004540085792541504, 0.0048902034759521484, 0.005240321159362793, 0.0055904388427734375, 0.005940556526184082, 0.0062906742095947266, 0.006640791893005371, 0.006990909576416016, 0.00734102725982666, 0.007691144943237305, 0.00804126262664795, 0.008391380310058594, 0.008741497993469238, 0.009091615676879883, 0.009441733360290527, 0.009791851043701172, 0.010141968727111816, 0.010492086410522461, 0.010842204093933105, 0.01119232177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 20.0, 19.0, 43.0, 91.0, 146.0, 181.0, 199.0, 142.0, 75.0, 46.0, 20.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9946099519729614, -0.9624832272529602, -0.9303565621376038, -0.8982298374176025, -0.8661031126976013, -0.8339763879776001, -0.8018497228622437, -0.7697229981422424, -0.7375962734222412, -0.70546954870224, -0.6733428835868835, -0.6412161588668823, -0.6090894341468811, -0.5769627094268799, -0.5448360443115234, -0.5127093195915222, -0.48058265447616577, -0.44845595955848694, -0.4163292348384857, -0.3842025399208069, -0.35207581520080566, -0.31994912028312683, -0.287822425365448, -0.2556957006454468, -0.22356900572776794, -0.19144229590892792, -0.1593155860900879, -0.12718889117240906, -0.09506218135356903, -0.062935471534729, -0.03080877661705017, 0.001317933201789856, 0.03344464302062988, 0.06557135283946991, 0.09769805520772934, 0.12982475757598877, 0.1619514673948288, 0.19407817721366882, 0.22620487213134766, 0.2583315968513489, 0.2904582917690277, 0.32258498668670654, 0.35471171140670776, 0.3868384063243866, 0.41896510124206543, 0.45109182596206665, 0.4832185208797455, 0.5153452157974243, 0.5474719405174255, 0.5795986652374268, 0.6117253303527832, 0.6438520550727844, 0.6759787797927856, 0.7081054449081421, 0.7402321696281433, 0.7723588943481445, 0.804485559463501, 0.8366122841835022, 0.8687389492988586, 0.9008656740188599, 0.9329923987388611, 0.9651191234588623, 0.9972457885742188, 1.0293724536895752, 1.0614992380142212]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 8.0, 10.0, 15.0, 17.0, 18.0, 23.0, 29.0, 33.0, 37.0, 35.0, 49.0, 42.0, 38.0, 48.0, 54.0, 42.0, 56.0, 48.0, 58.0, 52.0, 41.0, 40.0, 24.0, 39.0, 20.0, 21.0, 23.0, 15.0, 8.0, 11.0, 6.0, 3.0, 7.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34961679577827454, -0.3385044038295746, -0.32739201188087463, -0.3162795901298523, -0.30516719818115234, -0.2940548062324524, -0.28294241428375244, -0.2718300223350525, -0.26071763038635254, -0.2496052384376526, -0.23849283158779144, -0.2273804396390915, -0.21626803278923035, -0.2051556408405304, -0.19404324889183044, -0.1829308569431305, -0.17181843519210815, -0.1607060432434082, -0.14959363639354706, -0.1384812444448471, -0.12736883759498596, -0.11625644564628601, -0.10514405369758606, -0.09403165429830551, -0.08291925489902496, -0.07180685549974442, -0.060694459825754166, -0.049582064151763916, -0.03846966475248337, -0.02735726535320282, -0.01624487340450287, -0.0051324740052223206, 0.00597989559173584, 0.01709229312837124, 0.028204690665006638, 0.03931708633899689, 0.050429485738277435, 0.06154188513755798, 0.07265427708625793, 0.08376667648553848, 0.09487907588481903, 0.10599147528409958, 0.11710387468338013, 0.12821626663208008, 0.13932865858078003, 0.15044106543064117, 0.16155345737934113, 0.17266586422920227, 0.18377825617790222, 0.19489064812660217, 0.20600305497646332, 0.21711544692516327, 0.22822785377502441, 0.23934024572372437, 0.2504526376724243, 0.26156502962112427, 0.2726774215698242, 0.28378981351852417, 0.2949022054672241, 0.3060145974159241, 0.3171270191669464, 0.32823941111564636, 0.3393518030643463, 0.35046419501304626, 0.3615766167640686]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 5.0, 5.0, 8.0, 6.0, 10.0, 17.0, 22.0, 35.0, 51.0, 99.0, 219.0, 706.0, 3984.0, 38511.0, 667541.0, 316054.0, 18127.0, 2265.0, 518.0, 157.0, 76.0, 29.0, 34.0, 11.0, 10.0, 12.0, 7.0, 2.0, 2.0, 8.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92578125, -0.8975982666015625, -0.869415283203125, -0.8412322998046875, -0.81304931640625, -0.7848663330078125, -0.756683349609375, -0.7285003662109375, -0.7003173828125, -0.6721343994140625, -0.643951416015625, -0.6157684326171875, -0.58758544921875, -0.5594024658203125, -0.531219482421875, -0.5030364990234375, -0.474853515625, -0.4466705322265625, -0.418487548828125, -0.3903045654296875, -0.36212158203125, -0.3339385986328125, -0.305755615234375, -0.2775726318359375, -0.2493896484375, -0.2212066650390625, -0.193023681640625, -0.1648406982421875, -0.13665771484375, -0.1084747314453125, -0.080291748046875, -0.0521087646484375, -0.02392578125, 0.0042572021484375, 0.032440185546875, 0.0606231689453125, 0.08880615234375, 0.1169891357421875, 0.145172119140625, 0.1733551025390625, 0.2015380859375, 0.2297210693359375, 0.257904052734375, 0.2860870361328125, 0.31427001953125, 0.3424530029296875, 0.370635986328125, 0.3988189697265625, 0.427001953125, 0.4551849365234375, 0.483367919921875, 0.5115509033203125, 0.53973388671875, 0.5679168701171875, 0.596099853515625, 0.6242828369140625, 0.6524658203125, 0.6806488037109375, 0.708831787109375, 0.7370147705078125, 0.76519775390625, 0.7933807373046875, 0.821563720703125, 0.8497467041015625, 0.8779296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 7.0, 5.0, 16.0, 7.0, 18.0, 19.0, 27.0, 39.0, 42.0, 44.0, 47.0, 54.0, 72.0, 59.0, 66.0, 65.0, 55.0, 66.0, 61.0, 50.0, 37.0, 32.0, 24.0, 14.0, 26.0, 10.0, 10.0, 8.0, 3.0, 5.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7578125, -0.7300872802734375, -0.702362060546875, -0.6746368408203125, -0.64691162109375, -0.6191864013671875, -0.591461181640625, -0.5637359619140625, -0.5360107421875, -0.5082855224609375, -0.480560302734375, -0.4528350830078125, -0.42510986328125, -0.3973846435546875, -0.369659423828125, -0.3419342041015625, -0.314208984375, -0.2864837646484375, -0.258758544921875, -0.2310333251953125, -0.20330810546875, -0.1755828857421875, -0.147857666015625, -0.1201324462890625, -0.0924072265625, -0.0646820068359375, -0.036956787109375, -0.0092315673828125, 0.01849365234375, 0.0462188720703125, 0.073944091796875, 0.1016693115234375, 0.12939453125, 0.1571197509765625, 0.184844970703125, 0.2125701904296875, 0.24029541015625, 0.2680206298828125, 0.295745849609375, 0.3234710693359375, 0.3511962890625, 0.3789215087890625, 0.406646728515625, 0.4343719482421875, 0.46209716796875, 0.4898223876953125, 0.517547607421875, 0.5452728271484375, 0.572998046875, 0.6007232666015625, 0.628448486328125, 0.6561737060546875, 0.68389892578125, 0.7116241455078125, 0.739349365234375, 0.7670745849609375, 0.7947998046875, 0.8225250244140625, 0.850250244140625, 0.8779754638671875, 0.90570068359375, 0.9334259033203125, 0.961151123046875, 0.9888763427734375, 1.0166015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 17.0, 23.0, 19.0, 26.0, 38.0, 53.0, 57.0, 64.0, 83.0, 107.0, 152.0, 263.0, 506.0, 1501.0, 7430.0, 67994.0, 749278.0, 200852.0, 15565.0, 2628.0, 772.0, 324.0, 180.0, 148.0, 89.0, 65.0, 55.0, 47.0, 36.0, 20.0, 24.0, 20.0, 22.0, 15.0, 10.0, 14.0, 8.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.70947265625, -0.6863555908203125, -0.663238525390625, -0.6401214599609375, -0.61700439453125, -0.5938873291015625, -0.570770263671875, -0.5476531982421875, -0.5245361328125, -0.5014190673828125, -0.478302001953125, -0.4551849365234375, -0.43206787109375, -0.4089508056640625, -0.385833740234375, -0.3627166748046875, -0.339599609375, -0.3164825439453125, -0.293365478515625, -0.2702484130859375, -0.24713134765625, -0.2240142822265625, -0.200897216796875, -0.1777801513671875, -0.1546630859375, -0.1315460205078125, -0.108428955078125, -0.0853118896484375, -0.06219482421875, -0.0390777587890625, -0.015960693359375, 0.0071563720703125, 0.0302734375, 0.0533905029296875, 0.076507568359375, 0.0996246337890625, 0.12274169921875, 0.1458587646484375, 0.168975830078125, 0.1920928955078125, 0.2152099609375, 0.2383270263671875, 0.261444091796875, 0.2845611572265625, 0.30767822265625, 0.3307952880859375, 0.353912353515625, 0.3770294189453125, 0.400146484375, 0.4232635498046875, 0.446380615234375, 0.4694976806640625, 0.49261474609375, 0.5157318115234375, 0.538848876953125, 0.5619659423828125, 0.5850830078125, 0.6082000732421875, 0.631317138671875, 0.6544342041015625, 0.67755126953125, 0.7006683349609375, 0.723785400390625, 0.7469024658203125, 0.77001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 1.0, 2.0, 8.0, 14.0, 10.0, 9.0, 23.0, 15.0, 15.0, 20.0, 17.0, 30.0, 30.0, 35.0, 32.0, 30.0, 37.0, 34.0, 43.0, 37.0, 47.0, 49.0, 48.0, 46.0, 40.0, 38.0, 40.0, 38.0, 28.0, 19.0, 18.0, 15.0, 24.0, 11.0, 14.0, 15.0, 10.0, 9.0, 10.0, 6.0, 5.0, 6.0, 13.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.63623046875, -0.6144638061523438, -0.5926971435546875, -0.5709304809570312, -0.549163818359375, -0.5273971557617188, -0.5056304931640625, -0.48386383056640625, -0.46209716796875, -0.44033050537109375, -0.4185638427734375, -0.39679718017578125, -0.375030517578125, -0.35326385498046875, -0.3314971923828125, -0.30973052978515625, -0.2879638671875, -0.26619720458984375, -0.2444305419921875, -0.22266387939453125, -0.200897216796875, -0.17913055419921875, -0.1573638916015625, -0.13559722900390625, -0.11383056640625, -0.09206390380859375, -0.0702972412109375, -0.04853057861328125, -0.026763916015625, -0.00499725341796875, 0.0167694091796875, 0.03853607177734375, 0.060302734375, 0.08206939697265625, 0.1038360595703125, 0.12560272216796875, 0.147369384765625, 0.16913604736328125, 0.1909027099609375, 0.21266937255859375, 0.23443603515625, 0.25620269775390625, 0.2779693603515625, 0.29973602294921875, 0.321502685546875, 0.34326934814453125, 0.3650360107421875, 0.38680267333984375, 0.4085693359375, 0.43033599853515625, 0.4521026611328125, 0.47386932373046875, 0.495635986328125, 0.5174026489257812, 0.5391693115234375, 0.5609359741210938, 0.58270263671875, 0.6044692993164062, 0.6262359619140625, 0.6480026245117188, 0.669769287109375, 0.6915359497070312, 0.7133026123046875, 0.7350692749023438, 0.7568359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 11.0, 18.0, 16.0, 14.0, 30.0, 55.0, 118.0, 230.0, 571.0, 1801.0, 8240.0, 92498.0, 841052.0, 92994.0, 7968.0, 1767.0, 609.0, 242.0, 109.0, 59.0, 32.0, 25.0, 15.0, 16.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.316162109375, -0.30672454833984375, -0.2972869873046875, -0.28784942626953125, -0.278411865234375, -0.26897430419921875, -0.2595367431640625, -0.25009918212890625, -0.24066162109375, -0.23122406005859375, -0.2217864990234375, -0.21234893798828125, -0.202911376953125, -0.19347381591796875, -0.1840362548828125, -0.17459869384765625, -0.1651611328125, -0.15572357177734375, -0.1462860107421875, -0.13684844970703125, -0.127410888671875, -0.11797332763671875, -0.1085357666015625, -0.09909820556640625, -0.08966064453125, -0.08022308349609375, -0.0707855224609375, -0.06134796142578125, -0.051910400390625, -0.04247283935546875, -0.0330352783203125, -0.02359771728515625, -0.01416015625, -0.00472259521484375, 0.0047149658203125, 0.01415252685546875, 0.023590087890625, 0.03302764892578125, 0.0424652099609375, 0.05190277099609375, 0.06134033203125, 0.07077789306640625, 0.0802154541015625, 0.08965301513671875, 0.099090576171875, 0.10852813720703125, 0.1179656982421875, 0.12740325927734375, 0.1368408203125, 0.14627838134765625, 0.1557159423828125, 0.16515350341796875, 0.174591064453125, 0.18402862548828125, 0.1934661865234375, 0.20290374755859375, 0.21234130859375, 0.22177886962890625, 0.2312164306640625, 0.24065399169921875, 0.250091552734375, 0.25952911376953125, 0.2689666748046875, 0.27840423583984375, 0.287841796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 10.0, 8.0, 13.0, 17.0, 25.0, 62.0, 52.0, 57.0, 85.0, 106.0, 101.0, 120.0, 62.0, 56.0, 41.0, 41.0, 37.0, 23.0, 20.0, 13.0, 7.0, 9.0, 12.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014636993408203e-05, -1.932494342327118e-05, -1.8503516912460327e-05, -1.7682090401649475e-05, -1.6860663890838623e-05, -1.603923738002777e-05, -1.5217810869216919e-05, -1.4396384358406067e-05, -1.3574957847595215e-05, -1.2753531336784363e-05, -1.193210482597351e-05, -1.1110678315162659e-05, -1.0289251804351807e-05, -9.467825293540955e-06, -8.646398782730103e-06, -7.82497227191925e-06, -7.0035457611083984e-06, -6.182119250297546e-06, -5.360692739486694e-06, -4.539266228675842e-06, -3.7178397178649902e-06, -2.896413207054138e-06, -2.074986696243286e-06, -1.253560185432434e-06, -4.3213367462158203e-07, 3.8929283618927e-07, 1.210719347000122e-06, 2.032145857810974e-06, 2.853572368621826e-06, 3.6749988794326782e-06, 4.49642539024353e-06, 5.317851901054382e-06, 6.139278411865234e-06, 6.9607049226760864e-06, 7.782131433486938e-06, 8.60355794429779e-06, 9.424984455108643e-06, 1.0246410965919495e-05, 1.1067837476730347e-05, 1.1889263987541199e-05, 1.271069049835205e-05, 1.3532117009162903e-05, 1.4353543519973755e-05, 1.5174970030784607e-05, 1.599639654159546e-05, 1.681782305240631e-05, 1.7639249563217163e-05, 1.8460676074028015e-05, 1.9282102584838867e-05, 2.010352909564972e-05, 2.092495560646057e-05, 2.1746382117271423e-05, 2.2567808628082275e-05, 2.3389235138893127e-05, 2.421066164970398e-05, 2.503208816051483e-05, 2.5853514671325684e-05, 2.6674941182136536e-05, 2.7496367692947388e-05, 2.831779420375824e-05, 2.9139220714569092e-05, 2.9960647225379944e-05, 3.0782073736190796e-05, 3.160350024700165e-05, 3.24249267578125e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 25.0, 54.0, 110.0, 224.0, 684.0, 2891.0, 26172.0, 847819.0, 161198.0, 7317.0, 1308.0, 404.0, 150.0, 54.0, 34.0, 22.0, 17.0, 12.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.475341796875, -0.46166229248046875, -0.4479827880859375, -0.43430328369140625, -0.420623779296875, -0.40694427490234375, -0.3932647705078125, -0.37958526611328125, -0.36590576171875, -0.35222625732421875, -0.3385467529296875, -0.32486724853515625, -0.311187744140625, -0.29750823974609375, -0.2838287353515625, -0.27014923095703125, -0.2564697265625, -0.24279022216796875, -0.2291107177734375, -0.21543121337890625, -0.201751708984375, -0.18807220458984375, -0.1743927001953125, -0.16071319580078125, -0.14703369140625, -0.13335418701171875, -0.1196746826171875, -0.10599517822265625, -0.092315673828125, -0.07863616943359375, -0.0649566650390625, -0.05127716064453125, -0.03759765625, -0.02391815185546875, -0.0102386474609375, 0.00344085693359375, 0.017120361328125, 0.03079986572265625, 0.0444793701171875, 0.05815887451171875, 0.07183837890625, 0.08551788330078125, 0.0991973876953125, 0.11287689208984375, 0.126556396484375, 0.14023590087890625, 0.1539154052734375, 0.16759490966796875, 0.1812744140625, 0.19495391845703125, 0.2086334228515625, 0.22231292724609375, 0.235992431640625, 0.24967193603515625, 0.2633514404296875, 0.27703094482421875, 0.29071044921875, 0.30438995361328125, 0.3180694580078125, 0.33174896240234375, 0.345428466796875, 0.35910797119140625, 0.3727874755859375, 0.38646697998046875, 0.400146484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 10.0, 16.0, 21.0, 22.0, 45.0, 58.0, 66.0, 87.0, 124.0, 136.0, 119.0, 82.0, 66.0, 47.0, 22.0, 28.0, 14.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10210990905761719, -0.09862899780273438, -0.09514808654785156, -0.09166717529296875, -0.08818626403808594, -0.08470535278320312, -0.08122444152832031, -0.0777435302734375, -0.07426261901855469, -0.07078170776367188, -0.06730079650878906, -0.06381988525390625, -0.06033897399902344, -0.056858062744140625, -0.05337715148925781, -0.049896240234375, -0.04641532897949219, -0.042934417724609375, -0.03945350646972656, -0.03597259521484375, -0.03249168395996094, -0.029010772705078125, -0.025529861450195312, -0.0220489501953125, -0.018568038940429688, -0.015087127685546875, -0.011606216430664062, -0.00812530517578125, -0.0046443939208984375, -0.001163482666015625, 0.0023174285888671875, 0.00579833984375, 0.009279251098632812, 0.012760162353515625, 0.016241073608398438, 0.01972198486328125, 0.023202896118164062, 0.026683807373046875, 0.030164718627929688, 0.0336456298828125, 0.03712654113769531, 0.040607452392578125, 0.04408836364746094, 0.04756927490234375, 0.05105018615722656, 0.054531097412109375, 0.05801200866699219, 0.061492919921875, 0.06497383117675781, 0.06845474243164062, 0.07193565368652344, 0.07541656494140625, 0.07889747619628906, 0.08237838745117188, 0.08585929870605469, 0.0893402099609375, 0.09282112121582031, 0.09630203247070312, 0.09978294372558594, 0.10326385498046875, 0.10674476623535156, 0.11022567749023438, 0.11370658874511719, 0.1171875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 10.0, 13.0, 38.0, 103.0, 196.0, 240.0, 224.0, 110.0, 44.0, 17.0, 10.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8651397228240967, -1.779088020324707, -1.6930363178253174, -1.6069846153259277, -1.520932912826538, -1.4348812103271484, -1.3488295078277588, -1.2627778053283691, -1.1767261028289795, -1.0906744003295898, -1.0046226978302002, -0.9185709953308105, -0.8325192928314209, -0.7464675903320312, -0.6604158878326416, -0.574364185333252, -0.4883124828338623, -0.40226078033447266, -0.316209077835083, -0.23015737533569336, -0.1441056728363037, -0.05805397033691406, 0.027997732162475586, 0.11404943466186523, 0.20010113716125488, 0.28615283966064453, 0.3722045421600342, 0.45825624465942383, 0.5443079471588135, 0.6303596496582031, 0.7164113521575928, 0.8024630546569824, 0.8885147571563721, 0.9745664596557617, 1.0606181621551514, 1.146669864654541, 1.2327215671539307, 1.3187732696533203, 1.40482497215271, 1.4908766746520996, 1.5769283771514893, 1.662980079650879, 1.7490317821502686, 1.8350834846496582, 1.9211351871490479, 2.0071868896484375, 2.093238592147827, 2.179290294647217, 2.2653419971466064, 2.351393699645996, 2.4374454021453857, 2.5234971046447754, 2.609548807144165, 2.6956005096435547, 2.7816522121429443, 2.867703914642334, 2.9537556171417236, 3.0398073196411133, 3.125859022140503, 3.2119107246398926, 3.2979624271392822, 3.384014129638672, 3.4700658321380615, 3.556117534637451, 3.642169237136841]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 2.0, 8.0, 7.0, 8.0, 10.0, 13.0, 14.0, 21.0, 23.0, 21.0, 24.0, 34.0, 25.0, 36.0, 29.0, 49.0, 30.0, 53.0, 42.0, 48.0, 41.0, 36.0, 36.0, 46.0, 38.0, 33.0, 31.0, 32.0, 32.0, 20.0, 37.0, 14.0, 16.0, 15.0, 4.0, 14.0, 16.0, 9.0, 5.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.1624853610992432, -1.125333309173584, -1.0881812572479248, -1.0510293245315552, -1.013877272605896, -0.9767252206802368, -0.9395731687545776, -0.9024211764335632, -0.8652691841125488, -0.8281171321868896, -0.7909651398658752, -0.7538130879402161, -0.7166610956192017, -0.6795090436935425, -0.6423569917678833, -0.6052049994468689, -0.5680529475212097, -0.5309008955955505, -0.49374890327453613, -0.45659685134887695, -0.41944485902786255, -0.38229280710220337, -0.3451407849788666, -0.3079887628555298, -0.270836740732193, -0.2336847186088562, -0.1965326964855194, -0.15938065946102142, -0.12222863733768463, -0.08507661521434784, -0.047924578189849854, -0.010772556066513062, 0.02637946605682373, 0.06353148818016052, 0.10068351775407791, 0.1378355473279953, 0.1749875694513321, 0.21213959157466888, 0.24929162859916687, 0.28644365072250366, 0.32359567284584045, 0.36074769496917725, 0.39789971709251404, 0.43505173921585083, 0.47220379114151, 0.5093557834625244, 0.5465078353881836, 0.5836598873138428, 0.6208118796348572, 0.6579639315605164, 0.6951159238815308, 0.7322679758071899, 0.7694199681282043, 0.8065720200538635, 0.8437240123748779, 0.8808760643005371, 0.9180281162261963, 0.9551801681518555, 0.9923321604728699, 1.0294841527938843, 1.0666362047195435, 1.1037882566452026, 1.1409403085708618, 1.1780922412872314, 1.2152442932128906]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 8.0, 12.0, 12.0, 20.0, 53.0, 86.0, 178.0, 370.0, 975.0, 3195.0, 15787.0, 159726.0, 2373819.0, 1532573.0, 93353.0, 10199.0, 2425.0, 853.0, 327.0, 143.0, 80.0, 26.0, 28.0, 13.0, 8.0, 9.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3388671875, -1.3076553344726562, -1.2764434814453125, -1.2452316284179688, -1.214019775390625, -1.1828079223632812, -1.1515960693359375, -1.1203842163085938, -1.08917236328125, -1.0579605102539062, -1.0267486572265625, -0.9955368041992188, -0.964324951171875, -0.9331130981445312, -0.9019012451171875, -0.8706893920898438, -0.8394775390625, -0.8082656860351562, -0.7770538330078125, -0.7458419799804688, -0.714630126953125, -0.6834182739257812, -0.6522064208984375, -0.6209945678710938, -0.58978271484375, -0.5585708618164062, -0.5273590087890625, -0.49614715576171875, -0.464935302734375, -0.43372344970703125, -0.4025115966796875, -0.37129974365234375, -0.340087890625, -0.30887603759765625, -0.2776641845703125, -0.24645233154296875, -0.215240478515625, -0.18402862548828125, -0.1528167724609375, -0.12160491943359375, -0.09039306640625, -0.05918121337890625, -0.0279693603515625, 0.00324249267578125, 0.034454345703125, 0.06566619873046875, 0.0968780517578125, 0.12808990478515625, 0.1593017578125, 0.19051361083984375, 0.2217254638671875, 0.25293731689453125, 0.284149169921875, 0.31536102294921875, 0.3465728759765625, 0.37778472900390625, 0.40899658203125, 0.44020843505859375, 0.4714202880859375, 0.5026321411132812, 0.533843994140625, 0.5650558471679688, 0.5962677001953125, 0.6274795532226562, 0.65869140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 5.0, 10.0, 17.0, 13.0, 18.0, 22.0, 20.0, 22.0, 39.0, 42.0, 43.0, 53.0, 42.0, 52.0, 59.0, 57.0, 63.0, 57.0, 68.0, 52.0, 38.0, 31.0, 29.0, 35.0, 17.0, 15.0, 21.0, 15.0, 7.0, 11.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.500732421875, -0.48291015625, -0.465087890625, -0.447265625, -0.429443359375, -0.41162109375, -0.393798828125, -0.3759765625, -0.358154296875, -0.34033203125, -0.322509765625, -0.3046875, -0.286865234375, -0.26904296875, -0.251220703125, -0.2333984375, -0.215576171875, -0.19775390625, -0.179931640625, -0.162109375, -0.144287109375, -0.12646484375, -0.108642578125, -0.0908203125, -0.072998046875, -0.05517578125, -0.037353515625, -0.01953125, -0.001708984375, 0.01611328125, 0.033935546875, 0.0517578125, 0.069580078125, 0.08740234375, 0.105224609375, 0.123046875, 0.140869140625, 0.15869140625, 0.176513671875, 0.1943359375, 0.212158203125, 0.22998046875, 0.247802734375, 0.265625, 0.283447265625, 0.30126953125, 0.319091796875, 0.3369140625, 0.354736328125, 0.37255859375, 0.390380859375, 0.408203125, 0.426025390625, 0.44384765625, 0.461669921875, 0.4794921875, 0.497314453125, 0.51513671875, 0.532958984375, 0.55078125, 0.568603515625, 0.58642578125, 0.604248046875, 0.6220703125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 9.0, 12.0, 22.0, 16.0, 20.0, 27.0, 66.0, 77.0, 137.0, 252.0, 578.0, 1638.0, 6244.0, 45434.0, 2152249.0, 1937290.0, 42071.0, 5562.0, 1410.0, 570.0, 247.0, 120.0, 79.0, 42.0, 27.0, 10.0, 13.0, 11.0, 15.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0272674560546875, -0.993011474609375, -0.9587554931640625, -0.92449951171875, -0.8902435302734375, -0.855987548828125, -0.8217315673828125, -0.7874755859375, -0.7532196044921875, -0.718963623046875, -0.6847076416015625, -0.65045166015625, -0.6161956787109375, -0.581939697265625, -0.5476837158203125, -0.513427734375, -0.4791717529296875, -0.444915771484375, -0.4106597900390625, -0.37640380859375, -0.3421478271484375, -0.307891845703125, -0.2736358642578125, -0.2393798828125, -0.2051239013671875, -0.170867919921875, -0.1366119384765625, -0.10235595703125, -0.0680999755859375, -0.033843994140625, 0.0004119873046875, 0.03466796875, 0.0689239501953125, 0.103179931640625, 0.1374359130859375, 0.17169189453125, 0.2059478759765625, 0.240203857421875, 0.2744598388671875, 0.3087158203125, 0.3429718017578125, 0.377227783203125, 0.4114837646484375, 0.44573974609375, 0.4799957275390625, 0.514251708984375, 0.5485076904296875, 0.582763671875, 0.6170196533203125, 0.651275634765625, 0.6855316162109375, 0.71978759765625, 0.7540435791015625, 0.788299560546875, 0.8225555419921875, 0.8568115234375, 0.8910675048828125, 0.925323486328125, 0.9595794677734375, 0.99383544921875, 1.0280914306640625, 1.062347412109375, 1.0966033935546875, 1.130859375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 13.0, 13.0, 21.0, 36.0, 32.0, 58.0, 77.0, 147.0, 234.0, 381.0, 538.0, 633.0, 641.0, 410.0, 276.0, 201.0, 99.0, 74.0, 41.0, 43.0, 22.0, 18.0, 11.0, 11.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.212158203125, -0.20500755310058594, -0.19785690307617188, -0.1907062530517578, -0.18355560302734375, -0.1764049530029297, -0.16925430297851562, -0.16210365295410156, -0.1549530029296875, -0.14780235290527344, -0.14065170288085938, -0.1335010528564453, -0.12635040283203125, -0.11919975280761719, -0.11204910278320312, -0.10489845275878906, -0.097747802734375, -0.09059715270996094, -0.08344650268554688, -0.07629585266113281, -0.06914520263671875, -0.06199455261230469, -0.054843902587890625, -0.04769325256347656, -0.0405426025390625, -0.03339195251464844, -0.026241302490234375, -0.019090652465820312, -0.01194000244140625, -0.0047893524169921875, 0.002361297607421875, 0.009511947631835938, 0.01666259765625, 0.023813247680664062, 0.030963897705078125, 0.03811454772949219, 0.04526519775390625, 0.05241584777832031, 0.059566497802734375, 0.06671714782714844, 0.0738677978515625, 0.08101844787597656, 0.08816909790039062, 0.09531974792480469, 0.10247039794921875, 0.10962104797363281, 0.11677169799804688, 0.12392234802246094, 0.131072998046875, 0.13822364807128906, 0.14537429809570312, 0.1525249481201172, 0.15967559814453125, 0.1668262481689453, 0.17397689819335938, 0.18112754821777344, 0.1882781982421875, 0.19542884826660156, 0.20257949829101562, 0.2097301483154297, 0.21688079833984375, 0.2240314483642578, 0.23118209838867188, 0.23833274841308594, 0.2454833984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 10.0, 15.0, 32.0, 54.0, 73.0, 152.0, 164.0, 154.0, 140.0, 69.0, 61.0, 37.0, 17.0, 10.0, 10.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330198884010315, -1.2857933044433594, -1.2413878440856934, -1.1969822645187378, -1.1525766849517822, -1.1081711053848267, -1.063765525817871, -1.019360065460205, -0.9749544858932495, -0.930548906326294, -0.8861433863639832, -0.8417378664016724, -0.7973322868347168, -0.7529267072677612, -0.7085211873054504, -0.6641156673431396, -0.6197100877761841, -0.5753045082092285, -0.5308989882469177, -0.48649343848228455, -0.44208788871765137, -0.3976823389530182, -0.353276789188385, -0.30887123942375183, -0.26446568965911865, -0.22006013989448547, -0.1756545901298523, -0.13124904036521912, -0.08684349060058594, -0.04243794083595276, 0.00196760892868042, 0.0463731586933136, 0.09077882766723633, 0.1351843774318695, 0.17958992719650269, 0.22399547696113586, 0.26840102672576904, 0.3128065764904022, 0.3572121262550354, 0.4016176760196686, 0.44602322578430176, 0.49042877554893494, 0.5348343253135681, 0.5792398452758789, 0.6236454248428345, 0.66805100440979, 0.7124565243721008, 0.7568620443344116, 0.8012676239013672, 0.8456732034683228, 0.8900787234306335, 0.9344842433929443, 0.9788898229598999, 1.0232954025268555, 1.0677008628845215, 1.112106442451477, 1.1565120220184326, 1.2009176015853882, 1.2453231811523438, 1.2897286415100098, 1.3341342210769653, 1.378539800643921, 1.422945261001587, 1.4673508405685425, 1.511756420135498]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 6.0, 10.0, 5.0, 8.0, 19.0, 14.0, 22.0, 16.0, 29.0, 42.0, 25.0, 35.0, 42.0, 39.0, 50.0, 39.0, 52.0, 51.0, 40.0, 55.0, 49.0, 42.0, 28.0, 38.0, 46.0, 30.0, 28.0, 26.0, 19.0, 16.0, 16.0, 11.0, 10.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5331793427467346, -0.5166094899177551, -0.5000395774841309, -0.48346972465515137, -0.4668998718261719, -0.4503300189971924, -0.4337601363658905, -0.4171902537345886, -0.40062040090560913, -0.38405054807662964, -0.36748066544532776, -0.3509107828140259, -0.3343409299850464, -0.3177710771560669, -0.301201194524765, -0.28463131189346313, -0.26806145906448364, -0.25149160623550415, -0.23492172360420227, -0.21835185587406158, -0.2017819881439209, -0.1852121204137802, -0.16864225268363953, -0.15207238495349884, -0.13550251722335815, -0.11893264949321747, -0.10236278176307678, -0.0857929140329361, -0.06922304630279541, -0.052653178572654724, -0.03608331084251404, -0.019513443112373352, -0.002943575382232666, 0.01362629234790802, 0.030196160078048706, 0.04676602780818939, 0.06333589553833008, 0.07990576326847076, 0.09647563099861145, 0.11304549872875214, 0.12961536645889282, 0.1461852341890335, 0.1627551019191742, 0.17932496964931488, 0.19589483737945557, 0.21246470510959625, 0.22903457283973694, 0.24560444056987762, 0.2621743083000183, 0.2787441611289978, 0.2953140437602997, 0.31188392639160156, 0.32845377922058105, 0.34502363204956055, 0.3615935146808624, 0.3781633973121643, 0.3947332501411438, 0.4113031029701233, 0.42787298560142517, 0.44444286823272705, 0.46101272106170654, 0.47758257389068604, 0.4941524565219879, 0.5107223391532898, 0.5272921919822693]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 11.0, 23.0, 18.0, 46.0, 58.0, 108.0, 210.0, 370.0, 789.0, 1753.0, 4221.0, 10682.0, 30098.0, 88737.0, 245554.0, 364618.0, 196559.0, 67189.0, 22786.0, 8458.0, 3294.0, 1458.0, 728.0, 333.0, 165.0, 99.0, 76.0, 35.0, 20.0, 14.0, 11.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0772705078125, -0.0743408203125, -0.0714111328125, -0.0684814453125, -0.0655517578125, -0.0626220703125, -0.0596923828125, -0.0567626953125, -0.0538330078125, -0.0509033203125, -0.0479736328125, -0.0450439453125, -0.0421142578125, -0.0391845703125, -0.0362548828125, -0.0333251953125, -0.0303955078125, -0.0274658203125, -0.0245361328125, -0.0216064453125, -0.0186767578125, -0.0157470703125, -0.0128173828125, -0.0098876953125, -0.0069580078125, -0.0040283203125, -0.0010986328125, 0.0018310546875, 0.0047607421875, 0.0076904296875, 0.0106201171875, 0.0135498046875, 0.0164794921875, 0.0194091796875, 0.0223388671875, 0.0252685546875, 0.0281982421875, 0.0311279296875, 0.0340576171875, 0.0369873046875, 0.0399169921875, 0.0428466796875, 0.0457763671875, 0.0487060546875, 0.0516357421875, 0.0545654296875, 0.0574951171875, 0.0604248046875, 0.0633544921875, 0.0662841796875, 0.0692138671875, 0.0721435546875, 0.0750732421875, 0.0780029296875, 0.0809326171875, 0.0838623046875, 0.0867919921875, 0.0897216796875, 0.0926513671875, 0.0955810546875, 0.0985107421875, 0.1014404296875, 0.1043701171875, 0.1072998046875, 0.1102294921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 10.0, 9.0, 10.0, 11.0, 17.0, 17.0, 15.0, 30.0, 32.0, 39.0, 40.0, 51.0, 57.0, 56.0, 60.0, 68.0, 75.0, 44.0, 60.0, 49.0, 39.0, 50.0, 34.0, 25.0, 20.0, 20.0, 11.0, 13.0, 14.0, 12.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.2746162414550781, -0.26187896728515625, -0.24914169311523438, -0.2364044189453125, -0.22366714477539062, -0.21092987060546875, -0.19819259643554688, -0.185455322265625, -0.17271804809570312, -0.15998077392578125, -0.14724349975585938, -0.1345062255859375, -0.12176895141601562, -0.10903167724609375, -0.09629440307617188, -0.08355712890625, -0.07081985473632812, -0.05808258056640625, -0.045345306396484375, -0.0326080322265625, -0.019870758056640625, -0.00713348388671875, 0.005603790283203125, 0.018341064453125, 0.031078338623046875, 0.04381561279296875, 0.056552886962890625, 0.0692901611328125, 0.08202743530273438, 0.09476470947265625, 0.10750198364257812, 0.1202392578125, 0.13297653198242188, 0.14571380615234375, 0.15845108032226562, 0.1711883544921875, 0.18392562866210938, 0.19666290283203125, 0.20940017700195312, 0.222137451171875, 0.23487472534179688, 0.24761199951171875, 0.2603492736816406, 0.2730865478515625, 0.2858238220214844, 0.29856109619140625, 0.3112983703613281, 0.32403564453125, 0.3367729187011719, 0.34951019287109375, 0.3622474670410156, 0.3749847412109375, 0.3877220153808594, 0.40045928955078125, 0.4131965637207031, 0.425933837890625, 0.4386711120605469, 0.45140838623046875, 0.4641456604003906, 0.4768829345703125, 0.4896202087402344, 0.5023574829101562, 0.5150947570800781, 0.52783203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 24.0, 25.0, 36.0, 66.0, 79.0, 112.0, 203.0, 344.0, 590.0, 1212.0, 2682.0, 6696.0, 18508.0, 57879.0, 177341.0, 363160.0, 271995.0, 98717.0, 30668.0, 10392.0, 4075.0, 1746.0, 820.0, 442.0, 247.0, 144.0, 92.0, 66.0, 48.0, 29.0, 28.0, 17.0, 16.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08929443359375, -0.08638858795166016, -0.08348274230957031, -0.08057689666748047, -0.07767105102539062, -0.07476520538330078, -0.07185935974121094, -0.0689535140991211, -0.06604766845703125, -0.0631418228149414, -0.06023597717285156, -0.05733013153076172, -0.054424285888671875, -0.05151844024658203, -0.04861259460449219, -0.045706748962402344, -0.0428009033203125, -0.039895057678222656, -0.03698921203613281, -0.03408336639404297, -0.031177520751953125, -0.02827167510986328, -0.025365829467773438, -0.022459983825683594, -0.01955413818359375, -0.016648292541503906, -0.013742446899414062, -0.010836601257324219, -0.007930755615234375, -0.005024909973144531, -0.0021190643310546875, 0.0007867813110351562, 0.003692626953125, 0.006598472595214844, 0.009504318237304688, 0.012410163879394531, 0.015316009521484375, 0.01822185516357422, 0.021127700805664062, 0.024033546447753906, 0.02693939208984375, 0.029845237731933594, 0.03275108337402344, 0.03565692901611328, 0.038562774658203125, 0.04146862030029297, 0.04437446594238281, 0.047280311584472656, 0.0501861572265625, 0.053092002868652344, 0.05599784851074219, 0.05890369415283203, 0.061809539794921875, 0.06471538543701172, 0.06762123107910156, 0.0705270767211914, 0.07343292236328125, 0.0763387680053711, 0.07924461364746094, 0.08215045928955078, 0.08505630493164062, 0.08796215057373047, 0.09086799621582031, 0.09377384185791016, 0.0966796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 7.0, 11.0, 6.0, 14.0, 15.0, 14.0, 19.0, 19.0, 29.0, 17.0, 31.0, 30.0, 41.0, 57.0, 49.0, 55.0, 54.0, 47.0, 51.0, 54.0, 40.0, 41.0, 33.0, 45.0, 24.0, 31.0, 29.0, 21.0, 22.0, 23.0, 19.0, 9.0, 7.0, 8.0, 4.0, 5.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7169876098632812, -0.6947174072265625, -0.6724472045898438, -0.650177001953125, -0.6279067993164062, -0.6056365966796875, -0.5833663940429688, -0.56109619140625, -0.5388259887695312, -0.5165557861328125, -0.49428558349609375, -0.472015380859375, -0.44974517822265625, -0.4274749755859375, -0.40520477294921875, -0.3829345703125, -0.36066436767578125, -0.3383941650390625, -0.31612396240234375, -0.293853759765625, -0.27158355712890625, -0.2493133544921875, -0.22704315185546875, -0.20477294921875, -0.18250274658203125, -0.1602325439453125, -0.13796234130859375, -0.115692138671875, -0.09342193603515625, -0.0711517333984375, -0.04888153076171875, -0.026611328125, -0.00434112548828125, 0.0179290771484375, 0.04019927978515625, 0.062469482421875, 0.08473968505859375, 0.1070098876953125, 0.12928009033203125, 0.15155029296875, 0.17382049560546875, 0.1960906982421875, 0.21836090087890625, 0.240631103515625, 0.26290130615234375, 0.2851715087890625, 0.30744171142578125, 0.3297119140625, 0.35198211669921875, 0.3742523193359375, 0.39652252197265625, 0.418792724609375, 0.44106292724609375, 0.4633331298828125, 0.48560333251953125, 0.50787353515625, 0.5301437377929688, 0.5524139404296875, 0.5746841430664062, 0.596954345703125, 0.6192245483398438, 0.6414947509765625, 0.6637649536132812, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 3.0, 6.0, 11.0, 16.0, 25.0, 32.0, 40.0, 57.0, 87.0, 148.0, 206.0, 331.0, 580.0, 1066.0, 2283.0, 5903.0, 19447.0, 89647.0, 467854.0, 371172.0, 65071.0, 15232.0, 4835.0, 1948.0, 951.0, 565.0, 337.0, 235.0, 142.0, 95.0, 66.0, 45.0, 32.0, 18.0, 13.0, 10.0, 10.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.048370361328125, -0.0467529296875, -0.045135498046875, -0.04351806640625, -0.041900634765625, -0.040283203125, -0.038665771484375, -0.03704833984375, -0.035430908203125, -0.0338134765625, -0.032196044921875, -0.03057861328125, -0.028961181640625, -0.02734375, -0.025726318359375, -0.02410888671875, -0.022491455078125, -0.0208740234375, -0.019256591796875, -0.01763916015625, -0.016021728515625, -0.014404296875, -0.012786865234375, -0.01116943359375, -0.009552001953125, -0.0079345703125, -0.006317138671875, -0.00469970703125, -0.003082275390625, -0.00146484375, 0.000152587890625, 0.00177001953125, 0.003387451171875, 0.0050048828125, 0.006622314453125, 0.00823974609375, 0.009857177734375, 0.011474609375, 0.013092041015625, 0.01470947265625, 0.016326904296875, 0.0179443359375, 0.019561767578125, 0.02117919921875, 0.022796630859375, 0.0244140625, 0.026031494140625, 0.02764892578125, 0.029266357421875, 0.0308837890625, 0.032501220703125, 0.03411865234375, 0.035736083984375, 0.037353515625, 0.038970947265625, 0.04058837890625, 0.042205810546875, 0.0438232421875, 0.045440673828125, 0.04705810546875, 0.048675537109375, 0.05029296875, 0.051910400390625, 0.05352783203125, 0.055145263671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 18.0, 21.0, 19.0, 33.0, 33.0, 56.0, 64.0, 76.0, 97.0, 95.0, 103.0, 81.0, 71.0, 53.0, 30.0, 30.0, 24.0, 16.0, 8.0, 18.0, 9.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6240403056144714e-05, -1.5672296285629272e-05, -1.510418951511383e-05, -1.4536082744598389e-05, -1.3967975974082947e-05, -1.3399869203567505e-05, -1.2831762433052063e-05, -1.2263655662536621e-05, -1.169554889202118e-05, -1.1127442121505737e-05, -1.0559335350990295e-05, -9.991228580474854e-06, -9.423121809959412e-06, -8.85501503944397e-06, -8.286908268928528e-06, -7.718801498413086e-06, -7.150694727897644e-06, -6.582587957382202e-06, -6.01448118686676e-06, -5.446374416351318e-06, -4.8782676458358765e-06, -4.3101608753204346e-06, -3.7420541048049927e-06, -3.1739473342895508e-06, -2.605840563774109e-06, -2.037733793258667e-06, -1.469627022743225e-06, -9.015202522277832e-07, -3.334134817123413e-07, 2.3469328880310059e-07, 8.028000593185425e-07, 1.3709068298339844e-06, 1.9390136003494263e-06, 2.507120370864868e-06, 3.07522714138031e-06, 3.643333911895752e-06, 4.211440682411194e-06, 4.779547452926636e-06, 5.347654223442078e-06, 5.9157609939575195e-06, 6.4838677644729614e-06, 7.051974534988403e-06, 7.620081305503845e-06, 8.188188076019287e-06, 8.756294846534729e-06, 9.324401617050171e-06, 9.892508387565613e-06, 1.0460615158081055e-05, 1.1028721928596497e-05, 1.1596828699111938e-05, 1.216493546962738e-05, 1.2733042240142822e-05, 1.3301149010658264e-05, 1.3869255781173706e-05, 1.4437362551689148e-05, 1.500546932220459e-05, 1.5573576092720032e-05, 1.6141682863235474e-05, 1.6709789633750916e-05, 1.7277896404266357e-05, 1.78460031747818e-05, 1.841410994529724e-05, 1.8982216715812683e-05, 1.9550323486328125e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 6.0, 5.0, 8.0, 10.0, 14.0, 12.0, 16.0, 20.0, 33.0, 36.0, 46.0, 93.0, 114.0, 160.0, 233.0, 404.0, 723.0, 1452.0, 3419.0, 9039.0, 29996.0, 115670.0, 427788.0, 340697.0, 83419.0, 22285.0, 7121.0, 2710.0, 1237.0, 627.0, 348.0, 209.0, 165.0, 111.0, 76.0, 45.0, 48.0, 34.0, 28.0, 25.0, 14.0, 13.0, 5.0, 12.0, 4.0, 6.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.047210693359375, -0.0457301139831543, -0.044249534606933594, -0.04276895523071289, -0.04128837585449219, -0.039807796478271484, -0.03832721710205078, -0.03684663772583008, -0.035366058349609375, -0.03388547897338867, -0.03240489959716797, -0.030924320220947266, -0.029443740844726562, -0.02796316146850586, -0.026482582092285156, -0.025002002716064453, -0.02352142333984375, -0.022040843963623047, -0.020560264587402344, -0.01907968521118164, -0.017599105834960938, -0.016118526458740234, -0.014637947082519531, -0.013157367706298828, -0.011676788330078125, -0.010196208953857422, -0.008715629577636719, -0.007235050201416016, -0.0057544708251953125, -0.004273891448974609, -0.0027933120727539062, -0.0013127326965332031, 0.0001678466796875, 0.0016484260559082031, 0.0031290054321289062, 0.004609584808349609, 0.0060901641845703125, 0.007570743560791016, 0.009051322937011719, 0.010531902313232422, 0.012012481689453125, 0.013493061065673828, 0.014973640441894531, 0.016454219818115234, 0.017934799194335938, 0.01941537857055664, 0.020895957946777344, 0.022376537322998047, 0.02385711669921875, 0.025337696075439453, 0.026818275451660156, 0.02829885482788086, 0.029779434204101562, 0.031260013580322266, 0.03274059295654297, 0.03422117233276367, 0.035701751708984375, 0.03718233108520508, 0.03866291046142578, 0.040143489837646484, 0.04162406921386719, 0.04310464859008789, 0.044585227966308594, 0.0460658073425293, 0.04754638671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 12.0, 7.0, 10.0, 14.0, 19.0, 16.0, 22.0, 39.0, 41.0, 55.0, 80.0, 90.0, 79.0, 87.0, 91.0, 69.0, 54.0, 55.0, 38.0, 35.0, 18.0, 20.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.011810302734375, -0.011343240737915039, -0.010876178741455078, -0.010409116744995117, -0.009942054748535156, -0.009474992752075195, -0.009007930755615234, -0.008540868759155273, -0.008073806762695312, -0.0076067447662353516, -0.007139682769775391, -0.00667262077331543, -0.006205558776855469, -0.005738496780395508, -0.005271434783935547, -0.004804372787475586, -0.004337310791015625, -0.003870248794555664, -0.003403186798095703, -0.002936124801635742, -0.0024690628051757812, -0.0020020008087158203, -0.0015349388122558594, -0.0010678768157958984, -0.0006008148193359375, -0.00013375282287597656, 0.0003333091735839844, 0.0008003711700439453, 0.0012674331665039062, 0.0017344951629638672, 0.002201557159423828, 0.002668619155883789, 0.00313568115234375, 0.003602743148803711, 0.004069805145263672, 0.004536867141723633, 0.005003929138183594, 0.005470991134643555, 0.005938053131103516, 0.0064051151275634766, 0.0068721771240234375, 0.0073392391204833984, 0.007806301116943359, 0.00827336311340332, 0.008740425109863281, 0.009207487106323242, 0.009674549102783203, 0.010141611099243164, 0.010608673095703125, 0.011075735092163086, 0.011542797088623047, 0.012009859085083008, 0.012476921081542969, 0.01294398307800293, 0.01341104507446289, 0.013878107070922852, 0.014345169067382812, 0.014812231063842773, 0.015279293060302734, 0.015746355056762695, 0.016213417053222656, 0.016680479049682617, 0.017147541046142578, 0.01761460304260254, 0.0180816650390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 10.0, 11.0, 36.0, 61.0, 138.0, 240.0, 229.0, 150.0, 77.0, 24.0, 19.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0677638053894043, -1.030988097190857, -0.9942123889923096, -0.9574366807937622, -0.9206609725952148, -0.8838852643966675, -0.8471095561981201, -0.8103338479995728, -0.7735581398010254, -0.736782431602478, -0.7000067234039307, -0.6632310152053833, -0.6264553070068359, -0.5896795988082886, -0.5529038906097412, -0.5161281824111938, -0.4793524742126465, -0.4425767660140991, -0.40580105781555176, -0.3690253496170044, -0.33224964141845703, -0.29547393321990967, -0.2586982250213623, -0.22192251682281494, -0.18514680862426758, -0.14837110042572021, -0.11159539222717285, -0.07481968402862549, -0.038043975830078125, -0.0012682676315307617, 0.0355074405670166, 0.07228314876556396, 0.10905873775482178, 0.14583444595336914, 0.1826101541519165, 0.21938586235046387, 0.25616157054901123, 0.2929372787475586, 0.32971298694610596, 0.3664886951446533, 0.4032644033432007, 0.44004011154174805, 0.4768158197402954, 0.5135915279388428, 0.5503672361373901, 0.5871429443359375, 0.6239186525344849, 0.6606943607330322, 0.6974700689315796, 0.734245777130127, 0.7710214853286743, 0.8077971935272217, 0.844572901725769, 0.8813486099243164, 0.9181243181228638, 0.9549000263214111, 0.9916757345199585, 1.0284514427185059, 1.0652271509170532, 1.1020028591156006, 1.138778567314148, 1.1755542755126953, 1.2123299837112427, 1.24910569190979, 1.2858814001083374]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 11.0, 6.0, 15.0, 13.0, 19.0, 24.0, 22.0, 38.0, 40.0, 40.0, 49.0, 58.0, 46.0, 60.0, 58.0, 64.0, 65.0, 45.0, 50.0, 48.0, 46.0, 37.0, 37.0, 16.0, 14.0, 21.0, 9.0, 12.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35082903504371643, -0.3385494649410248, -0.32626989483833313, -0.3139903247356415, -0.30171075463294983, -0.28943121433258057, -0.2771516442298889, -0.26487207412719727, -0.2525925040245056, -0.24031293392181396, -0.22803336381912231, -0.21575379371643066, -0.2034742385149002, -0.19119466841220856, -0.1789150983095169, -0.16663554310798645, -0.1543559581041336, -0.14207638800144196, -0.1297968178987503, -0.11751725524663925, -0.1052376925945282, -0.09295812249183655, -0.0806785523891449, -0.06839898973703384, -0.056119419634342194, -0.04383985325694084, -0.03156028687953949, -0.01928071677684784, -0.007001150399446487, 0.0052784159779548645, 0.017557986080646515, 0.02983754873275757, 0.04211711883544922, 0.05439668521285057, 0.06667625159025192, 0.07895582169294357, 0.09123538434505463, 0.10351495444774628, 0.11579452455043793, 0.12807407975196838, 0.14035364985466003, 0.15263321995735168, 0.16491279006004333, 0.17719236016273499, 0.18947191536426544, 0.2017514854669571, 0.21403105556964874, 0.2263106107711792, 0.23859019577503204, 0.2508697509765625, 0.26314932107925415, 0.2754288911819458, 0.28770846128463745, 0.2999880313873291, 0.31226760149002075, 0.3245471715927124, 0.33682674169540405, 0.3491063117980957, 0.36138588190078735, 0.373665452003479, 0.38594502210617065, 0.3982245922088623, 0.41050416231155396, 0.4227837026119232, 0.43506327271461487]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 3.0, 7.0, 19.0, 28.0, 27.0, 43.0, 65.0, 107.0, 148.0, 272.0, 553.0, 1120.0, 2513.0, 5900.0, 14517.0, 37565.0, 109914.0, 356735.0, 350034.0, 107702.0, 36617.0, 13998.0, 5797.0, 2497.0, 1083.0, 505.0, 300.0, 172.0, 102.0, 61.0, 48.0, 33.0, 22.0, 16.0, 12.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.22534751892089844, -0.21595382690429688, -0.2065601348876953, -0.19716644287109375, -0.1877727508544922, -0.17837905883789062, -0.16898536682128906, -0.1595916748046875, -0.15019798278808594, -0.14080429077148438, -0.1314105987548828, -0.12201690673828125, -0.11262321472167969, -0.10322952270507812, -0.09383583068847656, -0.084442138671875, -0.07504844665527344, -0.06565475463867188, -0.05626106262207031, -0.04686737060546875, -0.03747367858886719, -0.028079986572265625, -0.018686294555664062, -0.0092926025390625, 0.0001010894775390625, 0.009494781494140625, 0.018888473510742188, 0.02828216552734375, 0.03767585754394531, 0.047069549560546875, 0.05646324157714844, 0.06585693359375, 0.07525062561035156, 0.08464431762695312, 0.09403800964355469, 0.10343170166015625, 0.11282539367675781, 0.12221908569335938, 0.13161277770996094, 0.1410064697265625, 0.15040016174316406, 0.15979385375976562, 0.1691875457763672, 0.17858123779296875, 0.1879749298095703, 0.19736862182617188, 0.20676231384277344, 0.216156005859375, 0.22554969787597656, 0.23494338989257812, 0.2443370819091797, 0.25373077392578125, 0.2631244659423828, 0.2725181579589844, 0.28191184997558594, 0.2913055419921875, 0.30069923400878906, 0.3100929260253906, 0.3194866180419922, 0.32888031005859375, 0.3382740020751953, 0.3476676940917969, 0.35706138610839844, 0.366455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 9.0, 6.0, 12.0, 15.0, 12.0, 21.0, 16.0, 31.0, 32.0, 34.0, 42.0, 50.0, 57.0, 50.0, 57.0, 61.0, 66.0, 66.0, 53.0, 52.0, 58.0, 44.0, 31.0, 34.0, 25.0, 14.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.6701889038085938, -0.6440887451171875, -0.6179885864257812, -0.591888427734375, -0.5657882690429688, -0.5396881103515625, -0.5135879516601562, -0.48748779296875, -0.46138763427734375, -0.4352874755859375, -0.40918731689453125, -0.383087158203125, -0.35698699951171875, -0.3308868408203125, -0.30478668212890625, -0.2786865234375, -0.25258636474609375, -0.2264862060546875, -0.20038604736328125, -0.174285888671875, -0.14818572998046875, -0.1220855712890625, -0.09598541259765625, -0.06988525390625, -0.04378509521484375, -0.0176849365234375, 0.00841522216796875, 0.034515380859375, 0.06061553955078125, 0.0867156982421875, 0.11281585693359375, 0.138916015625, 0.16501617431640625, 0.1911163330078125, 0.21721649169921875, 0.243316650390625, 0.26941680908203125, 0.2955169677734375, 0.32161712646484375, 0.34771728515625, 0.37381744384765625, 0.3999176025390625, 0.42601776123046875, 0.452117919921875, 0.47821807861328125, 0.5043182373046875, 0.5304183959960938, 0.5565185546875, 0.5826187133789062, 0.6087188720703125, 0.6348190307617188, 0.660919189453125, 0.6870193481445312, 0.7131195068359375, 0.7392196655273438, 0.76531982421875, 0.7914199829101562, 0.8175201416015625, 0.8436203002929688, 0.869720458984375, 0.8958206176757812, 0.9219207763671875, 0.9480209350585938, 0.97412109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 7.0, 3.0, 5.0, 5.0, 4.0, 7.0, 11.0, 14.0, 14.0, 27.0, 30.0, 39.0, 48.0, 62.0, 98.0, 129.0, 226.0, 302.0, 536.0, 1519.0, 7905.0, 71193.0, 753522.0, 192087.0, 16397.0, 2520.0, 727.0, 340.0, 217.0, 158.0, 110.0, 69.0, 42.0, 52.0, 31.0, 26.0, 11.0, 11.0, 13.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.650390625, -0.6298599243164062, -0.6093292236328125, -0.5887985229492188, -0.568267822265625, -0.5477371215820312, -0.5272064208984375, -0.5066757202148438, -0.48614501953125, -0.46561431884765625, -0.4450836181640625, -0.42455291748046875, -0.404022216796875, -0.38349151611328125, -0.3629608154296875, -0.34243011474609375, -0.3218994140625, -0.30136871337890625, -0.2808380126953125, -0.26030731201171875, -0.239776611328125, -0.21924591064453125, -0.1987152099609375, -0.17818450927734375, -0.15765380859375, -0.13712310791015625, -0.1165924072265625, -0.09606170654296875, -0.075531005859375, -0.05500030517578125, -0.0344696044921875, -0.01393890380859375, 0.006591796875, 0.02712249755859375, 0.0476531982421875, 0.06818389892578125, 0.088714599609375, 0.10924530029296875, 0.1297760009765625, 0.15030670166015625, 0.17083740234375, 0.19136810302734375, 0.2118988037109375, 0.23242950439453125, 0.252960205078125, 0.27349090576171875, 0.2940216064453125, 0.31455230712890625, 0.3350830078125, 0.35561370849609375, 0.3761444091796875, 0.39667510986328125, 0.417205810546875, 0.43773651123046875, 0.4582672119140625, 0.47879791259765625, 0.49932861328125, 0.5198593139648438, 0.5403900146484375, 0.5609207153320312, 0.581451416015625, 0.6019821166992188, 0.6225128173828125, 0.6430435180664062, 0.66357421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 5.0, 9.0, 8.0, 9.0, 9.0, 12.0, 20.0, 20.0, 30.0, 22.0, 29.0, 30.0, 41.0, 38.0, 43.0, 46.0, 54.0, 50.0, 58.0, 47.0, 51.0, 53.0, 50.0, 35.0, 34.0, 29.0, 26.0, 18.0, 31.0, 19.0, 14.0, 11.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88818359375, -0.861114501953125, -0.83404541015625, -0.806976318359375, -0.7799072265625, -0.752838134765625, -0.72576904296875, -0.698699951171875, -0.671630859375, -0.644561767578125, -0.61749267578125, -0.590423583984375, -0.5633544921875, -0.536285400390625, -0.50921630859375, -0.482147216796875, -0.455078125, -0.428009033203125, -0.40093994140625, -0.373870849609375, -0.3468017578125, -0.319732666015625, -0.29266357421875, -0.265594482421875, -0.238525390625, -0.211456298828125, -0.18438720703125, -0.157318115234375, -0.1302490234375, -0.103179931640625, -0.07611083984375, -0.049041748046875, -0.02197265625, 0.005096435546875, 0.03216552734375, 0.059234619140625, 0.0863037109375, 0.113372802734375, 0.14044189453125, 0.167510986328125, 0.194580078125, 0.221649169921875, 0.24871826171875, 0.275787353515625, 0.3028564453125, 0.329925537109375, 0.35699462890625, 0.384063720703125, 0.4111328125, 0.438201904296875, 0.46527099609375, 0.492340087890625, 0.5194091796875, 0.546478271484375, 0.57354736328125, 0.600616455078125, 0.627685546875, 0.654754638671875, 0.68182373046875, 0.708892822265625, 0.7359619140625, 0.763031005859375, 0.79010009765625, 0.817169189453125, 0.84423828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 6.0, 17.0, 19.0, 20.0, 34.0, 46.0, 82.0, 167.0, 327.0, 774.0, 2513.0, 11641.0, 130166.0, 814545.0, 76487.0, 8435.0, 1901.0, 689.0, 293.0, 116.0, 88.0, 41.0, 35.0, 21.0, 22.0, 13.0, 10.0, 7.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.2477283477783203, -0.23984146118164062, -0.23195457458496094, -0.22406768798828125, -0.21618080139160156, -0.20829391479492188, -0.2004070281982422, -0.1925201416015625, -0.1846332550048828, -0.17674636840820312, -0.16885948181152344, -0.16097259521484375, -0.15308570861816406, -0.14519882202148438, -0.1373119354248047, -0.129425048828125, -0.12153816223144531, -0.11365127563476562, -0.10576438903808594, -0.09787750244140625, -0.08999061584472656, -0.08210372924804688, -0.07421684265136719, -0.0663299560546875, -0.05844306945800781, -0.050556182861328125, -0.04266929626464844, -0.03478240966796875, -0.026895523071289062, -0.019008636474609375, -0.011121749877929688, -0.00323486328125, 0.0046520233154296875, 0.012538909912109375, 0.020425796508789062, 0.02831268310546875, 0.03619956970214844, 0.044086456298828125, 0.05197334289550781, 0.0598602294921875, 0.06774711608886719, 0.07563400268554688, 0.08352088928222656, 0.09140777587890625, 0.09929466247558594, 0.10718154907226562, 0.11506843566894531, 0.122955322265625, 0.1308422088623047, 0.13872909545898438, 0.14661598205566406, 0.15450286865234375, 0.16238975524902344, 0.17027664184570312, 0.1781635284423828, 0.1860504150390625, 0.1939373016357422, 0.20182418823242188, 0.20971107482910156, 0.21759796142578125, 0.22548484802246094, 0.23337173461914062, 0.2412586212158203, 0.2491455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 7.0, 10.0, 7.0, 14.0, 15.0, 36.0, 50.0, 56.0, 60.0, 86.0, 104.0, 105.0, 110.0, 80.0, 72.0, 51.0, 36.0, 25.0, 17.0, 17.0, 11.0, 11.0, 3.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4318695068359375e-05, -2.360902726650238e-05, -2.2899359464645386e-05, -2.218969166278839e-05, -2.1480023860931396e-05, -2.0770356059074402e-05, -2.0060688257217407e-05, -1.9351020455360413e-05, -1.8641352653503418e-05, -1.7931684851646423e-05, -1.722201704978943e-05, -1.6512349247932434e-05, -1.580268144607544e-05, -1.5093013644218445e-05, -1.438334584236145e-05, -1.3673678040504456e-05, -1.2964010238647461e-05, -1.2254342436790466e-05, -1.1544674634933472e-05, -1.0835006833076477e-05, -1.0125339031219482e-05, -9.415671229362488e-06, -8.706003427505493e-06, -7.996335625648499e-06, -7.286667823791504e-06, -6.577000021934509e-06, -5.867332220077515e-06, -5.15766441822052e-06, -4.447996616363525e-06, -3.7383288145065308e-06, -3.028661012649536e-06, -2.3189932107925415e-06, -1.6093254089355469e-06, -8.996576070785522e-07, -1.8998980522155762e-07, 5.19677996635437e-07, 1.2293457984924316e-06, 1.9390136003494263e-06, 2.648681402206421e-06, 3.3583492040634155e-06, 4.06801700592041e-06, 4.777684807777405e-06, 5.487352609634399e-06, 6.197020411491394e-06, 6.906688213348389e-06, 7.616356015205383e-06, 8.326023817062378e-06, 9.035691618919373e-06, 9.745359420776367e-06, 1.0455027222633362e-05, 1.1164695024490356e-05, 1.1874362826347351e-05, 1.2584030628204346e-05, 1.329369843006134e-05, 1.4003366231918335e-05, 1.471303403377533e-05, 1.5422701835632324e-05, 1.613236963748932e-05, 1.6842037439346313e-05, 1.7551705241203308e-05, 1.8261373043060303e-05, 1.8971040844917297e-05, 1.9680708646774292e-05, 2.0390376448631287e-05, 2.110004425048828e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 16.0, 10.0, 25.0, 57.0, 145.0, 426.0, 1487.0, 10354.0, 589397.0, 435936.0, 8742.0, 1339.0, 352.0, 116.0, 51.0, 32.0, 18.0, 15.0, 11.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443359375, -0.4290428161621094, -0.41472625732421875, -0.4004096984863281, -0.3860931396484375, -0.3717765808105469, -0.35746002197265625, -0.3431434631347656, -0.328826904296875, -0.3145103454589844, -0.30019378662109375, -0.2858772277832031, -0.2715606689453125, -0.2572441101074219, -0.24292755126953125, -0.22861099243164062, -0.21429443359375, -0.19997787475585938, -0.18566131591796875, -0.17134475708007812, -0.1570281982421875, -0.14271163940429688, -0.12839508056640625, -0.11407852172851562, -0.099761962890625, -0.08544540405273438, -0.07112884521484375, -0.056812286376953125, -0.0424957275390625, -0.028179168701171875, -0.01386260986328125, 0.000453948974609375, 0.0147705078125, 0.029087066650390625, 0.04340362548828125, 0.057720184326171875, 0.0720367431640625, 0.08635330200195312, 0.10066986083984375, 0.11498641967773438, 0.129302978515625, 0.14361953735351562, 0.15793609619140625, 0.17225265502929688, 0.1865692138671875, 0.20088577270507812, 0.21520233154296875, 0.22951889038085938, 0.24383544921875, 0.2581520080566406, 0.27246856689453125, 0.2867851257324219, 0.3011016845703125, 0.3154182434082031, 0.32973480224609375, 0.3440513610839844, 0.358367919921875, 0.3726844787597656, 0.38700103759765625, 0.4013175964355469, 0.4156341552734375, 0.4299507141113281, 0.44426727294921875, 0.4585838317871094, 0.472900390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 13.0, 16.0, 18.0, 23.0, 50.0, 73.0, 97.0, 98.0, 126.0, 139.0, 94.0, 84.0, 48.0, 33.0, 22.0, 18.0, 6.0, 12.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1092529296875, -0.10600852966308594, -0.10276412963867188, -0.09951972961425781, -0.09627532958984375, -0.09303092956542969, -0.08978652954101562, -0.08654212951660156, -0.0832977294921875, -0.08005332946777344, -0.07680892944335938, -0.07356452941894531, -0.07032012939453125, -0.06707572937011719, -0.06383132934570312, -0.06058692932128906, -0.057342529296875, -0.05409812927246094, -0.050853729248046875, -0.04760932922363281, -0.04436492919921875, -0.04112052917480469, -0.037876129150390625, -0.03463172912597656, -0.0313873291015625, -0.028142929077148438, -0.024898529052734375, -0.021654129028320312, -0.01840972900390625, -0.015165328979492188, -0.011920928955078125, -0.008676528930664062, -0.00543212890625, -0.0021877288818359375, 0.001056671142578125, 0.0043010711669921875, 0.00754547119140625, 0.010789871215820312, 0.014034271240234375, 0.017278671264648438, 0.0205230712890625, 0.023767471313476562, 0.027011871337890625, 0.030256271362304688, 0.03350067138671875, 0.03674507141113281, 0.039989471435546875, 0.04323387145996094, 0.046478271484375, 0.04972267150878906, 0.052967071533203125, 0.05621147155761719, 0.05945587158203125, 0.06270027160644531, 0.06594467163085938, 0.06918907165527344, 0.0724334716796875, 0.07567787170410156, 0.07892227172851562, 0.08216667175292969, 0.08541107177734375, 0.08865547180175781, 0.09189987182617188, 0.09514427185058594, 0.098388671875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 11.0, 28.0, 41.0, 108.0, 200.0, 215.0, 168.0, 112.0, 58.0, 33.0, 13.0, 9.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0269415378570557, -1.9604947566986084, -1.8940480947494507, -1.8276013135910034, -1.7611546516418457, -1.6947078704833984, -1.6282610893249512, -1.5618144273757935, -1.4953677654266357, -1.4289209842681885, -1.3624743223190308, -1.2960275411605835, -1.2295808792114258, -1.1631340980529785, -1.0966873168945312, -1.0302406549453735, -0.9637938737869263, -0.8973471522331238, -0.8309004306793213, -0.764453649520874, -0.6980069875717163, -0.631560206413269, -0.5651134848594666, -0.49866676330566406, -0.4322200417518616, -0.3657733201980591, -0.2993265986442566, -0.2328798472881317, -0.16643312573432922, -0.09998640418052673, -0.033539652824401855, 0.032907068729400635, 0.09935379028320312, 0.16580051183700562, 0.2322472482919693, 0.298693984746933, 0.3651407063007355, 0.43158742785453796, 0.49803417921066284, 0.5644809007644653, 0.6309276223182678, 0.6973743438720703, 0.7638210654258728, 0.8302677869796753, 0.8967145681381226, 0.9631612300872803, 1.0296080112457275, 1.0960547924041748, 1.1625014543533325, 1.2289482355117798, 1.2953948974609375, 1.3618416786193848, 1.4282883405685425, 1.4947351217269897, 1.5611817836761475, 1.6276285648345947, 1.694075345993042, 1.7605221271514893, 1.826968789100647, 1.8934155702590942, 1.959862232208252, 2.026309013366699, 2.0927557945251465, 2.1592025756835938, 2.225649118423462]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 3.0, 6.0, 11.0, 12.0, 15.0, 28.0, 16.0, 19.0, 27.0, 27.0, 31.0, 30.0, 32.0, 32.0, 44.0, 34.0, 45.0, 44.0, 32.0, 39.0, 47.0, 37.0, 40.0, 27.0, 40.0, 35.0, 34.0, 25.0, 25.0, 20.0, 21.0, 22.0, 14.0, 9.0, 9.0, 13.0, 8.0, 8.0, 8.0, 7.0, 1.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.2735111713409424, -1.2335801124572754, -1.1936490535736084, -1.1537179946899414, -1.1137869358062744, -1.0738558769226074, -1.0339248180389404, -0.9939937591552734, -0.9540627002716064, -0.9141316413879395, -0.8742005825042725, -0.8342695236206055, -0.7943384647369385, -0.7544074058532715, -0.7144763469696045, -0.6745452880859375, -0.6346142888069153, -0.5946832299232483, -0.5547521710395813, -0.5148211121559143, -0.4748900532722473, -0.4349589943885803, -0.3950279653072357, -0.3550969064235687, -0.31516584753990173, -0.27523478865623474, -0.23530372977256775, -0.19537268579006195, -0.15544162690639496, -0.11551056802272797, -0.07557952404022217, -0.035648465156555176, 0.004282593727111816, 0.04421364888548851, 0.0841447040438652, 0.1240757554769516, 0.1640068143606186, 0.20393787324428558, 0.24386891722679138, 0.2837999761104584, 0.32373103499412537, 0.36366209387779236, 0.40359315276145935, 0.44352418184280396, 0.48345524072647095, 0.5233862996101379, 0.5633173584938049, 0.6032484173774719, 0.6431794762611389, 0.6831105351448059, 0.7230415940284729, 0.7629726529121399, 0.8029037117958069, 0.8428347706794739, 0.8827657699584961, 0.9226968288421631, 0.9626278877258301, 1.002558946609497, 1.042490005493164, 1.082421064376831, 1.122352123260498, 1.162283182144165, 1.202214241027832, 1.242145299911499, 1.282076358795166]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 15.0, 23.0, 60.0, 130.0, 272.0, 924.0, 3951.0, 30457.0, 1034001.0, 3014338.0, 100824.0, 7126.0, 1410.0, 431.0, 168.0, 64.0, 38.0, 14.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4619140625, -1.4226226806640625, -1.383331298828125, -1.3440399169921875, -1.30474853515625, -1.2654571533203125, -1.226165771484375, -1.1868743896484375, -1.1475830078125, -1.1082916259765625, -1.069000244140625, -1.0297088623046875, -0.99041748046875, -0.9511260986328125, -0.911834716796875, -0.8725433349609375, -0.833251953125, -0.7939605712890625, -0.754669189453125, -0.7153778076171875, -0.67608642578125, -0.6367950439453125, -0.597503662109375, -0.5582122802734375, -0.5189208984375, -0.4796295166015625, -0.440338134765625, -0.4010467529296875, -0.36175537109375, -0.3224639892578125, -0.283172607421875, -0.2438812255859375, -0.20458984375, -0.1652984619140625, -0.126007080078125, -0.0867156982421875, -0.04742431640625, -0.0081329345703125, 0.031158447265625, 0.0704498291015625, 0.1097412109375, 0.1490325927734375, 0.188323974609375, 0.2276153564453125, 0.26690673828125, 0.3061981201171875, 0.345489501953125, 0.3847808837890625, 0.424072265625, 0.4633636474609375, 0.502655029296875, 0.5419464111328125, 0.58123779296875, 0.6205291748046875, 0.659820556640625, 0.6991119384765625, 0.7384033203125, 0.7776947021484375, 0.816986083984375, 0.8562774658203125, 0.89556884765625, 0.9348602294921875, 0.974151611328125, 1.0134429931640625, 1.052734375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 1.0, 5.0, 13.0, 11.0, 19.0, 26.0, 20.0, 31.0, 24.0, 27.0, 36.0, 36.0, 44.0, 46.0, 55.0, 46.0, 62.0, 63.0, 45.0, 53.0, 41.0, 42.0, 41.0, 40.0, 36.0, 24.0, 25.0, 17.0, 19.0, 10.0, 9.0, 11.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.40061187744140625, -0.3852081298828125, -0.36980438232421875, -0.354400634765625, -0.33899688720703125, -0.3235931396484375, -0.30818939208984375, -0.29278564453125, -0.27738189697265625, -0.2619781494140625, -0.24657440185546875, -0.231170654296875, -0.21576690673828125, -0.2003631591796875, -0.18495941162109375, -0.1695556640625, -0.15415191650390625, -0.1387481689453125, -0.12334442138671875, -0.107940673828125, -0.09253692626953125, -0.0771331787109375, -0.06172943115234375, -0.04632568359375, -0.03092193603515625, -0.0155181884765625, -0.00011444091796875, 0.015289306640625, 0.03069305419921875, 0.0460968017578125, 0.06150054931640625, 0.076904296875, 0.09230804443359375, 0.1077117919921875, 0.12311553955078125, 0.138519287109375, 0.15392303466796875, 0.1693267822265625, 0.18473052978515625, 0.20013427734375, 0.21553802490234375, 0.2309417724609375, 0.24634552001953125, 0.261749267578125, 0.27715301513671875, 0.2925567626953125, 0.30796051025390625, 0.3233642578125, 0.33876800537109375, 0.3541717529296875, 0.36957550048828125, 0.384979248046875, 0.40038299560546875, 0.4157867431640625, 0.43119049072265625, 0.44659423828125, 0.46199798583984375, 0.4774017333984375, 0.49280548095703125, 0.508209228515625, 0.5236129760742188, 0.5390167236328125, 0.5544204711914062, 0.56982421875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 12.0, 11.0, 14.0, 23.0, 26.0, 58.0, 67.0, 172.0, 354.0, 936.0, 3207.0, 21596.0, 698238.0, 3400197.0, 60594.0, 6214.0, 1492.0, 531.0, 235.0, 116.0, 52.0, 47.0, 24.0, 11.0, 15.0, 9.0, 2.0, 10.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8564453125, -0.81951904296875, -0.7825927734375, -0.74566650390625, -0.708740234375, -0.67181396484375, -0.6348876953125, -0.59796142578125, -0.56103515625, -0.52410888671875, -0.4871826171875, -0.45025634765625, -0.413330078125, -0.37640380859375, -0.3394775390625, -0.30255126953125, -0.265625, -0.22869873046875, -0.1917724609375, -0.15484619140625, -0.117919921875, -0.08099365234375, -0.0440673828125, -0.00714111328125, 0.02978515625, 0.06671142578125, 0.1036376953125, 0.14056396484375, 0.177490234375, 0.21441650390625, 0.2513427734375, 0.28826904296875, 0.3251953125, 0.36212158203125, 0.3990478515625, 0.43597412109375, 0.472900390625, 0.50982666015625, 0.5467529296875, 0.58367919921875, 0.62060546875, 0.65753173828125, 0.6944580078125, 0.73138427734375, 0.768310546875, 0.80523681640625, 0.8421630859375, 0.87908935546875, 0.916015625, 0.95294189453125, 0.9898681640625, 1.02679443359375, 1.063720703125, 1.10064697265625, 1.1375732421875, 1.17449951171875, 1.21142578125, 1.24835205078125, 1.2852783203125, 1.32220458984375, 1.359130859375, 1.39605712890625, 1.4329833984375, 1.46990966796875, 1.5068359375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 6.0, 6.0, 9.0, 10.0, 11.0, 17.0, 29.0, 31.0, 72.0, 88.0, 129.0, 208.0, 376.0, 577.0, 658.0, 610.0, 470.0, 262.0, 194.0, 111.0, 69.0, 37.0, 27.0, 21.0, 11.0, 10.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.310302734375, -0.3030357360839844, -0.29576873779296875, -0.2885017395019531, -0.2812347412109375, -0.2739677429199219, -0.26670074462890625, -0.2594337463378906, -0.252166748046875, -0.24489974975585938, -0.23763275146484375, -0.23036575317382812, -0.2230987548828125, -0.21583175659179688, -0.20856475830078125, -0.20129776000976562, -0.19403076171875, -0.18676376342773438, -0.17949676513671875, -0.17222976684570312, -0.1649627685546875, -0.15769577026367188, -0.15042877197265625, -0.14316177368164062, -0.135894775390625, -0.12862777709960938, -0.12136077880859375, -0.11409378051757812, -0.1068267822265625, -0.09955978393554688, -0.09229278564453125, -0.08502578735351562, -0.0777587890625, -0.07049179077148438, -0.06322479248046875, -0.055957794189453125, -0.0486907958984375, -0.041423797607421875, -0.03415679931640625, -0.026889801025390625, -0.019622802734375, -0.012355804443359375, -0.00508880615234375, 0.002178192138671875, 0.0094451904296875, 0.016712188720703125, 0.02397918701171875, 0.031246185302734375, 0.03851318359375, 0.045780181884765625, 0.05304718017578125, 0.060314178466796875, 0.0675811767578125, 0.07484817504882812, 0.08211517333984375, 0.08938217163085938, 0.096649169921875, 0.10391616821289062, 0.11118316650390625, 0.11845016479492188, 0.1257171630859375, 0.13298416137695312, 0.14025115966796875, 0.14751815795898438, 0.15478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 13.0, 39.0, 91.0, 134.0, 163.0, 200.0, 159.0, 82.0, 44.0, 40.0, 17.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09526526927948, -1.0481679439544678, -1.001070499420166, -0.953973114490509, -0.906875729560852, -0.8597783446311951, -0.8126809597015381, -0.7655835747718811, -0.7184861898422241, -0.6713888049125671, -0.6242914199829102, -0.5771940350532532, -0.5300966501235962, -0.4829992651939392, -0.4359018802642822, -0.38880449533462524, -0.34170711040496826, -0.2946097254753113, -0.2475123405456543, -0.20041495561599731, -0.15331757068634033, -0.10622018575668335, -0.05912280082702637, -0.012025415897369385, 0.0350719690322876, 0.08216935396194458, 0.12926673889160156, 0.17636412382125854, 0.22346150875091553, 0.2705588936805725, 0.3176562786102295, 0.3647536635398865, 0.4118509292602539, 0.4589483141899109, 0.5060456991195679, 0.5531430840492249, 0.6002404689788818, 0.6473378539085388, 0.6944352388381958, 0.7415326237678528, 0.7886300086975098, 0.8357273936271667, 0.8828247785568237, 0.9299221634864807, 0.9770195484161377, 1.0241169929504395, 1.0712143182754517, 1.1183116436004639, 1.1654090881347656, 1.2125065326690674, 1.2596038579940796, 1.3067011833190918, 1.3537986278533936, 1.4008960723876953, 1.4479933977127075, 1.4950907230377197, 1.5421881675720215, 1.5892856121063232, 1.6363829374313354, 1.6834802627563477, 1.7305777072906494, 1.7776751518249512, 1.8247724771499634, 1.8718698024749756, 1.9189672470092773]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 12.0, 15.0, 10.0, 21.0, 20.0, 24.0, 28.0, 20.0, 28.0, 41.0, 44.0, 42.0, 51.0, 48.0, 57.0, 55.0, 48.0, 53.0, 46.0, 43.0, 41.0, 42.0, 25.0, 25.0, 31.0, 30.0, 26.0, 15.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.40488138794898987, -0.38882824778556824, -0.3727750778198242, -0.3567219376564026, -0.34066879749298096, -0.3246156573295593, -0.3085625171661377, -0.2925093472003937, -0.27645620703697205, -0.2604030668735504, -0.2443499118089676, -0.22829675674438477, -0.21224361658096313, -0.1961904764175415, -0.18013732135295868, -0.16408416628837585, -0.14803102612495422, -0.1319778859615326, -0.11592473089694977, -0.09987158328294754, -0.08381843566894531, -0.06776528805494308, -0.05171214044094086, -0.03565899282693863, -0.0196058452129364, -0.0035526975989341736, 0.012500450015068054, 0.028553597629070282, 0.04460674524307251, 0.06065989285707474, 0.07671304047107697, 0.0927661880850792, 0.10881936550140381, 0.12487251311540604, 0.14092566072940826, 0.1569788157939911, 0.17303195595741272, 0.18908509612083435, 0.20513825118541718, 0.22119140625, 0.23724454641342163, 0.25329768657684326, 0.2693508267402649, 0.2854039967060089, 0.30145713686943054, 0.3175102770328522, 0.3335634469985962, 0.3496165871620178, 0.36566972732543945, 0.3817228674888611, 0.3977760076522827, 0.41382917761802673, 0.42988231778144836, 0.44593545794487, 0.461988627910614, 0.47804176807403564, 0.4940949082374573, 0.5101480484008789, 0.5262011885643005, 0.5422543287277222, 0.5583075284957886, 0.5743606686592102, 0.5904138088226318, 0.6064669489860535, 0.6225200891494751]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 8.0, 12.0, 16.0, 26.0, 21.0, 46.0, 68.0, 108.0, 159.0, 292.0, 636.0, 1449.0, 3833.0, 11894.0, 42100.0, 164031.0, 427039.0, 286683.0, 78944.0, 20720.0, 6357.0, 2248.0, 855.0, 421.0, 207.0, 129.0, 79.0, 47.0, 40.0, 27.0, 12.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1368408203125, -0.1330108642578125, -0.129180908203125, -0.1253509521484375, -0.12152099609375, -0.1176910400390625, -0.113861083984375, -0.1100311279296875, -0.106201171875, -0.1023712158203125, -0.098541259765625, -0.0947113037109375, -0.09088134765625, -0.0870513916015625, -0.083221435546875, -0.0793914794921875, -0.0755615234375, -0.0717315673828125, -0.067901611328125, -0.0640716552734375, -0.06024169921875, -0.0564117431640625, -0.052581787109375, -0.0487518310546875, -0.044921875, -0.0410919189453125, -0.037261962890625, -0.0334320068359375, -0.02960205078125, -0.0257720947265625, -0.021942138671875, -0.0181121826171875, -0.0142822265625, -0.0104522705078125, -0.006622314453125, -0.0027923583984375, 0.00103759765625, 0.0048675537109375, 0.008697509765625, 0.0125274658203125, 0.016357421875, 0.0201873779296875, 0.024017333984375, 0.0278472900390625, 0.03167724609375, 0.0355072021484375, 0.039337158203125, 0.0431671142578125, 0.0469970703125, 0.0508270263671875, 0.054656982421875, 0.0584869384765625, 0.06231689453125, 0.0661468505859375, 0.069976806640625, 0.0738067626953125, 0.07763671875, 0.0814666748046875, 0.085296630859375, 0.0891265869140625, 0.09295654296875, 0.0967864990234375, 0.100616455078125, 0.1044464111328125, 0.1082763671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 10.0, 9.0, 13.0, 12.0, 23.0, 13.0, 24.0, 29.0, 46.0, 29.0, 36.0, 45.0, 57.0, 45.0, 53.0, 59.0, 60.0, 56.0, 51.0, 37.0, 46.0, 31.0, 51.0, 29.0, 26.0, 24.0, 15.0, 19.0, 5.0, 13.0, 8.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2836151123046875, -0.272064208984375, -0.2605133056640625, -0.24896240234375, -0.2374114990234375, -0.225860595703125, -0.2143096923828125, -0.2027587890625, -0.1912078857421875, -0.179656982421875, -0.1681060791015625, -0.15655517578125, -0.1450042724609375, -0.133453369140625, -0.1219024658203125, -0.1103515625, -0.0988006591796875, -0.087249755859375, -0.0756988525390625, -0.06414794921875, -0.0525970458984375, -0.041046142578125, -0.0294952392578125, -0.0179443359375, -0.0063934326171875, 0.005157470703125, 0.0167083740234375, 0.02825927734375, 0.0398101806640625, 0.051361083984375, 0.0629119873046875, 0.074462890625, 0.0860137939453125, 0.097564697265625, 0.1091156005859375, 0.12066650390625, 0.1322174072265625, 0.143768310546875, 0.1553192138671875, 0.1668701171875, 0.1784210205078125, 0.189971923828125, 0.2015228271484375, 0.21307373046875, 0.2246246337890625, 0.236175537109375, 0.2477264404296875, 0.25927734375, 0.2708282470703125, 0.282379150390625, 0.2939300537109375, 0.30548095703125, 0.3170318603515625, 0.328582763671875, 0.3401336669921875, 0.3516845703125, 0.3632354736328125, 0.374786376953125, 0.3863372802734375, 0.39788818359375, 0.4094390869140625, 0.420989990234375, 0.4325408935546875, 0.444091796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 19.0, 18.0, 39.0, 54.0, 81.0, 129.0, 174.0, 270.0, 476.0, 861.0, 1736.0, 3832.0, 9270.0, 24702.0, 73936.0, 211075.0, 358425.0, 233172.0, 83733.0, 27924.0, 10128.0, 4215.0, 1889.0, 927.0, 556.0, 314.0, 185.0, 125.0, 76.0, 43.0, 30.0, 31.0, 8.0, 30.0, 11.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.09382247924804688, -0.09102630615234375, -0.08823013305664062, -0.0854339599609375, -0.08263778686523438, -0.07984161376953125, -0.07704544067382812, -0.074249267578125, -0.07145309448242188, -0.06865692138671875, -0.06586074829101562, -0.0630645751953125, -0.060268402099609375, -0.05747222900390625, -0.054676055908203125, -0.0518798828125, -0.049083709716796875, -0.04628753662109375, -0.043491363525390625, -0.0406951904296875, -0.037899017333984375, -0.03510284423828125, -0.032306671142578125, -0.029510498046875, -0.026714324951171875, -0.02391815185546875, -0.021121978759765625, -0.0183258056640625, -0.015529632568359375, -0.01273345947265625, -0.009937286376953125, -0.00714111328125, -0.004344940185546875, -0.00154876708984375, 0.001247406005859375, 0.0040435791015625, 0.006839752197265625, 0.00963592529296875, 0.012432098388671875, 0.015228271484375, 0.018024444580078125, 0.02082061767578125, 0.023616790771484375, 0.0264129638671875, 0.029209136962890625, 0.03200531005859375, 0.034801483154296875, 0.03759765625, 0.040393829345703125, 0.04319000244140625, 0.045986175537109375, 0.0487823486328125, 0.051578521728515625, 0.05437469482421875, 0.057170867919921875, 0.059967041015625, 0.06276321411132812, 0.06555938720703125, 0.06835556030273438, 0.0711517333984375, 0.07394790649414062, 0.07674407958984375, 0.07954025268554688, 0.08233642578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 7.0, 7.0, 15.0, 11.0, 15.0, 16.0, 18.0, 41.0, 29.0, 24.0, 42.0, 40.0, 43.0, 39.0, 40.0, 42.0, 49.0, 42.0, 45.0, 34.0, 38.0, 48.0, 29.0, 32.0, 37.0, 34.0, 25.0, 20.0, 25.0, 18.0, 11.0, 14.0, 10.0, 9.0, 8.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.583984375, -0.5640716552734375, -0.544158935546875, -0.5242462158203125, -0.50433349609375, -0.4844207763671875, -0.464508056640625, -0.4445953369140625, -0.4246826171875, -0.4047698974609375, -0.384857177734375, -0.3649444580078125, -0.34503173828125, -0.3251190185546875, -0.305206298828125, -0.2852935791015625, -0.265380859375, -0.2454681396484375, -0.225555419921875, -0.2056427001953125, -0.18572998046875, -0.1658172607421875, -0.145904541015625, -0.1259918212890625, -0.1060791015625, -0.0861663818359375, -0.066253662109375, -0.0463409423828125, -0.02642822265625, -0.0065155029296875, 0.013397216796875, 0.0333099365234375, 0.05322265625, 0.0731353759765625, 0.093048095703125, 0.1129608154296875, 0.13287353515625, 0.1527862548828125, 0.172698974609375, 0.1926116943359375, 0.2125244140625, 0.2324371337890625, 0.252349853515625, 0.2722625732421875, 0.29217529296875, 0.3120880126953125, 0.332000732421875, 0.3519134521484375, 0.371826171875, 0.3917388916015625, 0.411651611328125, 0.4315643310546875, 0.45147705078125, 0.4713897705078125, 0.491302490234375, 0.5112152099609375, 0.5311279296875, 0.5510406494140625, 0.570953369140625, 0.5908660888671875, 0.61077880859375, 0.6306915283203125, 0.650604248046875, 0.6705169677734375, 0.6904296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 10.0, 9.0, 13.0, 10.0, 15.0, 26.0, 23.0, 41.0, 60.0, 56.0, 144.0, 203.0, 263.0, 455.0, 683.0, 1195.0, 2250.0, 4232.0, 9876.0, 26835.0, 85813.0, 266557.0, 388989.0, 175222.0, 53426.0, 17718.0, 6955.0, 3228.0, 1674.0, 961.0, 567.0, 335.0, 229.0, 145.0, 95.0, 66.0, 52.0, 33.0, 27.0, 20.0, 15.0, 7.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0323486328125, -0.0312809944152832, -0.030213356018066406, -0.02914571762084961, -0.028078079223632812, -0.027010440826416016, -0.02594280242919922, -0.024875164031982422, -0.023807525634765625, -0.022739887237548828, -0.02167224884033203, -0.020604610443115234, -0.019536972045898438, -0.01846933364868164, -0.017401695251464844, -0.016334056854248047, -0.01526641845703125, -0.014198780059814453, -0.013131141662597656, -0.01206350326538086, -0.010995864868164062, -0.009928226470947266, -0.008860588073730469, -0.007792949676513672, -0.006725311279296875, -0.005657672882080078, -0.004590034484863281, -0.0035223960876464844, -0.0024547576904296875, -0.0013871192932128906, -0.00031948089599609375, 0.0007481575012207031, 0.0018157958984375, 0.002883434295654297, 0.003951072692871094, 0.005018711090087891, 0.0060863494873046875, 0.007153987884521484, 0.008221626281738281, 0.009289264678955078, 0.010356903076171875, 0.011424541473388672, 0.012492179870605469, 0.013559818267822266, 0.014627456665039062, 0.01569509506225586, 0.016762733459472656, 0.017830371856689453, 0.01889801025390625, 0.019965648651123047, 0.021033287048339844, 0.02210092544555664, 0.023168563842773438, 0.024236202239990234, 0.02530384063720703, 0.026371479034423828, 0.027439117431640625, 0.028506755828857422, 0.02957439422607422, 0.030642032623291016, 0.03170967102050781, 0.03277730941772461, 0.033844947814941406, 0.0349125862121582, 0.035980224609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 13.0, 15.0, 15.0, 10.0, 22.0, 13.0, 22.0, 30.0, 32.0, 33.0, 48.0, 70.0, 48.0, 62.0, 53.0, 62.0, 63.0, 65.0, 43.0, 44.0, 40.0, 41.0, 30.0, 36.0, 19.0, 12.0, 11.0, 9.0, 3.0, 6.0, 5.0, 2.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3172626495361328e-05, -1.280568540096283e-05, -1.2438744306564331e-05, -1.2071803212165833e-05, -1.1704862117767334e-05, -1.1337921023368835e-05, -1.0970979928970337e-05, -1.0604038834571838e-05, -1.023709774017334e-05, -9.870156645774841e-06, -9.503215551376343e-06, -9.136274456977844e-06, -8.769333362579346e-06, -8.402392268180847e-06, -8.035451173782349e-06, -7.66851007938385e-06, -7.3015689849853516e-06, -6.934627890586853e-06, -6.5676867961883545e-06, -6.200745701789856e-06, -5.833804607391357e-06, -5.466863512992859e-06, -5.09992241859436e-06, -4.732981324195862e-06, -4.366040229797363e-06, -3.999099135398865e-06, -3.632158041000366e-06, -3.2652169466018677e-06, -2.898275852203369e-06, -2.5313347578048706e-06, -2.164393663406372e-06, -1.7974525690078735e-06, -1.430511474609375e-06, -1.0635703802108765e-06, -6.966292858123779e-07, -3.296881914138794e-07, 3.725290298461914e-08, 4.041939973831177e-07, 7.711350917816162e-07, 1.1380761861801147e-06, 1.5050172805786133e-06, 1.8719583749771118e-06, 2.2388994693756104e-06, 2.605840563774109e-06, 2.9727816581726074e-06, 3.339722752571106e-06, 3.7066638469696045e-06, 4.073604941368103e-06, 4.4405460357666016e-06, 4.8074871301651e-06, 5.174428224563599e-06, 5.541369318962097e-06, 5.908310413360596e-06, 6.275251507759094e-06, 6.642192602157593e-06, 7.009133696556091e-06, 7.37607479095459e-06, 7.743015885353088e-06, 8.109956979751587e-06, 8.476898074150085e-06, 8.843839168548584e-06, 9.210780262947083e-06, 9.577721357345581e-06, 9.94466245174408e-06, 1.0311603546142578e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 12.0, 7.0, 6.0, 10.0, 16.0, 14.0, 15.0, 20.0, 46.0, 57.0, 80.0, 143.0, 231.0, 435.0, 783.0, 1524.0, 3559.0, 8997.0, 29013.0, 118462.0, 431052.0, 338629.0, 81752.0, 21144.0, 6911.0, 2758.0, 1296.0, 624.0, 347.0, 218.0, 141.0, 84.0, 43.0, 29.0, 22.0, 23.0, 6.0, 10.0, 11.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041290283203125, -0.03986024856567383, -0.038430213928222656, -0.037000179290771484, -0.03557014465332031, -0.03414011001586914, -0.03271007537841797, -0.0312800407409668, -0.029850006103515625, -0.028419971466064453, -0.02698993682861328, -0.02555990219116211, -0.024129867553710938, -0.022699832916259766, -0.021269798278808594, -0.019839763641357422, -0.01840972900390625, -0.016979694366455078, -0.015549659729003906, -0.014119625091552734, -0.012689590454101562, -0.01125955581665039, -0.009829521179199219, -0.008399486541748047, -0.006969451904296875, -0.005539417266845703, -0.004109382629394531, -0.0026793479919433594, -0.0012493133544921875, 0.00018072128295898438, 0.0016107559204101562, 0.003040790557861328, 0.0044708251953125, 0.005900859832763672, 0.007330894470214844, 0.008760929107666016, 0.010190963745117188, 0.01162099838256836, 0.013051033020019531, 0.014481067657470703, 0.015911102294921875, 0.017341136932373047, 0.01877117156982422, 0.02020120620727539, 0.021631240844726562, 0.023061275482177734, 0.024491310119628906, 0.025921344757080078, 0.02735137939453125, 0.028781414031982422, 0.030211448669433594, 0.031641483306884766, 0.03307151794433594, 0.03450155258178711, 0.03593158721923828, 0.03736162185668945, 0.038791656494140625, 0.0402216911315918, 0.04165172576904297, 0.04308176040649414, 0.04451179504394531, 0.045941829681396484, 0.047371864318847656, 0.04880189895629883, 0.05023193359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 12.0, 10.0, 13.0, 13.0, 16.0, 14.0, 29.0, 29.0, 35.0, 33.0, 58.0, 67.0, 78.0, 92.0, 91.0, 57.0, 61.0, 51.0, 42.0, 40.0, 32.0, 20.0, 19.0, 13.0, 20.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0122222900390625, -0.011849761009216309, -0.011477231979370117, -0.011104702949523926, -0.010732173919677734, -0.010359644889831543, -0.009987115859985352, -0.00961458683013916, -0.009242057800292969, -0.008869528770446777, -0.008496999740600586, -0.008124470710754395, -0.007751941680908203, -0.007379412651062012, -0.00700688362121582, -0.006634354591369629, -0.0062618255615234375, -0.005889296531677246, -0.005516767501831055, -0.005144238471984863, -0.004771709442138672, -0.0043991804122924805, -0.004026651382446289, -0.0036541223526000977, -0.0032815933227539062, -0.002909064292907715, -0.0025365352630615234, -0.002164006233215332, -0.0017914772033691406, -0.0014189481735229492, -0.0010464191436767578, -0.0006738901138305664, -0.000301361083984375, 7.11679458618164e-05, 0.0004436969757080078, 0.0008162260055541992, 0.0011887550354003906, 0.001561284065246582, 0.0019338130950927734, 0.002306342124938965, 0.0026788711547851562, 0.0030514001846313477, 0.003423929214477539, 0.0037964582443237305, 0.004168987274169922, 0.004541516304016113, 0.004914045333862305, 0.005286574363708496, 0.0056591033935546875, 0.006031632423400879, 0.00640416145324707, 0.006776690483093262, 0.007149219512939453, 0.0075217485427856445, 0.007894277572631836, 0.008266806602478027, 0.008639335632324219, 0.00901186466217041, 0.009384393692016602, 0.009756922721862793, 0.010129451751708984, 0.010501980781555176, 0.010874509811401367, 0.011247038841247559, 0.01161956787109375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 27.0, 94.0, 220.0, 258.0, 201.0, 117.0, 46.0, 15.0, 5.0, 6.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8341423869132996, -0.793684720993042, -0.7532271146774292, -0.7127695083618164, -0.6723118424415588, -0.6318541765213013, -0.5913965702056885, -0.5509389638900757, -0.5104812979698181, -0.47002366185188293, -0.42956602573394775, -0.3891083896160126, -0.3486507534980774, -0.3081931173801422, -0.26773548126220703, -0.22727784514427185, -0.18682020902633667, -0.1463625729084015, -0.10590493679046631, -0.06544730067253113, -0.024989664554595947, 0.015467971563339233, 0.055925607681274414, 0.0963832437992096, 0.13684087991714478, 0.17729851603507996, 0.21775615215301514, 0.2582137882709503, 0.2986714243888855, 0.3391290605068207, 0.37958669662475586, 0.42004433274269104, 0.460502028465271, 0.5009596347808838, 0.5414173007011414, 0.5818749666213989, 0.6223325729370117, 0.6627901792526245, 0.7032478451728821, 0.7437055110931396, 0.7841631174087524, 0.8246207237243652, 0.8650783896446228, 0.9055360555648804, 0.9459936618804932, 0.986451268196106, 1.0269088745117188, 1.067366600036621, 1.1078242063522339, 1.1482818126678467, 1.188739538192749, 1.2291971445083618, 1.2696547508239746, 1.3101123571395874, 1.3505699634552002, 1.3910276889801025, 1.4314852952957153, 1.4719429016113281, 1.5124006271362305, 1.5528582334518433, 1.593315839767456, 1.6337734460830688, 1.6742310523986816, 1.714688777923584, 1.7551463842391968]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 12.0, 14.0, 19.0, 21.0, 34.0, 34.0, 35.0, 40.0, 50.0, 55.0, 64.0, 56.0, 66.0, 67.0, 56.0, 53.0, 45.0, 50.0, 34.0, 36.0, 36.0, 31.0, 18.0, 14.0, 4.0, 11.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31671202182769775, -0.30428546667099, -0.29185888171195984, -0.2794323265552521, -0.2670057713985443, -0.25457918643951416, -0.2421526312828064, -0.22972607612609863, -0.21729950606822968, -0.20487293601036072, -0.19244638085365295, -0.180019810795784, -0.16759324073791504, -0.15516668558120728, -0.14274011552333832, -0.13031354546546936, -0.1178869903087616, -0.10546042770147324, -0.09303386509418488, -0.08060729503631592, -0.06818073242902756, -0.0557541698217392, -0.04332759976387024, -0.03090103715658188, -0.018474474549293518, -0.006047910079360008, 0.006378654390573502, 0.01880522072315216, 0.03123178333044052, 0.04365834593772888, 0.05608491599559784, 0.0685114786028862, 0.08093807101249695, 0.09336463361978531, 0.10579119622707367, 0.11821776628494263, 0.1306443214416504, 0.14307089149951935, 0.1554974615573883, 0.16792401671409607, 0.18035058677196503, 0.19277715682983398, 0.20520371198654175, 0.2176302820444107, 0.23005685210227966, 0.24248340725898743, 0.2549099922180176, 0.26733654737472534, 0.2797631025314331, 0.29218965768814087, 0.304616242647171, 0.3170427978038788, 0.32946935296058655, 0.3418959379196167, 0.35432249307632446, 0.3667490482330322, 0.37917560338974, 0.39160215854644775, 0.4040287435054779, 0.41645529866218567, 0.42888185381889343, 0.4413084387779236, 0.45373499393463135, 0.4661615490913391, 0.47858813405036926]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 5.0, 6.0, 16.0, 19.0, 41.0, 38.0, 78.0, 162.0, 226.0, 510.0, 1171.0, 2705.0, 7232.0, 21500.0, 83171.0, 466813.0, 368636.0, 67193.0, 18309.0, 6205.0, 2419.0, 1046.0, 512.0, 228.0, 116.0, 72.0, 47.0, 25.0, 16.0, 12.0, 12.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3696403503417969, -0.35768890380859375, -0.3457374572753906, -0.3337860107421875, -0.3218345642089844, -0.30988311767578125, -0.2979316711425781, -0.285980224609375, -0.2740287780761719, -0.26207733154296875, -0.2501258850097656, -0.2381744384765625, -0.22622299194335938, -0.21427154541015625, -0.20232009887695312, -0.19036865234375, -0.17841720581054688, -0.16646575927734375, -0.15451431274414062, -0.1425628662109375, -0.13061141967773438, -0.11865997314453125, -0.10670852661132812, -0.094757080078125, -0.08280563354492188, -0.07085418701171875, -0.058902740478515625, -0.0469512939453125, -0.034999847412109375, -0.02304840087890625, -0.011096954345703125, 0.0008544921875, 0.012805938720703125, 0.02475738525390625, 0.036708831787109375, 0.0486602783203125, 0.060611724853515625, 0.07256317138671875, 0.08451461791992188, 0.096466064453125, 0.10841751098632812, 0.12036895751953125, 0.13232040405273438, 0.1442718505859375, 0.15622329711914062, 0.16817474365234375, 0.18012619018554688, 0.19207763671875, 0.20402908325195312, 0.21598052978515625, 0.22793197631835938, 0.2398834228515625, 0.2518348693847656, 0.26378631591796875, 0.2757377624511719, 0.287689208984375, 0.2996406555175781, 0.31159210205078125, 0.3235435485839844, 0.3354949951171875, 0.3474464416503906, 0.35939788818359375, 0.3713493347167969, 0.38330078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 14.0, 9.0, 19.0, 19.0, 29.0, 36.0, 46.0, 39.0, 58.0, 68.0, 68.0, 57.0, 70.0, 56.0, 62.0, 40.0, 63.0, 54.0, 40.0, 35.0, 29.0, 20.0, 16.0, 7.0, 7.0, 5.0, 9.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.78662109375, -0.7607421875, -0.73486328125, -0.708984375, -0.68310546875, -0.6572265625, -0.63134765625, -0.60546875, -0.57958984375, -0.5537109375, -0.52783203125, -0.501953125, -0.47607421875, -0.4501953125, -0.42431640625, -0.3984375, -0.37255859375, -0.3466796875, -0.32080078125, -0.294921875, -0.26904296875, -0.2431640625, -0.21728515625, -0.19140625, -0.16552734375, -0.1396484375, -0.11376953125, -0.087890625, -0.06201171875, -0.0361328125, -0.01025390625, 0.015625, 0.04150390625, 0.0673828125, 0.09326171875, 0.119140625, 0.14501953125, 0.1708984375, 0.19677734375, 0.22265625, 0.24853515625, 0.2744140625, 0.30029296875, 0.326171875, 0.35205078125, 0.3779296875, 0.40380859375, 0.4296875, 0.45556640625, 0.4814453125, 0.50732421875, 0.533203125, 0.55908203125, 0.5849609375, 0.61083984375, 0.63671875, 0.66259765625, 0.6884765625, 0.71435546875, 0.740234375, 0.76611328125, 0.7919921875, 0.81787109375, 0.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 11.0, 15.0, 17.0, 36.0, 44.0, 71.0, 114.0, 191.0, 417.0, 1218.0, 7938.0, 191515.0, 820853.0, 22495.0, 2383.0, 587.0, 244.0, 138.0, 88.0, 42.0, 23.0, 23.0, 19.0, 12.0, 9.0, 4.0, 2.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8066177368164062, -0.7758331298828125, -0.7450485229492188, -0.714263916015625, -0.6834793090820312, -0.6526947021484375, -0.6219100952148438, -0.59112548828125, -0.5603408813476562, -0.5295562744140625, -0.49877166748046875, -0.467987060546875, -0.43720245361328125, -0.4064178466796875, -0.37563323974609375, -0.3448486328125, -0.31406402587890625, -0.2832794189453125, -0.25249481201171875, -0.221710205078125, -0.19092559814453125, -0.1601409912109375, -0.12935638427734375, -0.09857177734375, -0.06778717041015625, -0.0370025634765625, -0.00621795654296875, 0.024566650390625, 0.05535125732421875, 0.0861358642578125, 0.11692047119140625, 0.147705078125, 0.17848968505859375, 0.2092742919921875, 0.24005889892578125, 0.270843505859375, 0.30162811279296875, 0.3324127197265625, 0.36319732666015625, 0.39398193359375, 0.42476654052734375, 0.4555511474609375, 0.48633575439453125, 0.517120361328125, 0.5479049682617188, 0.5786895751953125, 0.6094741821289062, 0.6402587890625, 0.6710433959960938, 0.7018280029296875, 0.7326126098632812, 0.763397216796875, 0.7941818237304688, 0.8249664306640625, 0.8557510375976562, 0.88653564453125, 0.9173202514648438, 0.9481048583984375, 0.9788894653320312, 1.009674072265625, 1.0404586791992188, 1.0712432861328125, 1.1020278930664062, 1.1328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 5.0, 11.0, 8.0, 9.0, 12.0, 11.0, 27.0, 33.0, 24.0, 26.0, 20.0, 44.0, 57.0, 46.0, 56.0, 47.0, 52.0, 56.0, 44.0, 58.0, 46.0, 43.0, 36.0, 37.0, 32.0, 27.0, 25.0, 13.0, 15.0, 15.0, 8.0, 14.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.8193435668945312, -0.7920074462890625, -0.7646713256835938, -0.737335205078125, -0.7099990844726562, -0.6826629638671875, -0.6553268432617188, -0.62799072265625, -0.6006546020507812, -0.5733184814453125, -0.5459823608398438, -0.518646240234375, -0.49131011962890625, -0.4639739990234375, -0.43663787841796875, -0.4093017578125, -0.38196563720703125, -0.3546295166015625, -0.32729339599609375, -0.299957275390625, -0.27262115478515625, -0.2452850341796875, -0.21794891357421875, -0.19061279296875, -0.16327667236328125, -0.1359405517578125, -0.10860443115234375, -0.081268310546875, -0.05393218994140625, -0.0265960693359375, 0.00074005126953125, 0.028076171875, 0.05541229248046875, 0.0827484130859375, 0.11008453369140625, 0.137420654296875, 0.16475677490234375, 0.1920928955078125, 0.21942901611328125, 0.24676513671875, 0.27410125732421875, 0.3014373779296875, 0.32877349853515625, 0.356109619140625, 0.38344573974609375, 0.4107818603515625, 0.43811798095703125, 0.4654541015625, 0.49279022216796875, 0.5201263427734375, 0.5474624633789062, 0.574798583984375, 0.6021347045898438, 0.6294708251953125, 0.6568069458007812, 0.68414306640625, 0.7114791870117188, 0.7388153076171875, 0.7661514282226562, 0.793487548828125, 0.8208236694335938, 0.8481597900390625, 0.8754959106445312, 0.90283203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 7.0, 5.0, 10.0, 13.0, 17.0, 25.0, 45.0, 69.0, 107.0, 167.0, 377.0, 1234.0, 5963.0, 76359.0, 878459.0, 77608.0, 5985.0, 1196.0, 412.0, 173.0, 94.0, 63.0, 42.0, 35.0, 14.0, 11.0, 6.0, 6.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3076171875, -0.2984352111816406, -0.28925323486328125, -0.2800712585449219, -0.2708892822265625, -0.2617073059082031, -0.25252532958984375, -0.24334335327148438, -0.234161376953125, -0.22497940063476562, -0.21579742431640625, -0.20661544799804688, -0.1974334716796875, -0.18825149536132812, -0.17906951904296875, -0.16988754272460938, -0.16070556640625, -0.15152359008789062, -0.14234161376953125, -0.13315963745117188, -0.1239776611328125, -0.11479568481445312, -0.10561370849609375, -0.09643173217773438, -0.087249755859375, -0.07806777954101562, -0.06888580322265625, -0.059703826904296875, -0.0505218505859375, -0.041339874267578125, -0.03215789794921875, -0.022975921630859375, -0.0137939453125, -0.004611968994140625, 0.00457000732421875, 0.013751983642578125, 0.0229339599609375, 0.032115936279296875, 0.04129791259765625, 0.050479888916015625, 0.059661865234375, 0.06884384155273438, 0.07802581787109375, 0.08720779418945312, 0.0963897705078125, 0.10557174682617188, 0.11475372314453125, 0.12393569946289062, 0.13311767578125, 0.14229965209960938, 0.15148162841796875, 0.16066360473632812, 0.1698455810546875, 0.17902755737304688, 0.18820953369140625, 0.19739151000976562, 0.206573486328125, 0.21575546264648438, 0.22493743896484375, 0.23411941528320312, 0.2433013916015625, 0.2524833679199219, 0.26166534423828125, 0.2708473205566406, 0.280029296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 0.0, 7.0, 9.0, 5.0, 10.0, 17.0, 26.0, 26.0, 34.0, 54.0, 84.0, 111.0, 145.0, 133.0, 86.0, 48.0, 66.0, 35.0, 27.0, 17.0, 17.0, 14.0, 8.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.135204315185547e-05, -3.054458647966385e-05, -2.973712980747223e-05, -2.892967313528061e-05, -2.812221646308899e-05, -2.731475979089737e-05, -2.650730311870575e-05, -2.569984644651413e-05, -2.489238977432251e-05, -2.408493310213089e-05, -2.327747642993927e-05, -2.247001975774765e-05, -2.166256308555603e-05, -2.085510641336441e-05, -2.004764974117279e-05, -1.924019306898117e-05, -1.843273639678955e-05, -1.762527972459793e-05, -1.681782305240631e-05, -1.601036638021469e-05, -1.5202909708023071e-05, -1.4395453035831451e-05, -1.3587996363639832e-05, -1.2780539691448212e-05, -1.1973083019256592e-05, -1.1165626347064972e-05, -1.0358169674873352e-05, -9.550713002681732e-06, -8.743256330490112e-06, -7.935799658298492e-06, -7.1283429861068726e-06, -6.320886313915253e-06, -5.513429641723633e-06, -4.705972969532013e-06, -3.898516297340393e-06, -3.091059625148773e-06, -2.2836029529571533e-06, -1.4761462807655334e-06, -6.686896085739136e-07, 1.387670636177063e-07, 9.462237358093262e-07, 1.753680408000946e-06, 2.561137080192566e-06, 3.368593752384186e-06, 4.176050424575806e-06, 4.9835070967674255e-06, 5.790963768959045e-06, 6.598420441150665e-06, 7.405877113342285e-06, 8.213333785533905e-06, 9.020790457725525e-06, 9.828247129917145e-06, 1.0635703802108765e-05, 1.1443160474300385e-05, 1.2250617146492004e-05, 1.3058073818683624e-05, 1.3865530490875244e-05, 1.4672987163066864e-05, 1.5480443835258484e-05, 1.6287900507450104e-05, 1.7095357179641724e-05, 1.7902813851833344e-05, 1.8710270524024963e-05, 1.9517727196216583e-05, 2.0325183868408203e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 4.0, 13.0, 19.0, 20.0, 40.0, 69.0, 149.0, 421.0, 1455.0, 9556.0, 644755.0, 382424.0, 7721.0, 1226.0, 355.0, 147.0, 60.0, 35.0, 16.0, 22.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5576629638671875, -0.542572021484375, -0.5274810791015625, -0.51239013671875, -0.4972991943359375, -0.482208251953125, -0.4671173095703125, -0.4520263671875, -0.4369354248046875, -0.421844482421875, -0.4067535400390625, -0.39166259765625, -0.3765716552734375, -0.361480712890625, -0.3463897705078125, -0.331298828125, -0.3162078857421875, -0.301116943359375, -0.2860260009765625, -0.27093505859375, -0.2558441162109375, -0.240753173828125, -0.2256622314453125, -0.2105712890625, -0.1954803466796875, -0.180389404296875, -0.1652984619140625, -0.15020751953125, -0.1351165771484375, -0.120025634765625, -0.1049346923828125, -0.08984375, -0.0747528076171875, -0.059661865234375, -0.0445709228515625, -0.02947998046875, -0.0143890380859375, 0.000701904296875, 0.0157928466796875, 0.0308837890625, 0.0459747314453125, 0.061065673828125, 0.0761566162109375, 0.09124755859375, 0.1063385009765625, 0.121429443359375, 0.1365203857421875, 0.151611328125, 0.1667022705078125, 0.181793212890625, 0.1968841552734375, 0.21197509765625, 0.2270660400390625, 0.242156982421875, 0.2572479248046875, 0.2723388671875, 0.2874298095703125, 0.302520751953125, 0.3176116943359375, 0.33270263671875, 0.3477935791015625, 0.362884521484375, 0.3779754638671875, 0.39306640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 14.0, 13.0, 18.0, 34.0, 38.0, 55.0, 89.0, 135.0, 165.0, 146.0, 76.0, 70.0, 40.0, 20.0, 20.0, 13.0, 15.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08575439453125, -0.08226490020751953, -0.07877540588378906, -0.0752859115600586, -0.07179641723632812, -0.06830692291259766, -0.06481742858886719, -0.06132793426513672, -0.05783843994140625, -0.05434894561767578, -0.05085945129394531, -0.047369956970214844, -0.043880462646484375, -0.040390968322753906, -0.03690147399902344, -0.03341197967529297, -0.0299224853515625, -0.02643299102783203, -0.022943496704101562, -0.019454002380371094, -0.015964508056640625, -0.012475013732910156, -0.008985519409179688, -0.005496025085449219, -0.00200653076171875, 0.0014829635620117188, 0.0049724578857421875, 0.008461952209472656, 0.011951446533203125, 0.015440940856933594, 0.018930435180664062, 0.02241992950439453, 0.025909423828125, 0.02939891815185547, 0.03288841247558594, 0.036377906799316406, 0.039867401123046875, 0.043356895446777344, 0.04684638977050781, 0.05033588409423828, 0.05382537841796875, 0.05731487274169922, 0.06080436706542969, 0.06429386138916016, 0.06778335571289062, 0.0712728500366211, 0.07476234436035156, 0.07825183868408203, 0.0817413330078125, 0.08523082733154297, 0.08872032165527344, 0.0922098159790039, 0.09569931030273438, 0.09918880462646484, 0.10267829895019531, 0.10616779327392578, 0.10965728759765625, 0.11314678192138672, 0.11663627624511719, 0.12012577056884766, 0.12361526489257812, 0.1271047592163086, 0.13059425354003906, 0.13408374786376953, 0.1375732421875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 18.0, 55.0, 173.0, 293.0, 237.0, 146.0, 52.0, 20.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2860541343688965, -1.1938409805297852, -1.1016277074813843, -1.009414553642273, -0.9172013998031616, -0.8249881863594055, -0.7327749729156494, -0.6405618190765381, -0.548348605632782, -0.45613542199134827, -0.36392223834991455, -0.27170902490615845, -0.17949584126472473, -0.08728265762329102, 0.004930555820465088, 0.09714370965957642, 0.18935692310333252, 0.28157010674476624, 0.37378329038619995, 0.46599650382995605, 0.5582096576690674, 0.6504228711128235, 0.7426360845565796, 0.8348492383956909, 0.927062451839447, 1.0192756652832031, 1.1114888191223145, 1.2037019729614258, 1.2959152460098267, 1.388128399848938, 1.4803416728973389, 1.5725548267364502, 1.6647679805755615, 1.7569811344146729, 1.8491944074630737, 1.941407561302185, 2.033620834350586, 2.1258339881896973, 2.2180471420288086, 2.31026029586792, 2.4024734497070312, 2.4946866035461426, 2.586899757385254, 2.6791129112243652, 2.7713263034820557, 2.863539457321167, 2.9557526111602783, 3.0479657649993896, 3.14017915725708, 3.2323923110961914, 3.3246054649353027, 3.416818618774414, 3.5090320110321045, 3.601245164871216, 3.693458318710327, 3.7856714725494385, 3.87788462638855, 3.970097780227661, 4.062311172485352, 4.154524326324463, 4.246737480163574, 4.3389506340026855, 4.431163787841797, 4.523376941680908, 4.6155900955200195]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 7.0, 8.0, 10.0, 14.0, 21.0, 17.0, 26.0, 22.0, 35.0, 28.0, 31.0, 34.0, 35.0, 42.0, 49.0, 36.0, 48.0, 54.0, 31.0, 39.0, 41.0, 40.0, 47.0, 35.0, 34.0, 43.0, 33.0, 24.0, 19.0, 20.0, 12.0, 7.0, 8.0, 12.0, 7.0, 6.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0779831409454346, -1.0378050804138184, -0.9976270198822021, -0.9574488997459412, -0.917270839214325, -0.8770927786827087, -0.8369146585464478, -0.7967365980148315, -0.7565585374832153, -0.7163804769515991, -0.6762024164199829, -0.6360242962837219, -0.5958462357521057, -0.5556681752204895, -0.5154900550842285, -0.4753119945526123, -0.4351339340209961, -0.3949558734893799, -0.3547777831554413, -0.3145996928215027, -0.2744216322898865, -0.23424355685710907, -0.19406548142433167, -0.15388739109039307, -0.11370933055877686, -0.07353125512599945, -0.033353179693222046, 0.006824895739555359, 0.047002971172332764, 0.08718104660511017, 0.12735912203788757, 0.16753721237182617, 0.20771539211273193, 0.24789346754550934, 0.28807154297828674, 0.32824963331222534, 0.36842769384384155, 0.40860575437545776, 0.44878384470939636, 0.48896193504333496, 0.5291399955749512, 0.5693180561065674, 0.6094961166381836, 0.6496742367744446, 0.6898522973060608, 0.730030357837677, 0.770208477973938, 0.8103865385055542, 0.8505645990371704, 0.8907426595687866, 0.9309207201004028, 0.9710988402366638, 1.0112769603729248, 1.051455020904541, 1.0916330814361572, 1.1318111419677734, 1.1719892024993896, 1.2121672630310059, 1.252345323562622, 1.2925233840942383, 1.3327014446258545, 1.3728796243667603, 1.4130576848983765, 1.4532357454299927, 1.4934138059616089]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 12.0, 21.0, 31.0, 47.0, 77.0, 139.0, 299.0, 729.0, 2176.0, 6624.0, 27428.0, 275643.0, 2705078.0, 1089752.0, 71983.0, 9853.0, 2531.0, 920.0, 413.0, 216.0, 116.0, 70.0, 41.0, 19.0, 30.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.072265625, -1.0459442138671875, -1.019622802734375, -0.9933013916015625, -0.96697998046875, -0.9406585693359375, -0.914337158203125, -0.8880157470703125, -0.8616943359375, -0.8353729248046875, -0.809051513671875, -0.7827301025390625, -0.75640869140625, -0.7300872802734375, -0.703765869140625, -0.6774444580078125, -0.651123046875, -0.6248016357421875, -0.598480224609375, -0.5721588134765625, -0.54583740234375, -0.5195159912109375, -0.493194580078125, -0.4668731689453125, -0.4405517578125, -0.4142303466796875, -0.387908935546875, -0.3615875244140625, -0.33526611328125, -0.3089447021484375, -0.282623291015625, -0.2563018798828125, -0.22998046875, -0.2036590576171875, -0.177337646484375, -0.1510162353515625, -0.12469482421875, -0.0983734130859375, -0.072052001953125, -0.0457305908203125, -0.0194091796875, 0.0069122314453125, 0.033233642578125, 0.0595550537109375, 0.08587646484375, 0.1121978759765625, 0.138519287109375, 0.1648406982421875, 0.191162109375, 0.2174835205078125, 0.243804931640625, 0.2701263427734375, 0.29644775390625, 0.3227691650390625, 0.349090576171875, 0.3754119873046875, 0.4017333984375, 0.4280548095703125, 0.454376220703125, 0.4806976318359375, 0.50701904296875, 0.5333404541015625, 0.559661865234375, 0.5859832763671875, 0.6123046875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 4.0, 8.0, 20.0, 15.0, 19.0, 17.0, 39.0, 40.0, 52.0, 66.0, 83.0, 64.0, 76.0, 72.0, 89.0, 78.0, 61.0, 45.0, 44.0, 30.0, 32.0, 22.0, 15.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.39827728271484375, -0.3761444091796875, -0.35401153564453125, -0.331878662109375, -0.30974578857421875, -0.2876129150390625, -0.26548004150390625, -0.24334716796875, -0.22121429443359375, -0.1990814208984375, -0.17694854736328125, -0.154815673828125, -0.13268280029296875, -0.1105499267578125, -0.08841705322265625, -0.0662841796875, -0.04415130615234375, -0.0220184326171875, 0.00011444091796875, 0.022247314453125, 0.04438018798828125, 0.0665130615234375, 0.08864593505859375, 0.11077880859375, 0.13291168212890625, 0.1550445556640625, 0.17717742919921875, 0.199310302734375, 0.22144317626953125, 0.2435760498046875, 0.26570892333984375, 0.287841796875, 0.30997467041015625, 0.3321075439453125, 0.35424041748046875, 0.376373291015625, 0.39850616455078125, 0.4206390380859375, 0.44277191162109375, 0.46490478515625, 0.48703765869140625, 0.5091705322265625, 0.5313034057617188, 0.553436279296875, 0.5755691528320312, 0.5977020263671875, 0.6198348999023438, 0.6419677734375, 0.6641006469726562, 0.6862335205078125, 0.7083663940429688, 0.730499267578125, 0.7526321411132812, 0.7747650146484375, 0.7968978881835938, 0.81903076171875, 0.8411636352539062, 0.8632965087890625, 0.8854293823242188, 0.907562255859375, 0.9296951293945312, 0.9518280029296875, 0.9739608764648438, 0.99609375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 11.0, 16.0, 14.0, 26.0, 46.0, 76.0, 126.0, 376.0, 1076.0, 5457.0, 98179.0, 4005297.0, 77466.0, 4608.0, 922.0, 294.0, 118.0, 63.0, 28.0, 22.0, 13.0, 9.0, 9.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.80316162109375, -1.7508544921875, -1.69854736328125, -1.646240234375, -1.59393310546875, -1.5416259765625, -1.48931884765625, -1.43701171875, -1.38470458984375, -1.3323974609375, -1.28009033203125, -1.227783203125, -1.17547607421875, -1.1231689453125, -1.07086181640625, -1.0185546875, -0.96624755859375, -0.9139404296875, -0.86163330078125, -0.809326171875, -0.75701904296875, -0.7047119140625, -0.65240478515625, -0.60009765625, -0.54779052734375, -0.4954833984375, -0.44317626953125, -0.390869140625, -0.33856201171875, -0.2862548828125, -0.23394775390625, -0.181640625, -0.12933349609375, -0.0770263671875, -0.02471923828125, 0.027587890625, 0.07989501953125, 0.1322021484375, 0.18450927734375, 0.23681640625, 0.28912353515625, 0.3414306640625, 0.39373779296875, 0.446044921875, 0.49835205078125, 0.5506591796875, 0.60296630859375, 0.6552734375, 0.70758056640625, 0.7598876953125, 0.81219482421875, 0.864501953125, 0.91680908203125, 0.9691162109375, 1.02142333984375, 1.07373046875, 1.12603759765625, 1.1783447265625, 1.23065185546875, 1.282958984375, 1.33526611328125, 1.3875732421875, 1.43988037109375, 1.4921875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 4.0, 11.0, 20.0, 38.0, 75.0, 118.0, 253.0, 560.0, 878.0, 1031.0, 540.0, 233.0, 136.0, 63.0, 37.0, 20.0, 16.0, 10.0, 1.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2314453125, -0.2204742431640625, -0.209503173828125, -0.1985321044921875, -0.18756103515625, -0.1765899658203125, -0.165618896484375, -0.1546478271484375, -0.1436767578125, -0.1327056884765625, -0.121734619140625, -0.1107635498046875, -0.09979248046875, -0.0888214111328125, -0.077850341796875, -0.0668792724609375, -0.055908203125, -0.0449371337890625, -0.033966064453125, -0.0229949951171875, -0.01202392578125, -0.0010528564453125, 0.009918212890625, 0.0208892822265625, 0.0318603515625, 0.0428314208984375, 0.053802490234375, 0.0647735595703125, 0.07574462890625, 0.0867156982421875, 0.097686767578125, 0.1086578369140625, 0.11962890625, 0.1305999755859375, 0.141571044921875, 0.1525421142578125, 0.16351318359375, 0.1744842529296875, 0.185455322265625, 0.1964263916015625, 0.2073974609375, 0.2183685302734375, 0.229339599609375, 0.2403106689453125, 0.25128173828125, 0.2622528076171875, 0.273223876953125, 0.2841949462890625, 0.295166015625, 0.3061370849609375, 0.317108154296875, 0.3280792236328125, 0.33905029296875, 0.3500213623046875, 0.360992431640625, 0.3719635009765625, 0.3829345703125, 0.3939056396484375, 0.404876708984375, 0.4158477783203125, 0.42681884765625, 0.4377899169921875, 0.448760986328125, 0.4597320556640625, 0.470703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 35.0, 34.0, 71.0, 88.0, 131.0, 152.0, 126.0, 119.0, 89.0, 55.0, 36.0, 26.0, 13.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5778068900108337, -0.5397259593009949, -0.501645028591156, -0.4635641276836395, -0.42548322677612305, -0.3874022960662842, -0.3493213653564453, -0.31124046444892883, -0.27315953373908997, -0.2350786179304123, -0.19699770212173462, -0.15891677141189575, -0.12083585560321808, -0.0827549397945404, -0.04467400908470154, -0.006593108177185059, 0.03148782253265381, 0.06956873834133148, 0.10764966160058975, 0.14573058485984802, 0.1838115006685257, 0.22189241647720337, 0.25997334718704224, 0.2980542480945587, 0.3361351788043976, 0.37421610951423645, 0.41229701042175293, 0.4503779411315918, 0.48845887184143066, 0.5265398025512695, 0.5646207332611084, 0.6027016043663025, 0.6407824754714966, 0.6788634061813354, 0.7169443368911743, 0.7550252676010132, 0.7931061387062073, 0.8311870694160461, 0.869268000125885, 0.9073488712310791, 0.945429801940918, 0.9835107326507568, 1.0215916633605957, 1.0596725940704346, 1.0977535247802734, 1.1358344554901123, 1.1739153861999512, 1.2119961977005005, 1.250077247619629, 1.2881581783294678, 1.3262391090393066, 1.3643200397491455, 1.4024009704589844, 1.4404819011688232, 1.478562831878662, 1.5166436433792114, 1.5547245740890503, 1.5928055047988892, 1.630886435508728, 1.668967366218567, 1.7070482969284058, 1.745129108428955, 1.783210039138794, 1.8212909698486328, 1.8593719005584717]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 11.0, 19.0, 18.0, 24.0, 25.0, 29.0, 39.0, 33.0, 35.0, 47.0, 53.0, 46.0, 51.0, 51.0, 37.0, 49.0, 54.0, 49.0, 48.0, 48.0, 28.0, 36.0, 36.0, 26.0, 16.0, 14.0, 16.0, 19.0, 10.0, 12.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5202762484550476, -0.5027804970741272, -0.48528480529785156, -0.46778908371925354, -0.4502933621406555, -0.4327976405620575, -0.4153019189834595, -0.39780616760253906, -0.3803104758262634, -0.3628147542476654, -0.3453190326690674, -0.32782331109046936, -0.31032758951187134, -0.2928318679332733, -0.2753361463546753, -0.2578403949737549, -0.24034467339515686, -0.22284895181655884, -0.20535323023796082, -0.1878575086593628, -0.17036178708076477, -0.15286606550216675, -0.13537032902240753, -0.11787460744380951, -0.10037888586521149, -0.08288316428661346, -0.06538744270801544, -0.04789171367883682, -0.0303959921002388, -0.012900270521640778, 0.004595458507537842, 0.022091180086135864, 0.03958690166473389, 0.05708262324333191, 0.07457834482192993, 0.09207407385110855, 0.10956979542970657, 0.127065509557724, 0.14456124603748322, 0.16205696761608124, 0.17955268919467926, 0.19704841077327728, 0.2145441323518753, 0.23203986883163452, 0.24953559041023254, 0.26703131198883057, 0.2845270335674286, 0.3020227551460266, 0.31951847672462463, 0.33701419830322266, 0.3545099198818207, 0.3720056414604187, 0.3895013630390167, 0.40699708461761475, 0.42449283599853516, 0.4419885277748108, 0.4594842791557312, 0.4769800007343292, 0.49447572231292725, 0.5119714736938477, 0.5294671654701233, 0.5469629168510437, 0.5644586086273193, 0.5819543600082397, 0.5994500517845154]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 6.0, 10.0, 16.0, 33.0, 52.0, 71.0, 119.0, 346.0, 864.0, 2490.0, 9748.0, 61369.0, 616387.0, 319295.0, 29198.0, 5749.0, 1661.0, 596.0, 236.0, 113.0, 55.0, 41.0, 29.0, 17.0, 14.0, 7.0, 3.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.234130859375, -0.22540283203125, -0.2166748046875, -0.20794677734375, -0.19921875, -0.19049072265625, -0.1817626953125, -0.17303466796875, -0.164306640625, -0.15557861328125, -0.1468505859375, -0.13812255859375, -0.12939453125, -0.12066650390625, -0.1119384765625, -0.10321044921875, -0.094482421875, -0.08575439453125, -0.0770263671875, -0.06829833984375, -0.0595703125, -0.05084228515625, -0.0421142578125, -0.03338623046875, -0.024658203125, -0.01593017578125, -0.0072021484375, 0.00152587890625, 0.01025390625, 0.01898193359375, 0.0277099609375, 0.03643798828125, 0.045166015625, 0.05389404296875, 0.0626220703125, 0.07135009765625, 0.080078125, 0.08880615234375, 0.0975341796875, 0.10626220703125, 0.114990234375, 0.12371826171875, 0.1324462890625, 0.14117431640625, 0.14990234375, 0.15863037109375, 0.1673583984375, 0.17608642578125, 0.184814453125, 0.19354248046875, 0.2022705078125, 0.21099853515625, 0.2197265625, 0.22845458984375, 0.2371826171875, 0.24591064453125, 0.254638671875, 0.26336669921875, 0.2720947265625, 0.28082275390625, 0.28955078125, 0.29827880859375, 0.3070068359375, 0.31573486328125, 0.324462890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 8.0, 14.0, 18.0, 24.0, 50.0, 41.0, 53.0, 64.0, 64.0, 60.0, 80.0, 67.0, 80.0, 63.0, 64.0, 53.0, 44.0, 44.0, 34.0, 24.0, 20.0, 14.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4292869567871094, -0.41350555419921875, -0.3977241516113281, -0.3819427490234375, -0.3661613464355469, -0.35037994384765625, -0.3345985412597656, -0.318817138671875, -0.3030357360839844, -0.28725433349609375, -0.2714729309082031, -0.2556915283203125, -0.23991012573242188, -0.22412872314453125, -0.20834732055664062, -0.19256591796875, -0.17678451538085938, -0.16100311279296875, -0.14522171020507812, -0.1294403076171875, -0.11365890502929688, -0.09787750244140625, -0.08209609985351562, -0.066314697265625, -0.050533294677734375, -0.03475189208984375, -0.018970489501953125, -0.0031890869140625, 0.012592315673828125, 0.02837371826171875, 0.044155120849609375, 0.0599365234375, 0.07571792602539062, 0.09149932861328125, 0.10728073120117188, 0.1230621337890625, 0.13884353637695312, 0.15462493896484375, 0.17040634155273438, 0.186187744140625, 0.20196914672851562, 0.21775054931640625, 0.23353195190429688, 0.2493133544921875, 0.2650947570800781, 0.28087615966796875, 0.2966575622558594, 0.31243896484375, 0.3282203674316406, 0.34400177001953125, 0.3597831726074219, 0.3755645751953125, 0.3913459777832031, 0.40712738037109375, 0.4229087829589844, 0.438690185546875, 0.4544715881347656, 0.47025299072265625, 0.4860343933105469, 0.5018157958984375, 0.5175971984863281, 0.5333786010742188, 0.5491600036621094, 0.56494140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 11.0, 7.0, 18.0, 24.0, 32.0, 50.0, 71.0, 92.0, 121.0, 215.0, 316.0, 539.0, 876.0, 1517.0, 2806.0, 5173.0, 11445.0, 27786.0, 75016.0, 202369.0, 341947.0, 231507.0, 88472.0, 32182.0, 12868.0, 5958.0, 3060.0, 1626.0, 870.0, 548.0, 349.0, 207.0, 131.0, 97.0, 61.0, 64.0, 33.0, 21.0, 16.0, 12.0, 10.0, 3.0, 3.0, 1.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08917236328125, -0.08643531799316406, -0.08369827270507812, -0.08096122741699219, -0.07822418212890625, -0.07548713684082031, -0.07275009155273438, -0.07001304626464844, -0.0672760009765625, -0.06453895568847656, -0.061801910400390625, -0.05906486511230469, -0.05632781982421875, -0.05359077453613281, -0.050853729248046875, -0.04811668395996094, -0.045379638671875, -0.04264259338378906, -0.039905548095703125, -0.03716850280761719, -0.03443145751953125, -0.03169441223144531, -0.028957366943359375, -0.026220321655273438, -0.0234832763671875, -0.020746231079101562, -0.018009185791015625, -0.015272140502929688, -0.01253509521484375, -0.009798049926757812, -0.007061004638671875, -0.0043239593505859375, -0.0015869140625, 0.0011501312255859375, 0.003887176513671875, 0.0066242218017578125, 0.00936126708984375, 0.012098312377929688, 0.014835357666015625, 0.017572402954101562, 0.0203094482421875, 0.023046493530273438, 0.025783538818359375, 0.028520584106445312, 0.03125762939453125, 0.03399467468261719, 0.036731719970703125, 0.03946876525878906, 0.042205810546875, 0.04494285583496094, 0.047679901123046875, 0.05041694641113281, 0.05315399169921875, 0.05589103698730469, 0.058628082275390625, 0.06136512756347656, 0.0641021728515625, 0.06683921813964844, 0.06957626342773438, 0.07231330871582031, 0.07505035400390625, 0.07778739929199219, 0.08052444458007812, 0.08326148986816406, 0.08599853515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 6.0, 11.0, 11.0, 24.0, 13.0, 9.0, 22.0, 28.0, 28.0, 29.0, 31.0, 43.0, 35.0, 44.0, 45.0, 47.0, 55.0, 44.0, 46.0, 36.0, 42.0, 44.0, 34.0, 39.0, 32.0, 25.0, 17.0, 17.0, 16.0, 20.0, 15.0, 13.0, 14.0, 6.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5380859375, -0.5186691284179688, -0.4992523193359375, -0.47983551025390625, -0.460418701171875, -0.44100189208984375, -0.4215850830078125, -0.40216827392578125, -0.38275146484375, -0.36333465576171875, -0.3439178466796875, -0.32450103759765625, -0.305084228515625, -0.28566741943359375, -0.2662506103515625, -0.24683380126953125, -0.2274169921875, -0.20800018310546875, -0.1885833740234375, -0.16916656494140625, -0.149749755859375, -0.13033294677734375, -0.1109161376953125, -0.09149932861328125, -0.07208251953125, -0.05266571044921875, -0.0332489013671875, -0.01383209228515625, 0.005584716796875, 0.02500152587890625, 0.0444183349609375, 0.06383514404296875, 0.083251953125, 0.10266876220703125, 0.1220855712890625, 0.14150238037109375, 0.160919189453125, 0.18033599853515625, 0.1997528076171875, 0.21916961669921875, 0.23858642578125, 0.25800323486328125, 0.2774200439453125, 0.29683685302734375, 0.316253662109375, 0.33567047119140625, 0.3550872802734375, 0.37450408935546875, 0.3939208984375, 0.41333770751953125, 0.4327545166015625, 0.45217132568359375, 0.471588134765625, 0.49100494384765625, 0.5104217529296875, 0.5298385620117188, 0.54925537109375, 0.5686721801757812, 0.5880889892578125, 0.6075057983398438, 0.626922607421875, 0.6463394165039062, 0.6657562255859375, 0.6851730346679688, 0.70458984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 13.0, 17.0, 29.0, 46.0, 57.0, 100.0, 140.0, 225.0, 405.0, 758.0, 1434.0, 2872.0, 6225.0, 15501.0, 46996.0, 189812.0, 516659.0, 192033.0, 47665.0, 15348.0, 6239.0, 2796.0, 1428.0, 711.0, 415.0, 227.0, 147.0, 75.0, 46.0, 41.0, 25.0, 21.0, 15.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0511474609375, -0.04957389831542969, -0.048000335693359375, -0.04642677307128906, -0.04485321044921875, -0.04327964782714844, -0.041706085205078125, -0.04013252258300781, -0.0385589599609375, -0.03698539733886719, -0.035411834716796875, -0.03383827209472656, -0.03226470947265625, -0.030691146850585938, -0.029117584228515625, -0.027544021606445312, -0.025970458984375, -0.024396896362304688, -0.022823333740234375, -0.021249771118164062, -0.01967620849609375, -0.018102645874023438, -0.016529083251953125, -0.014955520629882812, -0.0133819580078125, -0.011808395385742188, -0.010234832763671875, -0.008661270141601562, -0.00708770751953125, -0.0055141448974609375, -0.003940582275390625, -0.0023670196533203125, -0.00079345703125, 0.0007801055908203125, 0.002353668212890625, 0.0039272308349609375, 0.00550079345703125, 0.0070743560791015625, 0.008647918701171875, 0.010221481323242188, 0.0117950439453125, 0.013368606567382812, 0.014942169189453125, 0.016515731811523438, 0.01808929443359375, 0.019662857055664062, 0.021236419677734375, 0.022809982299804688, 0.024383544921875, 0.025957107543945312, 0.027530670166015625, 0.029104232788085938, 0.03067779541015625, 0.03225135803222656, 0.033824920654296875, 0.03539848327636719, 0.0369720458984375, 0.03854560852050781, 0.040119171142578125, 0.04169273376464844, 0.04326629638671875, 0.04483985900878906, 0.046413421630859375, 0.04798698425292969, 0.049560546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 12.0, 18.0, 22.0, 29.0, 36.0, 75.0, 96.0, 98.0, 135.0, 130.0, 114.0, 68.0, 47.0, 46.0, 28.0, 14.0, 13.0, 5.0, 6.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.4992430806159973e-05, -1.418963074684143e-05, -1.3386830687522888e-05, -1.2584030628204346e-05, -1.1781230568885803e-05, -1.097843050956726e-05, -1.0175630450248718e-05, -9.372830390930176e-06, -8.570030331611633e-06, -7.76723027229309e-06, -6.964430212974548e-06, -6.161630153656006e-06, -5.358830094337463e-06, -4.556030035018921e-06, -3.7532299757003784e-06, -2.950429916381836e-06, -2.1476298570632935e-06, -1.344829797744751e-06, -5.420297384262085e-07, 2.60770320892334e-07, 1.0635703802108765e-06, 1.866370439529419e-06, 2.6691704988479614e-06, 3.471970558166504e-06, 4.274770617485046e-06, 5.077570676803589e-06, 5.880370736122131e-06, 6.683170795440674e-06, 7.485970854759216e-06, 8.288770914077759e-06, 9.091570973396301e-06, 9.894371032714844e-06, 1.0697171092033386e-05, 1.1499971151351929e-05, 1.2302771210670471e-05, 1.3105571269989014e-05, 1.3908371329307556e-05, 1.4711171388626099e-05, 1.551397144794464e-05, 1.6316771507263184e-05, 1.7119571566581726e-05, 1.792237162590027e-05, 1.872517168521881e-05, 1.9527971744537354e-05, 2.0330771803855896e-05, 2.113357186317444e-05, 2.193637192249298e-05, 2.2739171981811523e-05, 2.3541972041130066e-05, 2.434477210044861e-05, 2.514757215976715e-05, 2.5950372219085693e-05, 2.6753172278404236e-05, 2.755597233772278e-05, 2.835877239704132e-05, 2.9161572456359863e-05, 2.9964372515678406e-05, 3.076717257499695e-05, 3.156997263431549e-05, 3.237277269363403e-05, 3.3175572752952576e-05, 3.397837281227112e-05, 3.478117287158966e-05, 3.55839729309082e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 7.0, 9.0, 13.0, 10.0, 13.0, 12.0, 22.0, 38.0, 38.0, 60.0, 93.0, 174.0, 262.0, 461.0, 816.0, 1550.0, 3207.0, 6825.0, 16115.0, 42494.0, 141221.0, 434673.0, 277509.0, 76704.0, 26156.0, 10483.0, 4704.0, 2188.0, 1113.0, 590.0, 351.0, 195.0, 139.0, 92.0, 54.0, 40.0, 32.0, 23.0, 24.0, 11.0, 9.0, 5.0, 3.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.044952392578125, -0.0434417724609375, -0.04193115234375, -0.0404205322265625, -0.038909912109375, -0.0373992919921875, -0.035888671875, -0.0343780517578125, -0.032867431640625, -0.0313568115234375, -0.02984619140625, -0.0283355712890625, -0.026824951171875, -0.0253143310546875, -0.0238037109375, -0.0222930908203125, -0.020782470703125, -0.0192718505859375, -0.01776123046875, -0.0162506103515625, -0.014739990234375, -0.0132293701171875, -0.01171875, -0.0102081298828125, -0.008697509765625, -0.0071868896484375, -0.00567626953125, -0.0041656494140625, -0.002655029296875, -0.0011444091796875, 0.0003662109375, 0.0018768310546875, 0.003387451171875, 0.0048980712890625, 0.00640869140625, 0.0079193115234375, 0.009429931640625, 0.0109405517578125, 0.012451171875, 0.0139617919921875, 0.015472412109375, 0.0169830322265625, 0.01849365234375, 0.0200042724609375, 0.021514892578125, 0.0230255126953125, 0.0245361328125, 0.0260467529296875, 0.027557373046875, 0.0290679931640625, 0.03057861328125, 0.0320892333984375, 0.033599853515625, 0.0351104736328125, 0.03662109375, 0.0381317138671875, 0.039642333984375, 0.0411529541015625, 0.04266357421875, 0.0441741943359375, 0.045684814453125, 0.0471954345703125, 0.0487060546875, 0.0502166748046875, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 3.0, 6.0, 5.0, 11.0, 10.0, 11.0, 14.0, 19.0, 19.0, 25.0, 26.0, 43.0, 35.0, 54.0, 62.0, 77.0, 73.0, 79.0, 68.0, 67.0, 54.0, 39.0, 34.0, 31.0, 33.0, 19.0, 15.0, 9.0, 6.0, 6.0, 10.0, 4.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.014862060546875, -0.014423727989196777, -0.013985395431518555, -0.013547062873840332, -0.01310873031616211, -0.012670397758483887, -0.012232065200805664, -0.011793732643127441, -0.011355400085449219, -0.010917067527770996, -0.010478734970092773, -0.01004040241241455, -0.009602069854736328, -0.009163737297058105, -0.008725404739379883, -0.00828707218170166, -0.007848739624023438, -0.007410407066345215, -0.006972074508666992, -0.0065337419509887695, -0.006095409393310547, -0.005657076835632324, -0.0052187442779541016, -0.004780411720275879, -0.004342079162597656, -0.0039037466049194336, -0.003465414047241211, -0.0030270814895629883, -0.0025887489318847656, -0.002150416374206543, -0.0017120838165283203, -0.0012737512588500977, -0.000835418701171875, -0.00039708614349365234, 4.124641418457031e-05, 0.00047957897186279297, 0.0009179115295410156, 0.0013562440872192383, 0.001794576644897461, 0.0022329092025756836, 0.0026712417602539062, 0.003109574317932129, 0.0035479068756103516, 0.003986239433288574, 0.004424571990966797, 0.0048629045486450195, 0.005301237106323242, 0.005739569664001465, 0.0061779022216796875, 0.00661623477935791, 0.007054567337036133, 0.0074928998947143555, 0.007931232452392578, 0.0083695650100708, 0.008807897567749023, 0.009246230125427246, 0.009684562683105469, 0.010122895240783691, 0.010561227798461914, 0.010999560356140137, 0.01143789291381836, 0.011876225471496582, 0.012314558029174805, 0.012752890586853027, 0.01319122314453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 10.0, 37.0, 86.0, 154.0, 216.0, 200.0, 163.0, 82.0, 28.0, 11.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43615466356277466, -0.4026948809623718, -0.369235098361969, -0.33577534556388855, -0.3023155629634857, -0.2688557803630829, -0.23539601266384125, -0.2019362449645996, -0.16847646236419678, -0.13501667976379395, -0.10155691206455231, -0.06809713691473007, -0.03463736176490784, -0.0011775791645050049, 0.03228218853473663, 0.06574195623397827, 0.0992017388343811, 0.13266152143478394, 0.16612128913402557, 0.1995810568332672, 0.23304083943367004, 0.2665006220340729, 0.2999603748321533, 0.33342015743255615, 0.366879940032959, 0.4003397226333618, 0.43379950523376465, 0.4672592580318451, 0.5007190704345703, 0.5341788530349731, 0.5676385760307312, 0.601098358631134, 0.6345582008361816, 0.6680179834365845, 0.7014777660369873, 0.7349375486373901, 0.768397331237793, 0.8018571138381958, 0.8353168368339539, 0.8687766194343567, 0.9022364020347595, 0.9356961846351624, 0.9691559672355652, 1.0026156902313232, 1.036075472831726, 1.069535255432129, 1.1029950380325317, 1.1364548206329346, 1.1699146032333374, 1.2033743858337402, 1.236834168434143, 1.270293951034546, 1.3037537336349487, 1.3372135162353516, 1.3706732988357544, 1.4041330814361572, 1.4375927448272705, 1.4710525274276733, 1.5045123100280762, 1.537972092628479, 1.5714318752288818, 1.6048916578292847, 1.6383514404296875, 1.6718111038208008, 1.7052710056304932]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 5.0, 22.0, 14.0, 30.0, 23.0, 40.0, 54.0, 52.0, 67.0, 57.0, 52.0, 77.0, 58.0, 63.0, 72.0, 60.0, 52.0, 36.0, 43.0, 22.0, 27.0, 21.0, 19.0, 15.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3889988660812378, -0.37512797117233276, -0.36125707626342773, -0.3473861515522003, -0.3335152566432953, -0.31964436173439026, -0.30577343702316284, -0.2919025421142578, -0.2780316472053528, -0.26416075229644775, -0.2502898573875427, -0.2364189326763153, -0.22254803776741028, -0.20867714285850525, -0.19480623304843903, -0.1809353232383728, -0.16706442832946777, -0.15319353342056274, -0.13932262361049652, -0.1254517138004303, -0.11158081889152527, -0.09770991653203964, -0.08383901417255402, -0.06996811181306839, -0.056097209453582764, -0.04222630709409714, -0.02835540473461151, -0.014484502375125885, -0.0006136000156402588, 0.013257302343845367, 0.027128204703330994, 0.04099910706281662, 0.054870039224624634, 0.06874094158411026, 0.08261184394359589, 0.09648274630308151, 0.11035364866256714, 0.12422455102205276, 0.1380954533815384, 0.15196636319160461, 0.16583725810050964, 0.17970815300941467, 0.1935790628194809, 0.20744997262954712, 0.22132086753845215, 0.23519176244735718, 0.2490626722574234, 0.2629335820674896, 0.27680447697639465, 0.2906753718852997, 0.3045462965965271, 0.31841719150543213, 0.33228808641433716, 0.3461589813232422, 0.3600298762321472, 0.37390080094337463, 0.38777169585227966, 0.4016425907611847, 0.4155135154724121, 0.42938441038131714, 0.44325530529022217, 0.4571262001991272, 0.4709970951080322, 0.48486801981925964, 0.4987389147281647]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 3.0, 5.0, 15.0, 35.0, 55.0, 78.0, 145.0, 334.0, 688.0, 1878.0, 6908.0, 31050.0, 316658.0, 629655.0, 47466.0, 9519.0, 2507.0, 856.0, 348.0, 154.0, 90.0, 53.0, 28.0, 9.0, 3.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4366493225097656, -0.41992950439453125, -0.4032096862792969, -0.3864898681640625, -0.3697700500488281, -0.35305023193359375, -0.3363304138183594, -0.319610595703125, -0.3028907775878906, -0.28617095947265625, -0.2694511413574219, -0.2527313232421875, -0.23601150512695312, -0.21929168701171875, -0.20257186889648438, -0.18585205078125, -0.16913223266601562, -0.15241241455078125, -0.13569259643554688, -0.1189727783203125, -0.10225296020507812, -0.08553314208984375, -0.06881332397460938, -0.052093505859375, -0.035373687744140625, -0.01865386962890625, -0.001934051513671875, 0.0147857666015625, 0.031505584716796875, 0.04822540283203125, 0.06494522094726562, 0.0816650390625, 0.09838485717773438, 0.11510467529296875, 0.13182449340820312, 0.1485443115234375, 0.16526412963867188, 0.18198394775390625, 0.19870376586914062, 0.215423583984375, 0.23214340209960938, 0.24886322021484375, 0.2655830383300781, 0.2823028564453125, 0.2990226745605469, 0.31574249267578125, 0.3324623107910156, 0.34918212890625, 0.3659019470214844, 0.38262176513671875, 0.3993415832519531, 0.4160614013671875, 0.4327812194824219, 0.44950103759765625, 0.4662208557128906, 0.482940673828125, 0.4996604919433594, 0.5163803100585938, 0.5331001281738281, 0.5498199462890625, 0.5665397644042969, 0.5832595825195312, 0.5999794006347656, 0.61669921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 19.0, 16.0, 27.0, 35.0, 61.0, 70.0, 69.0, 82.0, 77.0, 97.0, 100.0, 94.0, 69.0, 51.0, 39.0, 29.0, 25.0, 26.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.4894027709960938, -1.4514617919921875, -1.4135208129882812, -1.375579833984375, -1.3376388549804688, -1.2996978759765625, -1.2617568969726562, -1.22381591796875, -1.1858749389648438, -1.1479339599609375, -1.1099929809570312, -1.072052001953125, -1.0341110229492188, -0.9961700439453125, -0.9582290649414062, -0.9202880859375, -0.8823471069335938, -0.8444061279296875, -0.8064651489257812, -0.768524169921875, -0.7305831909179688, -0.6926422119140625, -0.6547012329101562, -0.61676025390625, -0.5788192749023438, -0.5408782958984375, -0.5029373168945312, -0.464996337890625, -0.42705535888671875, -0.3891143798828125, -0.35117340087890625, -0.313232421875, -0.27529144287109375, -0.2373504638671875, -0.19940948486328125, -0.161468505859375, -0.12352752685546875, -0.0855865478515625, -0.04764556884765625, -0.00970458984375, 0.02823638916015625, 0.0661773681640625, 0.10411834716796875, 0.142059326171875, 0.18000030517578125, 0.2179412841796875, 0.25588226318359375, 0.2938232421875, 0.33176422119140625, 0.3697052001953125, 0.40764617919921875, 0.445587158203125, 0.48352813720703125, 0.5214691162109375, 0.5594100952148438, 0.59735107421875, 0.6352920532226562, 0.6732330322265625, 0.7111740112304688, 0.749114990234375, 0.7870559692382812, 0.8249969482421875, 0.8629379272460938, 0.90087890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 4.0, 4.0, 7.0, 8.0, 15.0, 17.0, 14.0, 42.0, 43.0, 62.0, 93.0, 181.0, 312.0, 1123.0, 10052.0, 899909.0, 131770.0, 3522.0, 676.0, 252.0, 124.0, 78.0, 51.0, 35.0, 38.0, 25.0, 12.0, 15.0, 16.0, 14.0, 6.0, 5.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.3684539794921875, -1.326751708984375, -1.2850494384765625, -1.24334716796875, -1.2016448974609375, -1.159942626953125, -1.1182403564453125, -1.0765380859375, -1.0348358154296875, -0.993133544921875, -0.9514312744140625, -0.90972900390625, -0.8680267333984375, -0.826324462890625, -0.7846221923828125, -0.742919921875, -0.7012176513671875, -0.659515380859375, -0.6178131103515625, -0.57611083984375, -0.5344085693359375, -0.492706298828125, -0.4510040283203125, -0.4093017578125, -0.3675994873046875, -0.325897216796875, -0.2841949462890625, -0.24249267578125, -0.2007904052734375, -0.159088134765625, -0.1173858642578125, -0.07568359375, -0.0339813232421875, 0.007720947265625, 0.0494232177734375, 0.09112548828125, 0.1328277587890625, 0.174530029296875, 0.2162322998046875, 0.2579345703125, 0.2996368408203125, 0.341339111328125, 0.3830413818359375, 0.42474365234375, 0.4664459228515625, 0.508148193359375, 0.5498504638671875, 0.591552734375, 0.6332550048828125, 0.674957275390625, 0.7166595458984375, 0.75836181640625, 0.8000640869140625, 0.841766357421875, 0.8834686279296875, 0.9251708984375, 0.9668731689453125, 1.008575439453125, 1.0502777099609375, 1.09197998046875, 1.1336822509765625, 1.175384521484375, 1.2170867919921875, 1.2587890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 10.0, 19.0, 12.0, 20.0, 25.0, 17.0, 32.0, 35.0, 30.0, 39.0, 44.0, 53.0, 62.0, 55.0, 43.0, 49.0, 48.0, 48.0, 35.0, 53.0, 35.0, 30.0, 29.0, 23.0, 28.0, 14.0, 9.0, 12.0, 7.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.8291015625, -0.8031463623046875, -0.777191162109375, -0.7512359619140625, -0.72528076171875, -0.6993255615234375, -0.673370361328125, -0.6474151611328125, -0.6214599609375, -0.5955047607421875, -0.569549560546875, -0.5435943603515625, -0.51763916015625, -0.4916839599609375, -0.465728759765625, -0.4397735595703125, -0.413818359375, -0.3878631591796875, -0.361907958984375, -0.3359527587890625, -0.30999755859375, -0.2840423583984375, -0.258087158203125, -0.2321319580078125, -0.2061767578125, -0.1802215576171875, -0.154266357421875, -0.1283111572265625, -0.10235595703125, -0.0764007568359375, -0.050445556640625, -0.0244903564453125, 0.00146484375, 0.0274200439453125, 0.053375244140625, 0.0793304443359375, 0.10528564453125, 0.1312408447265625, 0.157196044921875, 0.1831512451171875, 0.2091064453125, 0.2350616455078125, 0.261016845703125, 0.2869720458984375, 0.31292724609375, 0.3388824462890625, 0.364837646484375, 0.3907928466796875, 0.416748046875, 0.4427032470703125, 0.468658447265625, 0.4946136474609375, 0.52056884765625, 0.5465240478515625, 0.572479248046875, 0.5984344482421875, 0.6243896484375, 0.6503448486328125, 0.676300048828125, 0.7022552490234375, 0.72821044921875, 0.7541656494140625, 0.780120849609375, 0.8060760498046875, 0.83203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 14.0, 25.0, 25.0, 35.0, 86.0, 153.0, 352.0, 874.0, 3310.0, 20566.0, 450171.0, 546167.0, 21816.0, 3356.0, 937.0, 346.0, 135.0, 62.0, 35.0, 23.0, 8.0, 7.0, 4.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16264915466308594, -0.15452194213867188, -0.1463947296142578, -0.13826751708984375, -0.1301403045654297, -0.12201309204101562, -0.11388587951660156, -0.1057586669921875, -0.09763145446777344, -0.08950424194335938, -0.08137702941894531, -0.07324981689453125, -0.06512260437011719, -0.056995391845703125, -0.04886817932128906, -0.040740966796875, -0.03261375427246094, -0.024486541748046875, -0.016359329223632812, -0.00823211669921875, -0.0001049041748046875, 0.008022308349609375, 0.016149520874023438, 0.0242767333984375, 0.03240394592285156, 0.040531158447265625, 0.04865837097167969, 0.05678558349609375, 0.06491279602050781, 0.07304000854492188, 0.08116722106933594, 0.08929443359375, 0.09742164611816406, 0.10554885864257812, 0.11367607116699219, 0.12180328369140625, 0.1299304962158203, 0.13805770874023438, 0.14618492126464844, 0.1543121337890625, 0.16243934631347656, 0.17056655883789062, 0.1786937713623047, 0.18682098388671875, 0.1949481964111328, 0.20307540893554688, 0.21120262145996094, 0.219329833984375, 0.22745704650878906, 0.23558425903320312, 0.2437114715576172, 0.25183868408203125, 0.2599658966064453, 0.2680931091308594, 0.27622032165527344, 0.2843475341796875, 0.29247474670410156, 0.3006019592285156, 0.3087291717529297, 0.31685638427734375, 0.3249835968017578, 0.3331108093261719, 0.34123802185058594, 0.349365234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 6.0, 13.0, 16.0, 17.0, 31.0, 56.0, 77.0, 87.0, 171.0, 179.0, 106.0, 79.0, 45.0, 29.0, 28.0, 18.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.085324376821518e-05, -1.995079219341278e-05, -1.9048340618610382e-05, -1.8145889043807983e-05, -1.7243437469005585e-05, -1.6340985894203186e-05, -1.5438534319400787e-05, -1.4536082744598389e-05, -1.363363116979599e-05, -1.2731179594993591e-05, -1.1828728020191193e-05, -1.0926276445388794e-05, -1.0023824870586395e-05, -9.121373295783997e-06, -8.218921720981598e-06, -7.316470146179199e-06, -6.4140185713768005e-06, -5.511566996574402e-06, -4.609115421772003e-06, -3.7066638469696045e-06, -2.804212272167206e-06, -1.9017606973648071e-06, -9.993091225624084e-07, -9.685754776000977e-08, 8.055940270423889e-07, 1.7080456018447876e-06, 2.6104971766471863e-06, 3.512948751449585e-06, 4.415400326251984e-06, 5.317851901054382e-06, 6.220303475856781e-06, 7.12275505065918e-06, 8.025206625461578e-06, 8.927658200263977e-06, 9.830109775066376e-06, 1.0732561349868774e-05, 1.1635012924671173e-05, 1.2537464499473572e-05, 1.343991607427597e-05, 1.4342367649078369e-05, 1.5244819223880768e-05, 1.6147270798683167e-05, 1.7049722373485565e-05, 1.7952173948287964e-05, 1.8854625523090363e-05, 1.975707709789276e-05, 2.065952867269516e-05, 2.156198024749756e-05, 2.2464431822299957e-05, 2.3366883397102356e-05, 2.4269334971904755e-05, 2.5171786546707153e-05, 2.6074238121509552e-05, 2.697668969631195e-05, 2.787914127111435e-05, 2.8781592845916748e-05, 2.9684044420719147e-05, 3.0586495995521545e-05, 3.1488947570323944e-05, 3.239139914512634e-05, 3.329385071992874e-05, 3.419630229473114e-05, 3.509875386953354e-05, 3.600120544433594e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 20.0, 52.0, 101.0, 247.0, 837.0, 3741.0, 46978.0, 948958.0, 42742.0, 3603.0, 780.0, 274.0, 92.0, 48.0, 26.0, 15.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5637130737304688, -0.5497894287109375, -0.5358657836914062, -0.521942138671875, -0.5080184936523438, -0.4940948486328125, -0.48017120361328125, -0.46624755859375, -0.45232391357421875, -0.4384002685546875, -0.42447662353515625, -0.410552978515625, -0.39662933349609375, -0.3827056884765625, -0.36878204345703125, -0.3548583984375, -0.34093475341796875, -0.3270111083984375, -0.31308746337890625, -0.299163818359375, -0.28524017333984375, -0.2713165283203125, -0.25739288330078125, -0.24346923828125, -0.22954559326171875, -0.2156219482421875, -0.20169830322265625, -0.187774658203125, -0.17385101318359375, -0.1599273681640625, -0.14600372314453125, -0.132080078125, -0.11815643310546875, -0.1042327880859375, -0.09030914306640625, -0.076385498046875, -0.06246185302734375, -0.0485382080078125, -0.03461456298828125, -0.02069091796875, -0.00676727294921875, 0.0071563720703125, 0.02108001708984375, 0.035003662109375, 0.04892730712890625, 0.0628509521484375, 0.07677459716796875, 0.0906982421875, 0.10462188720703125, 0.1185455322265625, 0.13246917724609375, 0.146392822265625, 0.16031646728515625, 0.1742401123046875, 0.18816375732421875, 0.20208740234375, 0.21601104736328125, 0.2299346923828125, 0.24385833740234375, 0.257781982421875, 0.27170562744140625, 0.2856292724609375, 0.29955291748046875, 0.3134765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 13.0, 20.0, 31.0, 46.0, 53.0, 82.0, 102.0, 201.0, 116.0, 91.0, 68.0, 27.0, 27.0, 29.0, 16.0, 12.0, 9.0, 9.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07830810546875, -0.0755777359008789, -0.07284736633300781, -0.07011699676513672, -0.06738662719726562, -0.06465625762939453, -0.06192588806152344, -0.059195518493652344, -0.05646514892578125, -0.053734779357910156, -0.05100440979003906, -0.04827404022216797, -0.045543670654296875, -0.04281330108642578, -0.04008293151855469, -0.037352561950683594, -0.0346221923828125, -0.031891822814941406, -0.029161453247070312, -0.02643108367919922, -0.023700714111328125, -0.02097034454345703, -0.018239974975585938, -0.015509605407714844, -0.01277923583984375, -0.010048866271972656, -0.0073184967041015625, -0.004588127136230469, -0.001857757568359375, 0.0008726119995117188, 0.0036029815673828125, 0.006333351135253906, 0.009063720703125, 0.011794090270996094, 0.014524459838867188, 0.01725482940673828, 0.019985198974609375, 0.02271556854248047, 0.025445938110351562, 0.028176307678222656, 0.03090667724609375, 0.033637046813964844, 0.03636741638183594, 0.03909778594970703, 0.041828155517578125, 0.04455852508544922, 0.04728889465332031, 0.050019264221191406, 0.0527496337890625, 0.055480003356933594, 0.05821037292480469, 0.06094074249267578, 0.06367111206054688, 0.06640148162841797, 0.06913185119628906, 0.07186222076416016, 0.07459259033203125, 0.07732295989990234, 0.08005332946777344, 0.08278369903564453, 0.08551406860351562, 0.08824443817138672, 0.09097480773925781, 0.0937051773071289, 0.096435546875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 16.0, 36.0, 87.0, 192.0, 248.0, 220.0, 128.0, 54.0, 17.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6503353118896484, -2.5693631172180176, -2.488391160964966, -2.407418966293335, -2.326446771621704, -2.2454748153686523, -2.1645026206970215, -2.0835304260253906, -2.0025582313537598, -1.9215861558914185, -1.8406139612197876, -1.7596418857574463, -1.6786696910858154, -1.5976976156234741, -1.5167255401611328, -1.435753345489502, -1.3547813892364502, -1.2738093137741089, -1.192837119102478, -1.1118650436401367, -1.0308928489685059, -0.9499207735061646, -0.8689486980438232, -0.7879765629768372, -0.7070044279098511, -0.626032292842865, -0.5450601577758789, -0.4640880823135376, -0.3831159472465515, -0.30214381217956543, -0.22117170691490173, -0.14019960165023804, -0.05922746658325195, 0.021744653582572937, 0.10271677374839783, 0.18368889391422272, 0.2646610140800476, 0.3456331491470337, 0.4266052544116974, 0.5075773596763611, 0.5885494947433472, 0.6695216298103333, 0.7504937648773193, 0.8314658403396606, 0.9124379754066467, 0.9934101104736328, 1.0743821859359741, 1.1553542613983154, 1.2363264560699463, 1.3172985315322876, 1.3982707262039185, 1.4792428016662598, 1.5602149963378906, 1.641187071800232, 1.7221591472625732, 1.803131341934204, 1.8841034173965454, 1.9650754928588867, 2.0460476875305176, 2.1270198822021484, 2.2079918384552, 2.288964033126831, 2.369936227798462, 2.4509081840515137, 2.5318803787231445]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 11.0, 11.0, 10.0, 16.0, 22.0, 25.0, 36.0, 42.0, 51.0, 45.0, 48.0, 66.0, 57.0, 57.0, 54.0, 49.0, 46.0, 43.0, 38.0, 40.0, 35.0, 24.0, 24.0, 28.0, 34.0, 16.0, 21.0, 12.0, 12.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3284894227981567, -1.2798914909362793, -1.2312935590744019, -1.1826956272125244, -1.1340975761413574, -1.08549964427948, -1.0369017124176025, -0.9883037805557251, -0.9397058486938477, -0.8911079168319702, -0.8425099849700928, -0.7939119935035706, -0.7453140616416931, -0.6967161297798157, -0.6481181383132935, -0.599520206451416, -0.5509222745895386, -0.5023243427276611, -0.4537263810634613, -0.4051284193992615, -0.35653048753738403, -0.3079325556755066, -0.25933459401130676, -0.21073663234710693, -0.1621387004852295, -0.11354075372219086, -0.06494280695915222, -0.016344860196113586, 0.03225308656692505, 0.08085103332996368, 0.12944898009300232, 0.17804694175720215, 0.2266448736190796, 0.27524280548095703, 0.32384076714515686, 0.3724387288093567, 0.42103666067123413, 0.4696345925331116, 0.5182325839996338, 0.5668305158615112, 0.6154284477233887, 0.6640263795852661, 0.7126243114471436, 0.7612223029136658, 0.8098202347755432, 0.8584181666374207, 0.9070161581039429, 0.9556140899658203, 1.0042120218276978, 1.0528099536895752, 1.1014078855514526, 1.15000581741333, 1.198603868484497, 1.2472018003463745, 1.295799732208252, 1.3443976640701294, 1.3929955959320068, 1.4415935277938843, 1.4901914596557617, 1.5387893915176392, 1.5873873233795166, 1.6359853744506836, 1.684583306312561, 1.7331812381744385, 1.781779170036316]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 9.0, 13.0, 17.0, 11.0, 18.0, 23.0, 26.0, 35.0, 40.0, 43.0, 72.0, 116.0, 348.0, 1419.0, 11717.0, 474999.0, 3629524.0, 69854.0, 4497.0, 874.0, 220.0, 75.0, 61.0, 45.0, 33.0, 31.0, 31.0, 12.0, 18.0, 17.0, 15.0, 12.0, 8.0, 6.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4208984375, -1.3740081787109375, -1.327117919921875, -1.2802276611328125, -1.23333740234375, -1.1864471435546875, -1.139556884765625, -1.0926666259765625, -1.0457763671875, -0.9988861083984375, -0.951995849609375, -0.9051055908203125, -0.85821533203125, -0.8113250732421875, -0.764434814453125, -0.7175445556640625, -0.670654296875, -0.6237640380859375, -0.576873779296875, -0.5299835205078125, -0.48309326171875, -0.4362030029296875, -0.389312744140625, -0.3424224853515625, -0.2955322265625, -0.2486419677734375, -0.201751708984375, -0.1548614501953125, -0.10797119140625, -0.0610809326171875, -0.014190673828125, 0.0326995849609375, 0.07958984375, 0.1264801025390625, 0.173370361328125, 0.2202606201171875, 0.26715087890625, 0.3140411376953125, 0.360931396484375, 0.4078216552734375, 0.4547119140625, 0.5016021728515625, 0.548492431640625, 0.5953826904296875, 0.64227294921875, 0.6891632080078125, 0.736053466796875, 0.7829437255859375, 0.829833984375, 0.8767242431640625, 0.923614501953125, 0.9705047607421875, 1.01739501953125, 1.0642852783203125, 1.111175537109375, 1.1580657958984375, 1.2049560546875, 1.2518463134765625, 1.298736572265625, 1.3456268310546875, 1.39251708984375, 1.4394073486328125, 1.486297607421875, 1.5331878662109375, 1.580078125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 14.0, 20.0, 16.0, 28.0, 31.0, 44.0, 40.0, 56.0, 56.0, 66.0, 55.0, 58.0, 57.0, 55.0, 46.0, 48.0, 44.0, 51.0, 36.0, 36.0, 26.0, 19.0, 21.0, 16.0, 9.0, 9.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.40764617919921875, -0.3919525146484375, -0.37625885009765625, -0.360565185546875, -0.34487152099609375, -0.3291778564453125, -0.31348419189453125, -0.29779052734375, -0.28209686279296875, -0.2664031982421875, -0.25070953369140625, -0.235015869140625, -0.21932220458984375, -0.2036285400390625, -0.18793487548828125, -0.1722412109375, -0.15654754638671875, -0.1408538818359375, -0.12516021728515625, -0.109466552734375, -0.09377288818359375, -0.0780792236328125, -0.06238555908203125, -0.04669189453125, -0.03099822998046875, -0.0153045654296875, 0.00038909912109375, 0.016082763671875, 0.03177642822265625, 0.0474700927734375, 0.06316375732421875, 0.078857421875, 0.09455108642578125, 0.1102447509765625, 0.12593841552734375, 0.141632080078125, 0.15732574462890625, 0.1730194091796875, 0.18871307373046875, 0.20440673828125, 0.22010040283203125, 0.2357940673828125, 0.25148773193359375, 0.267181396484375, 0.28287506103515625, 0.2985687255859375, 0.31426239013671875, 0.3299560546875, 0.34564971923828125, 0.3613433837890625, 0.37703704833984375, 0.392730712890625, 0.40842437744140625, 0.4241180419921875, 0.43981170654296875, 0.45550537109375, 0.47119903564453125, 0.4868927001953125, 0.5025863647460938, 0.518280029296875, 0.5339736938476562, 0.5496673583984375, 0.5653610229492188, 0.5810546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 20.0, 32.0, 71.0, 107.0, 293.0, 778.0, 3733.0, 58774.0, 3950195.0, 172269.0, 6246.0, 1070.0, 362.0, 148.0, 82.0, 35.0, 13.0, 14.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.259765625, -2.2112960815429688, -2.1628265380859375, -2.1143569946289062, -2.065887451171875, -2.0174179077148438, -1.9689483642578125, -1.9204788208007812, -1.87200927734375, -1.8235397338867188, -1.7750701904296875, -1.7266006469726562, -1.678131103515625, -1.6296615600585938, -1.5811920166015625, -1.5327224731445312, -1.4842529296875, -1.4357833862304688, -1.3873138427734375, -1.3388442993164062, -1.290374755859375, -1.2419052124023438, -1.1934356689453125, -1.1449661254882812, -1.09649658203125, -1.0480270385742188, -0.9995574951171875, -0.9510879516601562, -0.902618408203125, -0.8541488647460938, -0.8056793212890625, -0.7572097778320312, -0.708740234375, -0.6602706909179688, -0.6118011474609375, -0.5633316040039062, -0.514862060546875, -0.46639251708984375, -0.4179229736328125, -0.36945343017578125, -0.32098388671875, -0.27251434326171875, -0.2240447998046875, -0.17557525634765625, -0.127105712890625, -0.07863616943359375, -0.0301666259765625, 0.01830291748046875, 0.0667724609375, 0.11524200439453125, 0.1637115478515625, 0.21218109130859375, 0.260650634765625, 0.30912017822265625, 0.3575897216796875, 0.40605926513671875, 0.45452880859375, 0.5029983520507812, 0.5514678955078125, 0.5999374389648438, 0.648406982421875, 0.6968765258789062, 0.7453460693359375, 0.7938156127929688, 0.84228515625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 9.0, 14.0, 15.0, 23.0, 36.0, 54.0, 77.0, 107.0, 161.0, 280.0, 408.0, 547.0, 602.0, 533.0, 409.0, 270.0, 158.0, 113.0, 76.0, 46.0, 30.0, 15.0, 26.0, 6.0, 7.0, 7.0, 12.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1746826171875, -0.16834259033203125, -0.1620025634765625, -0.15566253662109375, -0.149322509765625, -0.14298248291015625, -0.1366424560546875, -0.13030242919921875, -0.12396240234375, -0.11762237548828125, -0.1112823486328125, -0.10494232177734375, -0.098602294921875, -0.09226226806640625, -0.0859222412109375, -0.07958221435546875, -0.0732421875, -0.06690216064453125, -0.0605621337890625, -0.05422210693359375, -0.047882080078125, -0.04154205322265625, -0.0352020263671875, -0.02886199951171875, -0.02252197265625, -0.01618194580078125, -0.0098419189453125, -0.00350189208984375, 0.002838134765625, 0.00917816162109375, 0.0155181884765625, 0.02185821533203125, 0.0281982421875, 0.03453826904296875, 0.0408782958984375, 0.04721832275390625, 0.053558349609375, 0.05989837646484375, 0.0662384033203125, 0.07257843017578125, 0.07891845703125, 0.08525848388671875, 0.0915985107421875, 0.09793853759765625, 0.104278564453125, 0.11061859130859375, 0.1169586181640625, 0.12329864501953125, 0.129638671875, 0.13597869873046875, 0.1423187255859375, 0.14865875244140625, 0.154998779296875, 0.16133880615234375, 0.1676788330078125, 0.17401885986328125, 0.18035888671875, 0.18669891357421875, 0.1930389404296875, 0.19937896728515625, 0.205718994140625, 0.21205902099609375, 0.2183990478515625, 0.22473907470703125, 0.2310791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 16.0, 22.0, 58.0, 74.0, 110.0, 159.0, 157.0, 140.0, 91.0, 69.0, 38.0, 31.0, 10.0, 11.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8599148392677307, -0.8247542381286621, -0.7895936965942383, -0.7544330954551697, -0.7192724943161011, -0.6841118931770325, -0.6489512920379639, -0.61379075050354, -0.5786301493644714, -0.5434695482254028, -0.508309006690979, -0.4731484055519104, -0.4379878044128418, -0.4028272032737732, -0.367666631937027, -0.33250606060028076, -0.29734545946121216, -0.26218485832214355, -0.22702428698539734, -0.19186370074748993, -0.15670311450958252, -0.12154252827167511, -0.0863819420337677, -0.05122135579586029, -0.01606076955795288, 0.01909981667995453, 0.05426040291786194, 0.08942098915576935, 0.12458157539367676, 0.15974216163158417, 0.19490274786949158, 0.230063334107399, 0.2652238607406616, 0.3003844618797302, 0.33554503321647644, 0.37070560455322266, 0.40586620569229126, 0.44102680683135986, 0.4761873781681061, 0.5113479495048523, 0.5465085506439209, 0.5816691517829895, 0.6168297529220581, 0.6519902944564819, 0.6871508955955505, 0.7223114967346191, 0.757472038269043, 0.7926326394081116, 0.8277932405471802, 0.8629538416862488, 0.8981144428253174, 0.9332749843597412, 0.9684355854988098, 1.0035961866378784, 1.0387567281723022, 1.0739173889160156, 1.1090779304504395, 1.1442384719848633, 1.1793991327285767, 1.2145596742630005, 1.2497203350067139, 1.2848808765411377, 1.3200414180755615, 1.355202078819275, 1.3903626203536987]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 9.0, 14.0, 16.0, 18.0, 32.0, 32.0, 39.0, 36.0, 42.0, 48.0, 65.0, 57.0, 49.0, 53.0, 58.0, 46.0, 44.0, 46.0, 44.0, 36.0, 38.0, 39.0, 23.0, 23.0, 22.0, 17.0, 10.0, 13.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43637028336524963, -0.41948458552360535, -0.40259885787963867, -0.3857131600379944, -0.3688274323940277, -0.3519417345523834, -0.33505600690841675, -0.31817030906677246, -0.3012846112251282, -0.2843989133834839, -0.2675131857395172, -0.2506274878978729, -0.23374176025390625, -0.21685606241226196, -0.19997034966945648, -0.183084636926651, -0.16619890928268433, -0.14931319653987885, -0.13242748379707336, -0.11554177850484848, -0.098656065762043, -0.08177035301923752, -0.06488464772701263, -0.04799893498420715, -0.031113222241401672, -0.01422751136124134, 0.002658199518918991, 0.019543908536434174, 0.036429621279239655, 0.053315334022045135, 0.07020103931427002, 0.0870867520570755, 0.1039724349975586, 0.12085814774036407, 0.13774386048316956, 0.15462955832481384, 0.17151528596878052, 0.1884009838104248, 0.20528669655323029, 0.22217240929603577, 0.23905812203884125, 0.25594383478164673, 0.272829532623291, 0.2897152602672577, 0.306600958108902, 0.32348668575286865, 0.34037238359451294, 0.3572580814361572, 0.3741438090801239, 0.3910295069217682, 0.40791523456573486, 0.42480093240737915, 0.4416866600513458, 0.4585723578929901, 0.4754580855369568, 0.4923437833786011, 0.5092294812202454, 0.5261151790618896, 0.5430008769035339, 0.559886634349823, 0.5767723321914673, 0.5936580300331116, 0.6105437278747559, 0.6274294853210449, 0.6443151831626892]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 13.0, 18.0, 17.0, 40.0, 71.0, 94.0, 188.0, 392.0, 842.0, 2014.0, 5451.0, 17475.0, 107756.0, 681764.0, 195419.0, 25323.0, 6970.0, 2578.0, 1057.0, 494.0, 251.0, 131.0, 73.0, 39.0, 29.0, 12.0, 10.0, 10.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2318115234375, -0.22310447692871094, -0.21439743041992188, -0.2056903839111328, -0.19698333740234375, -0.1882762908935547, -0.17956924438476562, -0.17086219787597656, -0.1621551513671875, -0.15344810485839844, -0.14474105834960938, -0.1360340118408203, -0.12732696533203125, -0.11861991882324219, -0.10991287231445312, -0.10120582580566406, -0.092498779296875, -0.08379173278808594, -0.07508468627929688, -0.06637763977050781, -0.05767059326171875, -0.04896354675292969, -0.040256500244140625, -0.03154945373535156, -0.0228424072265625, -0.014135360717773438, -0.005428314208984375, 0.0032787322998046875, 0.01198577880859375, 0.020692825317382812, 0.029399871826171875, 0.03810691833496094, 0.04681396484375, 0.05552101135253906, 0.06422805786132812, 0.07293510437011719, 0.08164215087890625, 0.09034919738769531, 0.09905624389648438, 0.10776329040527344, 0.1164703369140625, 0.12517738342285156, 0.13388442993164062, 0.1425914764404297, 0.15129852294921875, 0.1600055694580078, 0.16871261596679688, 0.17741966247558594, 0.186126708984375, 0.19483375549316406, 0.20354080200195312, 0.2122478485107422, 0.22095489501953125, 0.2296619415283203, 0.23836898803710938, 0.24707603454589844, 0.2557830810546875, 0.26449012756347656, 0.2731971740722656, 0.2819042205810547, 0.29061126708984375, 0.2993183135986328, 0.3080253601074219, 0.31673240661621094, 0.325439453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 8.0, 22.0, 12.0, 18.0, 38.0, 43.0, 38.0, 39.0, 58.0, 55.0, 64.0, 57.0, 61.0, 62.0, 55.0, 48.0, 65.0, 42.0, 52.0, 28.0, 23.0, 27.0, 26.0, 13.0, 16.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2839698791503906, -0.27082061767578125, -0.2576713562011719, -0.2445220947265625, -0.23137283325195312, -0.21822357177734375, -0.20507431030273438, -0.191925048828125, -0.17877578735351562, -0.16562652587890625, -0.15247726440429688, -0.1393280029296875, -0.12617874145507812, -0.11302947998046875, -0.09988021850585938, -0.08673095703125, -0.07358169555664062, -0.06043243408203125, -0.047283172607421875, -0.0341339111328125, -0.020984649658203125, -0.00783538818359375, 0.005313873291015625, 0.018463134765625, 0.031612396240234375, 0.04476165771484375, 0.057910919189453125, 0.0710601806640625, 0.08420944213867188, 0.09735870361328125, 0.11050796508789062, 0.1236572265625, 0.13680648803710938, 0.14995574951171875, 0.16310501098632812, 0.1762542724609375, 0.18940353393554688, 0.20255279541015625, 0.21570205688476562, 0.228851318359375, 0.24200057983398438, 0.25514984130859375, 0.2682991027832031, 0.2814483642578125, 0.2945976257324219, 0.30774688720703125, 0.3208961486816406, 0.33404541015625, 0.3471946716308594, 0.36034393310546875, 0.3734931945800781, 0.3866424560546875, 0.3997917175292969, 0.41294097900390625, 0.4260902404785156, 0.439239501953125, 0.4523887634277344, 0.46553802490234375, 0.4786872863769531, 0.4918365478515625, 0.5049858093261719, 0.5181350708007812, 0.5312843322753906, 0.54443359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 10.0, 10.0, 10.0, 5.0, 20.0, 24.0, 31.0, 45.0, 67.0, 119.0, 165.0, 314.0, 547.0, 1001.0, 1662.0, 3409.0, 7236.0, 19633.0, 69769.0, 291354.0, 448287.0, 146680.0, 36030.0, 11714.0, 4779.0, 2423.0, 1352.0, 737.0, 425.0, 241.0, 138.0, 101.0, 68.0, 51.0, 22.0, 16.0, 14.0, 11.0, 9.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13588905334472656, -0.13139724731445312, -0.1269054412841797, -0.12241363525390625, -0.11792182922363281, -0.11343002319335938, -0.10893821716308594, -0.1044464111328125, -0.09995460510253906, -0.09546279907226562, -0.09097099304199219, -0.08647918701171875, -0.08198738098144531, -0.07749557495117188, -0.07300376892089844, -0.068511962890625, -0.06402015686035156, -0.059528350830078125, -0.05503654479980469, -0.05054473876953125, -0.04605293273925781, -0.041561126708984375, -0.03706932067871094, -0.0325775146484375, -0.028085708618164062, -0.023593902587890625, -0.019102096557617188, -0.01461029052734375, -0.010118484497070312, -0.005626678466796875, -0.0011348724365234375, 0.00335693359375, 0.007848739624023438, 0.012340545654296875, 0.016832351684570312, 0.02132415771484375, 0.025815963745117188, 0.030307769775390625, 0.03479957580566406, 0.0392913818359375, 0.04378318786621094, 0.048274993896484375, 0.05276679992675781, 0.05725860595703125, 0.06175041198730469, 0.06624221801757812, 0.07073402404785156, 0.075225830078125, 0.07971763610839844, 0.08420944213867188, 0.08870124816894531, 0.09319305419921875, 0.09768486022949219, 0.10217666625976562, 0.10666847229003906, 0.1111602783203125, 0.11565208435058594, 0.12014389038085938, 0.12463569641113281, 0.12912750244140625, 0.1336193084716797, 0.13811111450195312, 0.14260292053222656, 0.1470947265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 9.0, 9.0, 8.0, 19.0, 16.0, 14.0, 31.0, 28.0, 34.0, 30.0, 32.0, 43.0, 42.0, 56.0, 47.0, 60.0, 49.0, 48.0, 43.0, 28.0, 40.0, 30.0, 45.0, 37.0, 26.0, 17.0, 23.0, 20.0, 14.0, 14.0, 14.0, 9.0, 9.0, 8.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.66748046875, -0.6451797485351562, -0.6228790283203125, -0.6005783081054688, -0.578277587890625, -0.5559768676757812, -0.5336761474609375, -0.5113754272460938, -0.48907470703125, -0.46677398681640625, -0.4444732666015625, -0.42217254638671875, -0.399871826171875, -0.37757110595703125, -0.3552703857421875, -0.33296966552734375, -0.3106689453125, -0.28836822509765625, -0.2660675048828125, -0.24376678466796875, -0.221466064453125, -0.19916534423828125, -0.1768646240234375, -0.15456390380859375, -0.13226318359375, -0.10996246337890625, -0.0876617431640625, -0.06536102294921875, -0.043060302734375, -0.02075958251953125, 0.0015411376953125, 0.02384185791015625, 0.046142578125, 0.06844329833984375, 0.0907440185546875, 0.11304473876953125, 0.135345458984375, 0.15764617919921875, 0.1799468994140625, 0.20224761962890625, 0.22454833984375, 0.24684906005859375, 0.2691497802734375, 0.29145050048828125, 0.313751220703125, 0.33605194091796875, 0.3583526611328125, 0.38065338134765625, 0.4029541015625, 0.42525482177734375, 0.4475555419921875, 0.46985626220703125, 0.492156982421875, 0.5144577026367188, 0.5367584228515625, 0.5590591430664062, 0.58135986328125, 0.6036605834960938, 0.6259613037109375, 0.6482620239257812, 0.670562744140625, 0.6928634643554688, 0.7151641845703125, 0.7374649047851562, 0.759765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 15.0, 13.0, 20.0, 41.0, 72.0, 100.0, 117.0, 272.0, 381.0, 748.0, 1519.0, 3485.0, 10048.0, 36285.0, 249150.0, 623441.0, 92479.0, 19282.0, 6198.0, 2358.0, 1105.0, 549.0, 354.0, 188.0, 111.0, 85.0, 49.0, 21.0, 18.0, 12.0, 6.0, 7.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07648849487304688, -0.07387542724609375, -0.07126235961914062, -0.0686492919921875, -0.06603622436523438, -0.06342315673828125, -0.060810089111328125, -0.058197021484375, -0.055583953857421875, -0.05297088623046875, -0.050357818603515625, -0.0477447509765625, -0.045131683349609375, -0.04251861572265625, -0.039905548095703125, -0.03729248046875, -0.034679412841796875, -0.03206634521484375, -0.029453277587890625, -0.0268402099609375, -0.024227142333984375, -0.02161407470703125, -0.019001007080078125, -0.016387939453125, -0.013774871826171875, -0.01116180419921875, -0.008548736572265625, -0.0059356689453125, -0.003322601318359375, -0.00070953369140625, 0.001903533935546875, 0.0045166015625, 0.007129669189453125, 0.00974273681640625, 0.012355804443359375, 0.0149688720703125, 0.017581939697265625, 0.02019500732421875, 0.022808074951171875, 0.025421142578125, 0.028034210205078125, 0.03064727783203125, 0.033260345458984375, 0.0358734130859375, 0.038486480712890625, 0.04109954833984375, 0.043712615966796875, 0.04632568359375, 0.048938751220703125, 0.05155181884765625, 0.054164886474609375, 0.0567779541015625, 0.059391021728515625, 0.06200408935546875, 0.06461715698242188, 0.067230224609375, 0.06984329223632812, 0.07245635986328125, 0.07506942749023438, 0.0776824951171875, 0.08029556274414062, 0.08290863037109375, 0.08552169799804688, 0.088134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 19.0, 47.0, 75.0, 141.0, 177.0, 205.0, 132.0, 71.0, 46.0, 22.0, 16.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.906564623117447e-05, -2.767331898212433e-05, -2.6280991733074188e-05, -2.4888664484024048e-05, -2.3496337234973907e-05, -2.2104009985923767e-05, -2.0711682736873627e-05, -1.9319355487823486e-05, -1.7927028238773346e-05, -1.6534700989723206e-05, -1.5142373740673065e-05, -1.3750046491622925e-05, -1.2357719242572784e-05, -1.0965391993522644e-05, -9.573064744472504e-06, -8.180737495422363e-06, -6.788410246372223e-06, -5.3960829973220825e-06, -4.003755748271942e-06, -2.6114284992218018e-06, -1.2191012501716614e-06, 1.73225998878479e-07, 1.5655532479286194e-06, 2.9578804969787598e-06, 4.3502077460289e-06, 5.7425349950790405e-06, 7.134862244129181e-06, 8.527189493179321e-06, 9.919516742229462e-06, 1.1311843991279602e-05, 1.2704171240329742e-05, 1.4096498489379883e-05, 1.5488825738430023e-05, 1.6881152987480164e-05, 1.8273480236530304e-05, 1.9665807485580444e-05, 2.1058134734630585e-05, 2.2450461983680725e-05, 2.3842789232730865e-05, 2.5235116481781006e-05, 2.6627443730831146e-05, 2.8019770979881287e-05, 2.9412098228931427e-05, 3.080442547798157e-05, 3.219675272703171e-05, 3.358907997608185e-05, 3.498140722513199e-05, 3.637373447418213e-05, 3.776606172323227e-05, 3.915838897228241e-05, 4.055071622133255e-05, 4.194304347038269e-05, 4.333537071943283e-05, 4.472769796848297e-05, 4.612002521753311e-05, 4.751235246658325e-05, 4.890467971563339e-05, 5.029700696468353e-05, 5.168933421373367e-05, 5.3081661462783813e-05, 5.4473988711833954e-05, 5.5866315960884094e-05, 5.7258643209934235e-05, 5.8650970458984375e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 7.0, 10.0, 13.0, 11.0, 11.0, 18.0, 33.0, 27.0, 40.0, 45.0, 69.0, 114.0, 156.0, 258.0, 442.0, 952.0, 1927.0, 4571.0, 12400.0, 41156.0, 197546.0, 583537.0, 152370.0, 33996.0, 10961.0, 4121.0, 1805.0, 814.0, 427.0, 253.0, 126.0, 95.0, 74.0, 34.0, 43.0, 28.0, 14.0, 10.0, 6.0, 6.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0787353515625, -0.07630729675292969, -0.07387924194335938, -0.07145118713378906, -0.06902313232421875, -0.06659507751464844, -0.06416702270507812, -0.06173896789550781, -0.0593109130859375, -0.05688285827636719, -0.054454803466796875, -0.05202674865722656, -0.04959869384765625, -0.04717063903808594, -0.044742584228515625, -0.04231452941894531, -0.039886474609375, -0.03745841979980469, -0.035030364990234375, -0.03260231018066406, -0.03017425537109375, -0.027746200561523438, -0.025318145751953125, -0.022890090942382812, -0.0204620361328125, -0.018033981323242188, -0.015605926513671875, -0.013177871704101562, -0.01074981689453125, -0.008321762084960938, -0.005893707275390625, -0.0034656524658203125, -0.00103759765625, 0.0013904571533203125, 0.003818511962890625, 0.0062465667724609375, 0.00867462158203125, 0.011102676391601562, 0.013530731201171875, 0.015958786010742188, 0.0183868408203125, 0.020814895629882812, 0.023242950439453125, 0.025671005249023438, 0.02809906005859375, 0.030527114868164062, 0.032955169677734375, 0.03538322448730469, 0.037811279296875, 0.04023933410644531, 0.042667388916015625, 0.04509544372558594, 0.04752349853515625, 0.04995155334472656, 0.052379608154296875, 0.05480766296386719, 0.0572357177734375, 0.05966377258300781, 0.062091827392578125, 0.06451988220214844, 0.06694793701171875, 0.06937599182128906, 0.07180404663085938, 0.07423210144042969, 0.07666015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 3.0, 10.0, 13.0, 19.0, 21.0, 27.0, 38.0, 45.0, 53.0, 76.0, 92.0, 115.0, 90.0, 98.0, 73.0, 53.0, 33.0, 25.0, 20.0, 12.0, 7.0, 13.0, 12.0, 6.0, 5.0, 8.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02557373046875, -0.024761438369750977, -0.023949146270751953, -0.02313685417175293, -0.022324562072753906, -0.021512269973754883, -0.02069997787475586, -0.019887685775756836, -0.019075393676757812, -0.01826310157775879, -0.017450809478759766, -0.016638517379760742, -0.01582622528076172, -0.015013933181762695, -0.014201641082763672, -0.013389348983764648, -0.012577056884765625, -0.011764764785766602, -0.010952472686767578, -0.010140180587768555, -0.009327888488769531, -0.008515596389770508, -0.007703304290771484, -0.006891012191772461, -0.0060787200927734375, -0.005266427993774414, -0.004454135894775391, -0.003641843795776367, -0.0028295516967773438, -0.0020172595977783203, -0.0012049674987792969, -0.00039267539978027344, 0.00041961669921875, 0.0012319087982177734, 0.002044200897216797, 0.0028564929962158203, 0.0036687850952148438, 0.004481077194213867, 0.005293369293212891, 0.006105661392211914, 0.0069179534912109375, 0.007730245590209961, 0.008542537689208984, 0.009354829788208008, 0.010167121887207031, 0.010979413986206055, 0.011791706085205078, 0.012603998184204102, 0.013416290283203125, 0.014228582382202148, 0.015040874481201172, 0.015853166580200195, 0.01666545867919922, 0.017477750778198242, 0.018290042877197266, 0.01910233497619629, 0.019914627075195312, 0.020726919174194336, 0.02153921127319336, 0.022351503372192383, 0.023163795471191406, 0.02397608757019043, 0.024788379669189453, 0.025600671768188477, 0.0264129638671875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 12.0, 38.0, 84.0, 143.0, 214.0, 203.0, 132.0, 93.0, 44.0, 16.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8637725114822388, -0.8318920731544495, -0.8000116944313049, -0.7681312561035156, -0.7362508773803711, -0.7043704390525818, -0.6724900007247925, -0.640609622001648, -0.6087291836738586, -0.5768487453460693, -0.5449683666229248, -0.5130879282951355, -0.4812075197696686, -0.44932711124420166, -0.41744667291641235, -0.38556626439094543, -0.3536858558654785, -0.3218054473400116, -0.2899250388145447, -0.25804460048675537, -0.22616419196128845, -0.19428378343582153, -0.16240336000919342, -0.1305229365825653, -0.09864252805709839, -0.06676211208105087, -0.03488169610500336, -0.003001280128955841, 0.028879135847091675, 0.060759544372558594, 0.0926399677991867, 0.12452039122581482, 0.15640079975128174, 0.18828120827674866, 0.22016163170337677, 0.2520420551300049, 0.2839224636554718, 0.3158028721809387, 0.347683310508728, 0.37956371903419495, 0.41144412755966187, 0.4433245360851288, 0.4752049446105957, 0.507085382938385, 0.5389658212661743, 0.5708461999893188, 0.6027266383171082, 0.6346070766448975, 0.666487455368042, 0.6983678936958313, 0.7302482724189758, 0.7621287107467651, 0.7940090894699097, 0.825889527797699, 0.8577699661254883, 0.8896503448486328, 0.9215307831764221, 0.9534112215042114, 0.985291600227356, 1.0171719789505005, 1.0490524768829346, 1.080932855606079, 1.1128132343292236, 1.1446937322616577, 1.1765741109848022]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 7.0, 9.0, 13.0, 25.0, 31.0, 30.0, 42.0, 42.0, 36.0, 61.0, 42.0, 49.0, 60.0, 64.0, 59.0, 54.0, 45.0, 45.0, 48.0, 31.0, 40.0, 25.0, 30.0, 26.0, 26.0, 8.0, 19.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26588261127471924, -0.2541697025299072, -0.2424568235874176, -0.23074392974376678, -0.21903103590011597, -0.20731814205646515, -0.19560524821281433, -0.1838923543691635, -0.1721794605255127, -0.16046656668186188, -0.14875367283821106, -0.13704077899456024, -0.12532788515090942, -0.1136149913072586, -0.10190209746360779, -0.09018920361995697, -0.07847630977630615, -0.06676341593265533, -0.05505052208900452, -0.0433376282453537, -0.03162473440170288, -0.019911840558052063, -0.008198946714401245, 0.0035139471292495728, 0.01522684097290039, 0.02693973481655121, 0.038652628660202026, 0.050365522503852844, 0.06207841634750366, 0.07379131019115448, 0.0855042040348053, 0.09721709787845612, 0.10893002152442932, 0.12064291536808014, 0.13235580921173096, 0.14406870305538177, 0.1557815968990326, 0.1674944907426834, 0.17920738458633423, 0.19092027842998505, 0.20263317227363586, 0.21434606611728668, 0.2260589599609375, 0.23777185380458832, 0.24948474764823914, 0.26119762659072876, 0.27291053533554077, 0.2846234440803528, 0.2963363230228424, 0.30804920196533203, 0.31976211071014404, 0.33147501945495605, 0.3431878983974457, 0.3549007773399353, 0.3666136860847473, 0.3783265948295593, 0.39003947377204895, 0.4017523527145386, 0.4134652614593506, 0.4251781702041626, 0.4368910491466522, 0.44860392808914185, 0.46031683683395386, 0.47202974557876587, 0.4837426245212555]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 16.0, 7.0, 16.0, 31.0, 36.0, 57.0, 97.0, 159.0, 258.0, 508.0, 1113.0, 2551.0, 7508.0, 28899.0, 139316.0, 622839.0, 192001.0, 38159.0, 9315.0, 3117.0, 1213.0, 571.0, 310.0, 177.0, 106.0, 45.0, 34.0, 29.0, 16.0, 12.0, 12.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37207794189453125, -0.3569488525390625, -0.34181976318359375, -0.326690673828125, -0.31156158447265625, -0.2964324951171875, -0.28130340576171875, -0.26617431640625, -0.25104522705078125, -0.2359161376953125, -0.22078704833984375, -0.205657958984375, -0.19052886962890625, -0.1753997802734375, -0.16027069091796875, -0.1451416015625, -0.13001251220703125, -0.1148834228515625, -0.09975433349609375, -0.084625244140625, -0.06949615478515625, -0.0543670654296875, -0.03923797607421875, -0.02410888671875, -0.00897979736328125, 0.0061492919921875, 0.02127838134765625, 0.036407470703125, 0.05153656005859375, 0.0666656494140625, 0.08179473876953125, 0.096923828125, 0.11205291748046875, 0.1271820068359375, 0.14231109619140625, 0.157440185546875, 0.17256927490234375, 0.1876983642578125, 0.20282745361328125, 0.21795654296875, 0.23308563232421875, 0.2482147216796875, 0.26334381103515625, 0.278472900390625, 0.29360198974609375, 0.3087310791015625, 0.32386016845703125, 0.3389892578125, 0.35411834716796875, 0.3692474365234375, 0.38437652587890625, 0.399505615234375, 0.41463470458984375, 0.4297637939453125, 0.44489288330078125, 0.46002197265625, 0.47515106201171875, 0.4902801513671875, 0.5054092407226562, 0.520538330078125, 0.5356674194335938, 0.5507965087890625, 0.5659255981445312, 0.5810546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 11.0, 11.0, 15.0, 16.0, 19.0, 33.0, 37.0, 50.0, 35.0, 57.0, 59.0, 49.0, 48.0, 51.0, 48.0, 55.0, 42.0, 45.0, 52.0, 28.0, 49.0, 42.0, 29.0, 22.0, 19.0, 17.0, 12.0, 13.0, 7.0, 6.0, 7.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.509765625, -0.488555908203125, -0.46734619140625, -0.446136474609375, -0.4249267578125, -0.403717041015625, -0.38250732421875, -0.361297607421875, -0.340087890625, -0.318878173828125, -0.29766845703125, -0.276458740234375, -0.2552490234375, -0.234039306640625, -0.21282958984375, -0.191619873046875, -0.17041015625, -0.149200439453125, -0.12799072265625, -0.106781005859375, -0.0855712890625, -0.064361572265625, -0.04315185546875, -0.021942138671875, -0.000732421875, 0.020477294921875, 0.04168701171875, 0.062896728515625, 0.0841064453125, 0.105316162109375, 0.12652587890625, 0.147735595703125, 0.1689453125, 0.190155029296875, 0.21136474609375, 0.232574462890625, 0.2537841796875, 0.274993896484375, 0.29620361328125, 0.317413330078125, 0.338623046875, 0.359832763671875, 0.38104248046875, 0.402252197265625, 0.4234619140625, 0.444671630859375, 0.46588134765625, 0.487091064453125, 0.50830078125, 0.529510498046875, 0.55072021484375, 0.571929931640625, 0.5931396484375, 0.614349365234375, 0.63555908203125, 0.656768798828125, 0.677978515625, 0.699188232421875, 0.72039794921875, 0.741607666015625, 0.7628173828125, 0.784027099609375, 0.80523681640625, 0.826446533203125, 0.84765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 3.0, 5.0, 7.0, 2.0, 9.0, 8.0, 8.0, 17.0, 23.0, 34.0, 41.0, 55.0, 76.0, 104.0, 205.0, 368.0, 899.0, 3291.0, 56873.0, 928493.0, 52961.0, 3318.0, 787.0, 339.0, 179.0, 128.0, 85.0, 64.0, 34.0, 37.0, 23.0, 18.0, 9.0, 11.0, 8.0, 6.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.345703125, -1.3066864013671875, -1.267669677734375, -1.2286529541015625, -1.18963623046875, -1.1506195068359375, -1.111602783203125, -1.0725860595703125, -1.0335693359375, -0.9945526123046875, -0.955535888671875, -0.9165191650390625, -0.87750244140625, -0.8384857177734375, -0.799468994140625, -0.7604522705078125, -0.721435546875, -0.6824188232421875, -0.643402099609375, -0.6043853759765625, -0.56536865234375, -0.5263519287109375, -0.487335205078125, -0.4483184814453125, -0.4093017578125, -0.3702850341796875, -0.331268310546875, -0.2922515869140625, -0.25323486328125, -0.2142181396484375, -0.175201416015625, -0.1361846923828125, -0.09716796875, -0.0581512451171875, -0.019134521484375, 0.0198822021484375, 0.05889892578125, 0.0979156494140625, 0.136932373046875, 0.1759490966796875, 0.2149658203125, 0.2539825439453125, 0.292999267578125, 0.3320159912109375, 0.37103271484375, 0.4100494384765625, 0.449066162109375, 0.4880828857421875, 0.527099609375, 0.5661163330078125, 0.605133056640625, 0.6441497802734375, 0.68316650390625, 0.7221832275390625, 0.761199951171875, 0.8002166748046875, 0.8392333984375, 0.8782501220703125, 0.917266845703125, 0.9562835693359375, 0.99530029296875, 1.0343170166015625, 1.073333740234375, 1.1123504638671875, 1.1513671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 6.0, 2.0, 6.0, 10.0, 5.0, 16.0, 11.0, 14.0, 15.0, 23.0, 23.0, 28.0, 31.0, 41.0, 26.0, 30.0, 38.0, 36.0, 45.0, 56.0, 49.0, 49.0, 60.0, 37.0, 56.0, 40.0, 35.0, 36.0, 25.0, 24.0, 29.0, 19.0, 13.0, 11.0, 11.0, 6.0, 8.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.7509765625, -0.7285919189453125, -0.706207275390625, -0.6838226318359375, -0.66143798828125, -0.6390533447265625, -0.616668701171875, -0.5942840576171875, -0.5718994140625, -0.5495147705078125, -0.527130126953125, -0.5047454833984375, -0.48236083984375, -0.4599761962890625, -0.437591552734375, -0.4152069091796875, -0.392822265625, -0.3704376220703125, -0.348052978515625, -0.3256683349609375, -0.30328369140625, -0.2808990478515625, -0.258514404296875, -0.2361297607421875, -0.2137451171875, -0.1913604736328125, -0.168975830078125, -0.1465911865234375, -0.12420654296875, -0.1018218994140625, -0.079437255859375, -0.0570526123046875, -0.03466796875, -0.0122833251953125, 0.010101318359375, 0.0324859619140625, 0.05487060546875, 0.0772552490234375, 0.099639892578125, 0.1220245361328125, 0.1444091796875, 0.1667938232421875, 0.189178466796875, 0.2115631103515625, 0.23394775390625, 0.2563323974609375, 0.278717041015625, 0.3011016845703125, 0.323486328125, 0.3458709716796875, 0.368255615234375, 0.3906402587890625, 0.41302490234375, 0.4354095458984375, 0.457794189453125, 0.4801788330078125, 0.5025634765625, 0.5249481201171875, 0.547332763671875, 0.5697174072265625, 0.59210205078125, 0.6144866943359375, 0.636871337890625, 0.6592559814453125, 0.681640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 12.0, 19.0, 37.0, 55.0, 108.0, 239.0, 782.0, 5248.0, 130982.0, 872326.0, 35329.0, 2483.0, 525.0, 163.0, 83.0, 48.0, 23.0, 22.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310302734375, -0.3009910583496094, -0.29167938232421875, -0.2823677062988281, -0.2730560302734375, -0.2637443542480469, -0.25443267822265625, -0.24512100219726562, -0.235809326171875, -0.22649765014648438, -0.21718597412109375, -0.20787429809570312, -0.1985626220703125, -0.18925094604492188, -0.17993927001953125, -0.17062759399414062, -0.16131591796875, -0.15200424194335938, -0.14269256591796875, -0.13338088989257812, -0.1240692138671875, -0.11475753784179688, -0.10544586181640625, -0.09613418579101562, -0.086822509765625, -0.07751083374023438, -0.06819915771484375, -0.058887481689453125, -0.0495758056640625, -0.040264129638671875, -0.03095245361328125, -0.021640777587890625, -0.0123291015625, -0.003017425537109375, 0.00629425048828125, 0.015605926513671875, 0.0249176025390625, 0.034229278564453125, 0.04354095458984375, 0.052852630615234375, 0.062164306640625, 0.07147598266601562, 0.08078765869140625, 0.09009933471679688, 0.0994110107421875, 0.10872268676757812, 0.11803436279296875, 0.12734603881835938, 0.13665771484375, 0.14596939086914062, 0.15528106689453125, 0.16459274291992188, 0.1739044189453125, 0.18321609497070312, 0.19252777099609375, 0.20183944702148438, 0.211151123046875, 0.22046279907226562, 0.22977447509765625, 0.23908615112304688, 0.2483978271484375, 0.2577095031738281, 0.26702117919921875, 0.2763328552246094, 0.28564453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 14.0, 14.0, 13.0, 16.0, 24.0, 40.0, 52.0, 60.0, 106.0, 122.0, 167.0, 91.0, 82.0, 47.0, 41.0, 24.0, 24.0, 14.0, 14.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.5570392608642578e-05, -2.4881213903427124e-05, -2.419203519821167e-05, -2.3502856492996216e-05, -2.2813677787780762e-05, -2.2124499082565308e-05, -2.1435320377349854e-05, -2.07461416721344e-05, -2.0056962966918945e-05, -1.936778426170349e-05, -1.8678605556488037e-05, -1.7989426851272583e-05, -1.730024814605713e-05, -1.6611069440841675e-05, -1.592189073562622e-05, -1.5232712030410767e-05, -1.4543533325195312e-05, -1.3854354619979858e-05, -1.3165175914764404e-05, -1.247599720954895e-05, -1.1786818504333496e-05, -1.1097639799118042e-05, -1.0408461093902588e-05, -9.719282388687134e-06, -9.03010368347168e-06, -8.340924978256226e-06, -7.651746273040771e-06, -6.962567567825317e-06, -6.273388862609863e-06, -5.584210157394409e-06, -4.895031452178955e-06, -4.205852746963501e-06, -3.516674041748047e-06, -2.8274953365325928e-06, -2.1383166313171387e-06, -1.4491379261016846e-06, -7.599592208862305e-07, -7.078051567077637e-08, 6.183981895446777e-07, 1.3075768947601318e-06, 1.996755599975586e-06, 2.68593430519104e-06, 3.375113010406494e-06, 4.064291715621948e-06, 4.753470420837402e-06, 5.4426491260528564e-06, 6.1318278312683105e-06, 6.821006536483765e-06, 7.510185241699219e-06, 8.199363946914673e-06, 8.888542652130127e-06, 9.577721357345581e-06, 1.0266900062561035e-05, 1.095607876777649e-05, 1.1645257472991943e-05, 1.2334436178207397e-05, 1.3023614883422852e-05, 1.3712793588638306e-05, 1.440197229385376e-05, 1.5091150999069214e-05, 1.5780329704284668e-05, 1.6469508409500122e-05, 1.7158687114715576e-05, 1.784786581993103e-05, 1.8537044525146484e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 12.0, 20.0, 35.0, 74.0, 131.0, 300.0, 997.0, 4315.0, 86820.0, 922773.0, 29091.0, 2694.0, 743.0, 269.0, 139.0, 55.0, 31.0, 16.0, 8.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4989643096923828, -0.4871864318847656, -0.47540855407714844, -0.46363067626953125, -0.45185279846191406, -0.4400749206542969, -0.4282970428466797, -0.4165191650390625, -0.4047412872314453, -0.3929634094238281, -0.38118553161621094, -0.36940765380859375, -0.35762977600097656, -0.3458518981933594, -0.3340740203857422, -0.322296142578125, -0.3105182647705078, -0.2987403869628906, -0.28696250915527344, -0.27518463134765625, -0.26340675354003906, -0.2516288757324219, -0.2398509979248047, -0.2280731201171875, -0.2162952423095703, -0.20451736450195312, -0.19273948669433594, -0.18096160888671875, -0.16918373107910156, -0.15740585327148438, -0.1456279754638672, -0.13385009765625, -0.12207221984863281, -0.11029434204101562, -0.09851646423339844, -0.08673858642578125, -0.07496070861816406, -0.06318283081054688, -0.05140495300292969, -0.0396270751953125, -0.027849197387695312, -0.016071319580078125, -0.0042934417724609375, 0.00748443603515625, 0.019262313842773438, 0.031040191650390625, 0.04281806945800781, 0.054595947265625, 0.06637382507324219, 0.07815170288085938, 0.08992958068847656, 0.10170745849609375, 0.11348533630371094, 0.12526321411132812, 0.1370410919189453, 0.1488189697265625, 0.1605968475341797, 0.17237472534179688, 0.18415260314941406, 0.19593048095703125, 0.20770835876464844, 0.21948623657226562, 0.2312641143798828, 0.2430419921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 7.0, 14.0, 14.0, 28.0, 44.0, 43.0, 46.0, 80.0, 93.0, 166.0, 116.0, 82.0, 64.0, 51.0, 39.0, 26.0, 19.0, 13.0, 6.0, 7.0, 6.0, 5.0, 5.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0560302734375, -0.05365753173828125, -0.0512847900390625, -0.04891204833984375, -0.046539306640625, -0.04416656494140625, -0.0417938232421875, -0.03942108154296875, -0.03704833984375, -0.03467559814453125, -0.0323028564453125, -0.02993011474609375, -0.027557373046875, -0.02518463134765625, -0.0228118896484375, -0.02043914794921875, -0.01806640625, -0.01569366455078125, -0.0133209228515625, -0.01094818115234375, -0.008575439453125, -0.00620269775390625, -0.0038299560546875, -0.00145721435546875, 0.00091552734375, 0.00328826904296875, 0.0056610107421875, 0.00803375244140625, 0.010406494140625, 0.01277923583984375, 0.0151519775390625, 0.01752471923828125, 0.0198974609375, 0.02227020263671875, 0.0246429443359375, 0.02701568603515625, 0.029388427734375, 0.03176116943359375, 0.0341339111328125, 0.03650665283203125, 0.03887939453125, 0.04125213623046875, 0.0436248779296875, 0.04599761962890625, 0.048370361328125, 0.05074310302734375, 0.0531158447265625, 0.05548858642578125, 0.057861328125, 0.06023406982421875, 0.0626068115234375, 0.06497955322265625, 0.067352294921875, 0.06972503662109375, 0.0720977783203125, 0.07447052001953125, 0.07684326171875, 0.07921600341796875, 0.0815887451171875, 0.08396148681640625, 0.086334228515625, 0.08870697021484375, 0.0910797119140625, 0.09345245361328125, 0.0958251953125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 16.0, 33.0, 134.0, 213.0, 296.0, 196.0, 67.0, 36.0, 15.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16535758972168, -4.077333927154541, -3.9893105030059814, -3.901287078857422, -3.813263416290283, -3.7252399921417236, -3.637216567993164, -3.5491929054260254, -3.461169481277466, -3.3731460571289062, -3.2851223945617676, -3.197098970413208, -3.1090755462646484, -3.0210518836975098, -2.93302845954895, -2.8450050354003906, -2.756981372833252, -2.6689579486846924, -2.5809342861175537, -2.492910861968994, -2.4048871994018555, -2.316863775253296, -2.2288403511047363, -2.1408166885375977, -2.052793264389038, -1.964769721031189, -1.8767461776733398, -1.7887227535247803, -1.7006992101669312, -1.612675666809082, -1.5246522426605225, -1.4366286993026733, -1.3486050367355347, -1.2605814933776855, -1.172558069229126, -1.0845345258712769, -0.9965109825134277, -0.9084874391555786, -0.8204639554023743, -0.7324404716491699, -0.6444169282913208, -0.5563933849334717, -0.46836990118026733, -0.3803463876247406, -0.29232287406921387, -0.20429936051368713, -0.1162758469581604, -0.028252363204956055, 0.059771180152893066, 0.1477946937084198, 0.23581820726394653, 0.32384172081947327, 0.411865234375, 0.49988874793052673, 0.5879122614860535, 0.6759357452392578, 0.7639592885971069, 0.851982831954956, 0.9400063157081604, 1.0280297994613647, 1.1160533428192139, 1.204076886177063, 1.292100429534912, 1.3801238536834717, 1.4681473970413208]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 6.0, 20.0, 8.0, 13.0, 16.0, 29.0, 24.0, 25.0, 24.0, 24.0, 39.0, 31.0, 32.0, 41.0, 36.0, 51.0, 41.0, 53.0, 44.0, 56.0, 42.0, 39.0, 52.0, 41.0, 26.0, 28.0, 26.0, 18.0, 24.0, 15.0, 20.0, 7.0, 9.0, 7.0, 6.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0659652948379517, -1.0279369354248047, -0.9899085760116577, -0.9518802762031555, -0.9138519167900085, -0.8758235573768616, -0.8377952575683594, -0.7997668981552124, -0.7617385387420654, -0.7237101793289185, -0.6856818199157715, -0.6476535201072693, -0.6096251606941223, -0.5715968012809753, -0.5335685014724731, -0.49554014205932617, -0.4575117826461792, -0.4194834232330322, -0.38145509362220764, -0.34342676401138306, -0.3053984045982361, -0.2673700451850891, -0.22934171557426453, -0.19131338596343994, -0.15328502655029297, -0.11525668203830719, -0.07722833752632141, -0.03919999301433563, -0.0011716485023498535, 0.036856696009635925, 0.0748850405216217, 0.11291337013244629, 0.15094172954559326, 0.18897007405757904, 0.22699841856956482, 0.2650267481803894, 0.3030551075935364, 0.34108346700668335, 0.37911179661750793, 0.4171401262283325, 0.4551684856414795, 0.49319684505462646, 0.5312252044677734, 0.5692535042762756, 0.6072818636894226, 0.6453102231025696, 0.6833385229110718, 0.7213668823242188, 0.7593952417373657, 0.7974236011505127, 0.8354519605636597, 0.8734802603721619, 0.9115086197853088, 0.9495369791984558, 0.987565279006958, 1.025593638420105, 1.063621997833252, 1.101650357246399, 1.139678716659546, 1.1777070760726929, 1.2157354354858398, 1.2537636756896973, 1.2917920351028442, 1.3298203945159912, 1.3678487539291382]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 8.0, 11.0, 19.0, 18.0, 29.0, 30.0, 39.0, 63.0, 118.0, 173.0, 318.0, 634.0, 1394.0, 4173.0, 15750.0, 95264.0, 1387862.0, 2451348.0, 202736.0, 24703.0, 5863.0, 1890.0, 794.0, 375.0, 231.0, 125.0, 86.0, 62.0, 45.0, 23.0, 19.0, 22.0, 14.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71728515625, -0.6942596435546875, -0.671234130859375, -0.6482086181640625, -0.62518310546875, -0.6021575927734375, -0.579132080078125, -0.5561065673828125, -0.5330810546875, -0.5100555419921875, -0.487030029296875, -0.4640045166015625, -0.44097900390625, -0.4179534912109375, -0.394927978515625, -0.3719024658203125, -0.348876953125, -0.3258514404296875, -0.302825927734375, -0.2798004150390625, -0.25677490234375, -0.2337493896484375, -0.210723876953125, -0.1876983642578125, -0.1646728515625, -0.1416473388671875, -0.118621826171875, -0.0955963134765625, -0.07257080078125, -0.0495452880859375, -0.026519775390625, -0.0034942626953125, 0.01953125, 0.0425567626953125, 0.065582275390625, 0.0886077880859375, 0.11163330078125, 0.1346588134765625, 0.157684326171875, 0.1807098388671875, 0.2037353515625, 0.2267608642578125, 0.249786376953125, 0.2728118896484375, 0.29583740234375, 0.3188629150390625, 0.341888427734375, 0.3649139404296875, 0.387939453125, 0.4109649658203125, 0.433990478515625, 0.4570159912109375, 0.48004150390625, 0.5030670166015625, 0.526092529296875, 0.5491180419921875, 0.5721435546875, 0.5951690673828125, 0.618194580078125, 0.6412200927734375, 0.66424560546875, 0.6872711181640625, 0.710296630859375, 0.7333221435546875, 0.75634765625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 1.0, 11.0, 16.0, 16.0, 19.0, 22.0, 35.0, 34.0, 33.0, 53.0, 67.0, 59.0, 69.0, 62.0, 63.0, 61.0, 70.0, 48.0, 50.0, 38.0, 39.0, 23.0, 29.0, 27.0, 16.0, 6.0, 12.0, 9.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.3399925231933594, -0.32524871826171875, -0.3105049133300781, -0.2957611083984375, -0.2810173034667969, -0.26627349853515625, -0.2515296936035156, -0.236785888671875, -0.22204208374023438, -0.20729827880859375, -0.19255447387695312, -0.1778106689453125, -0.16306686401367188, -0.14832305908203125, -0.13357925415039062, -0.11883544921875, -0.10409164428710938, -0.08934783935546875, -0.07460403442382812, -0.0598602294921875, -0.045116424560546875, -0.03037261962890625, -0.015628814697265625, -0.000885009765625, 0.013858795166015625, 0.02860260009765625, 0.043346405029296875, 0.0580902099609375, 0.07283401489257812, 0.08757781982421875, 0.10232162475585938, 0.1170654296875, 0.13180923461914062, 0.14655303955078125, 0.16129684448242188, 0.1760406494140625, 0.19078445434570312, 0.20552825927734375, 0.22027206420898438, 0.235015869140625, 0.24975967407226562, 0.26450347900390625, 0.2792472839355469, 0.2939910888671875, 0.3087348937988281, 0.32347869873046875, 0.3382225036621094, 0.35296630859375, 0.3677101135253906, 0.38245391845703125, 0.3971977233886719, 0.4119415283203125, 0.4266853332519531, 0.44142913818359375, 0.4561729431152344, 0.470916748046875, 0.4856605529785156, 0.5004043579101562, 0.5151481628417969, 0.5298919677734375, 0.5446357727050781, 0.5593795776367188, 0.5741233825683594, 0.5888671875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 10.0, 11.0, 13.0, 16.0, 31.0, 54.0, 108.0, 167.0, 332.0, 742.0, 3491.0, 53317.0, 3845590.0, 279763.0, 8374.0, 1347.0, 446.0, 204.0, 95.0, 66.0, 40.0, 17.0, 10.0, 12.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.599609375, -1.553497314453125, -1.50738525390625, -1.461273193359375, -1.4151611328125, -1.369049072265625, -1.32293701171875, -1.276824951171875, -1.230712890625, -1.184600830078125, -1.13848876953125, -1.092376708984375, -1.0462646484375, -1.000152587890625, -0.95404052734375, -0.907928466796875, -0.86181640625, -0.815704345703125, -0.76959228515625, -0.723480224609375, -0.6773681640625, -0.631256103515625, -0.58514404296875, -0.539031982421875, -0.492919921875, -0.446807861328125, -0.40069580078125, -0.354583740234375, -0.3084716796875, -0.262359619140625, -0.21624755859375, -0.170135498046875, -0.1240234375, -0.077911376953125, -0.03179931640625, 0.014312744140625, 0.0604248046875, 0.106536865234375, 0.15264892578125, 0.198760986328125, 0.244873046875, 0.290985107421875, 0.33709716796875, 0.383209228515625, 0.4293212890625, 0.475433349609375, 0.52154541015625, 0.567657470703125, 0.61376953125, 0.659881591796875, 0.70599365234375, 0.752105712890625, 0.7982177734375, 0.844329833984375, 0.89044189453125, 0.936553955078125, 0.982666015625, 1.028778076171875, 1.07489013671875, 1.121002197265625, 1.1671142578125, 1.213226318359375, 1.25933837890625, 1.305450439453125, 1.3515625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 9.0, 3.0, 8.0, 25.0, 29.0, 62.0, 160.0, 311.0, 633.0, 1070.0, 878.0, 487.0, 215.0, 73.0, 46.0, 27.0, 22.0, 13.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4169921875, -0.4049949645996094, -0.39299774169921875, -0.3810005187988281, -0.3690032958984375, -0.3570060729980469, -0.34500885009765625, -0.3330116271972656, -0.321014404296875, -0.3090171813964844, -0.29701995849609375, -0.2850227355957031, -0.2730255126953125, -0.2610282897949219, -0.24903106689453125, -0.23703384399414062, -0.22503662109375, -0.21303939819335938, -0.20104217529296875, -0.18904495239257812, -0.1770477294921875, -0.16505050659179688, -0.15305328369140625, -0.14105606079101562, -0.129058837890625, -0.11706161499023438, -0.10506439208984375, -0.09306716918945312, -0.0810699462890625, -0.06907272338867188, -0.05707550048828125, -0.045078277587890625, -0.0330810546875, -0.021083831787109375, -0.00908660888671875, 0.002910614013671875, 0.0149078369140625, 0.026905059814453125, 0.03890228271484375, 0.050899505615234375, 0.062896728515625, 0.07489395141601562, 0.08689117431640625, 0.09888839721679688, 0.1108856201171875, 0.12288284301757812, 0.13488006591796875, 0.14687728881835938, 0.15887451171875, 0.17087173461914062, 0.18286895751953125, 0.19486618041992188, 0.2068634033203125, 0.21886062622070312, 0.23085784912109375, 0.24285507202148438, 0.254852294921875, 0.2668495178222656, 0.27884674072265625, 0.2908439636230469, 0.3028411865234375, 0.3148384094238281, 0.32683563232421875, 0.3388328552246094, 0.350830078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 10.0, 15.0, 18.0, 25.0, 35.0, 36.0, 52.0, 48.0, 54.0, 61.0, 67.0, 62.0, 72.0, 68.0, 47.0, 56.0, 54.0, 45.0, 36.0, 40.0, 15.0, 21.0, 12.0, 15.0, 11.0, 6.0, 3.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3767976462841034, -0.36137092113494873, -0.34594422578811646, -0.3305175006389618, -0.31509077548980713, -0.29966408014297485, -0.2842373549938202, -0.2688106298446655, -0.25338393449783325, -0.23795722424983978, -0.2225305140018463, -0.20710378885269165, -0.19167707860469818, -0.1762503683567047, -0.16082364320755005, -0.14539693295955658, -0.1299702227115631, -0.11454351246356964, -0.09911679476499557, -0.08369007706642151, -0.06826336681842804, -0.05283665657043457, -0.037409938871860504, -0.021983221173286438, -0.006556510925292969, 0.008870203047990799, 0.024296917021274567, 0.039723630994558334, 0.0551503449678421, 0.07057705521583557, 0.08600377291440964, 0.1014304906129837, 0.11685717105865479, 0.13228388130664825, 0.14771059155464172, 0.1631373167037964, 0.17856402695178986, 0.19399073719978333, 0.209417462348938, 0.22484417259693146, 0.24027088284492493, 0.2556976079940796, 0.27112430334091187, 0.28655102849006653, 0.3019777536392212, 0.31740444898605347, 0.33283117413520813, 0.3482578992843628, 0.36368459463119507, 0.37911131978034973, 0.394538015127182, 0.40996474027633667, 0.42539143562316895, 0.4408181607723236, 0.45624488592147827, 0.47167158126831055, 0.4870983064174652, 0.5025250315666199, 0.5179517269134521, 0.5333784222602844, 0.5488051772117615, 0.5642318725585938, 0.579658567905426, 0.5950853228569031, 0.6105120182037354]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [6.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 17.0, 16.0, 21.0, 19.0, 30.0, 15.0, 30.0, 27.0, 36.0, 29.0, 34.0, 34.0, 36.0, 41.0, 39.0, 30.0, 39.0, 41.0, 36.0, 27.0, 23.0, 27.0, 38.0, 29.0, 16.0, 23.0, 26.0, 24.0, 13.0, 16.0, 14.0, 13.0, 13.0, 11.0, 10.0, 10.0, 4.0, 8.0, 4.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29435452818870544, -0.2841488718986511, -0.2739432454109192, -0.26373758912086487, -0.25353196263313293, -0.2433263063430786, -0.23312066495418549, -0.22291502356529236, -0.21270936727523804, -0.2025037258863449, -0.19229808449745178, -0.18209242820739746, -0.17188678681850433, -0.1616811454296112, -0.15147550404071808, -0.14126986265182495, -0.13106422126293182, -0.1208585798740387, -0.11065293103456497, -0.10044728964567184, -0.09024164080619812, -0.08003599941730499, -0.06983035802841187, -0.05962470918893814, -0.04941906780004501, -0.03921342268586159, -0.02900777943432331, -0.018802136182785034, -0.008596491068601608, 0.0016091540455818176, 0.011814795434474945, 0.02202044427394867, 0.0322260856628418, 0.04243173077702522, 0.05263737589120865, 0.06284301728010178, 0.0730486661195755, 0.08325430750846863, 0.09345994889736176, 0.10366559773683548, 0.11387123912572861, 0.12407688051462173, 0.13428252935409546, 0.1444881707429886, 0.1546938121318817, 0.16489946842193604, 0.17510509490966797, 0.1853107511997223, 0.19551639258861542, 0.20572203397750854, 0.21592767536640167, 0.2261333167552948, 0.23633897304534912, 0.24654461443424225, 0.2567502558231354, 0.2669559121131897, 0.27716153860092163, 0.28736719489097595, 0.2975728213787079, 0.3077784776687622, 0.31798410415649414, 0.32818976044654846, 0.3383954167366028, 0.3486010432243347, 0.35880669951438904]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 7.0, 10.0, 24.0, 21.0, 26.0, 42.0, 70.0, 92.0, 162.0, 239.0, 350.0, 550.0, 907.0, 1529.0, 2630.0, 4728.0, 8808.0, 16806.0, 35082.0, 79949.0, 194066.0, 323853.0, 212758.0, 87994.0, 38278.0, 18227.0, 9278.0, 5010.0, 2814.0, 1670.0, 931.0, 552.0, 330.0, 241.0, 184.0, 116.0, 58.0, 51.0, 27.0, 22.0, 16.0, 16.0, 11.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09180355072021484, -0.08869743347167969, -0.08559131622314453, -0.08248519897460938, -0.07937908172607422, -0.07627296447753906, -0.0731668472290039, -0.07006072998046875, -0.0669546127319336, -0.06384849548339844, -0.06074237823486328, -0.057636260986328125, -0.05453014373779297, -0.05142402648925781, -0.048317909240722656, -0.0452117919921875, -0.042105674743652344, -0.03899955749511719, -0.03589344024658203, -0.032787322998046875, -0.02968120574951172, -0.026575088500976562, -0.023468971252441406, -0.02036285400390625, -0.017256736755371094, -0.014150619506835938, -0.011044502258300781, -0.007938385009765625, -0.004832267761230469, -0.0017261505126953125, 0.0013799667358398438, 0.004486083984375, 0.007592201232910156, 0.010698318481445312, 0.013804435729980469, 0.016910552978515625, 0.02001667022705078, 0.023122787475585938, 0.026228904724121094, 0.02933502197265625, 0.032441139221191406, 0.03554725646972656, 0.03865337371826172, 0.041759490966796875, 0.04486560821533203, 0.04797172546386719, 0.051077842712402344, 0.0541839599609375, 0.057290077209472656, 0.06039619445800781, 0.06350231170654297, 0.06660842895507812, 0.06971454620361328, 0.07282066345214844, 0.0759267807006836, 0.07903289794921875, 0.0821390151977539, 0.08524513244628906, 0.08835124969482422, 0.09145736694335938, 0.09456348419189453, 0.09766960144042969, 0.10077571868896484, 0.1038818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 8.0, 12.0, 14.0, 19.0, 17.0, 28.0, 28.0, 27.0, 29.0, 37.0, 38.0, 33.0, 32.0, 33.0, 39.0, 51.0, 41.0, 41.0, 34.0, 32.0, 36.0, 40.0, 40.0, 34.0, 32.0, 31.0, 24.0, 18.0, 23.0, 13.0, 11.0, 14.0, 13.0, 8.0, 7.0, 15.0, 10.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.204345703125, -0.19751358032226562, -0.19068145751953125, -0.18384933471679688, -0.1770172119140625, -0.17018508911132812, -0.16335296630859375, -0.15652084350585938, -0.149688720703125, -0.14285659790039062, -0.13602447509765625, -0.12919235229492188, -0.1223602294921875, -0.11552810668945312, -0.10869598388671875, -0.10186386108398438, -0.09503173828125, -0.08819961547851562, -0.08136749267578125, -0.07453536987304688, -0.0677032470703125, -0.060871124267578125, -0.05403900146484375, -0.047206878662109375, -0.040374755859375, -0.033542633056640625, -0.02671051025390625, -0.019878387451171875, -0.0130462646484375, -0.006214141845703125, 0.00061798095703125, 0.007450103759765625, 0.0142822265625, 0.021114349365234375, 0.02794647216796875, 0.034778594970703125, 0.0416107177734375, 0.048442840576171875, 0.05527496337890625, 0.062107086181640625, 0.068939208984375, 0.07577133178710938, 0.08260345458984375, 0.08943557739257812, 0.0962677001953125, 0.10309982299804688, 0.10993194580078125, 0.11676406860351562, 0.12359619140625, 0.13042831420898438, 0.13726043701171875, 0.14409255981445312, 0.1509246826171875, 0.15775680541992188, 0.16458892822265625, 0.17142105102539062, 0.178253173828125, 0.18508529663085938, 0.19191741943359375, 0.19874954223632812, 0.2055816650390625, 0.21241378784179688, 0.21924591064453125, 0.22607803344726562, 0.23291015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 8.0, 20.0, 26.0, 28.0, 25.0, 56.0, 60.0, 115.0, 155.0, 268.0, 406.0, 775.0, 1342.0, 2730.0, 5849.0, 12466.0, 30154.0, 79552.0, 216208.0, 355643.0, 211531.0, 77946.0, 29171.0, 12283.0, 5586.0, 2757.0, 1402.0, 801.0, 429.0, 260.0, 141.0, 107.0, 77.0, 50.0, 30.0, 20.0, 13.0, 15.0, 12.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1015625, -0.09843635559082031, -0.09531021118164062, -0.09218406677246094, -0.08905792236328125, -0.08593177795410156, -0.08280563354492188, -0.07967948913574219, -0.0765533447265625, -0.07342720031738281, -0.07030105590820312, -0.06717491149902344, -0.06404876708984375, -0.06092262268066406, -0.057796478271484375, -0.05467033386230469, -0.051544189453125, -0.04841804504394531, -0.045291900634765625, -0.04216575622558594, -0.03903961181640625, -0.03591346740722656, -0.032787322998046875, -0.029661178588867188, -0.0265350341796875, -0.023408889770507812, -0.020282745361328125, -0.017156600952148438, -0.01403045654296875, -0.010904312133789062, -0.007778167724609375, -0.0046520233154296875, -0.00152587890625, 0.0016002655029296875, 0.004726409912109375, 0.007852554321289062, 0.01097869873046875, 0.014104843139648438, 0.017230987548828125, 0.020357131958007812, 0.0234832763671875, 0.026609420776367188, 0.029735565185546875, 0.03286170959472656, 0.03598785400390625, 0.03911399841308594, 0.042240142822265625, 0.04536628723144531, 0.048492431640625, 0.05161857604980469, 0.054744720458984375, 0.05787086486816406, 0.06099700927734375, 0.06412315368652344, 0.06724929809570312, 0.07037544250488281, 0.0735015869140625, 0.07662773132324219, 0.07975387573242188, 0.08288002014160156, 0.08600616455078125, 0.08913230895996094, 0.09225845336914062, 0.09538459777832031, 0.0985107421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 3.0, 8.0, 9.0, 11.0, 16.0, 28.0, 14.0, 18.0, 28.0, 34.0, 40.0, 40.0, 38.0, 23.0, 50.0, 48.0, 52.0, 53.0, 59.0, 46.0, 40.0, 57.0, 34.0, 33.0, 29.0, 32.0, 21.0, 18.0, 16.0, 12.0, 24.0, 13.0, 8.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5275039672851562, -0.5095977783203125, -0.49169158935546875, -0.473785400390625, -0.45587921142578125, -0.4379730224609375, -0.42006683349609375, -0.40216064453125, -0.38425445556640625, -0.3663482666015625, -0.34844207763671875, -0.330535888671875, -0.31262969970703125, -0.2947235107421875, -0.27681732177734375, -0.2589111328125, -0.24100494384765625, -0.2230987548828125, -0.20519256591796875, -0.187286376953125, -0.16938018798828125, -0.1514739990234375, -0.13356781005859375, -0.11566162109375, -0.09775543212890625, -0.0798492431640625, -0.06194305419921875, -0.044036865234375, -0.02613067626953125, -0.0082244873046875, 0.00968170166015625, 0.027587890625, 0.04549407958984375, 0.0634002685546875, 0.08130645751953125, 0.099212646484375, 0.11711883544921875, 0.1350250244140625, 0.15293121337890625, 0.17083740234375, 0.18874359130859375, 0.2066497802734375, 0.22455596923828125, 0.242462158203125, 0.26036834716796875, 0.2782745361328125, 0.29618072509765625, 0.3140869140625, 0.33199310302734375, 0.3498992919921875, 0.36780548095703125, 0.385711669921875, 0.40361785888671875, 0.4215240478515625, 0.43943023681640625, 0.45733642578125, 0.47524261474609375, 0.4931488037109375, 0.5110549926757812, 0.528961181640625, 0.5468673706054688, 0.5647735595703125, 0.5826797485351562, 0.6005859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 8.0, 15.0, 6.0, 13.0, 17.0, 28.0, 30.0, 37.0, 65.0, 114.0, 159.0, 180.0, 375.0, 550.0, 982.0, 1775.0, 3652.0, 9281.0, 29488.0, 156831.0, 623994.0, 171420.0, 31514.0, 9730.0, 3880.0, 1880.0, 945.0, 541.0, 363.0, 210.0, 142.0, 77.0, 75.0, 54.0, 39.0, 29.0, 11.0, 13.0, 5.0, 12.0, 4.0, 9.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0927734375, -0.09008598327636719, -0.08739852905273438, -0.08471107482910156, -0.08202362060546875, -0.07933616638183594, -0.07664871215820312, -0.07396125793457031, -0.0712738037109375, -0.06858634948730469, -0.06589889526367188, -0.06321144104003906, -0.06052398681640625, -0.05783653259277344, -0.055149078369140625, -0.05246162414550781, -0.049774169921875, -0.04708671569824219, -0.044399261474609375, -0.04171180725097656, -0.03902435302734375, -0.03633689880371094, -0.033649444580078125, -0.030961990356445312, -0.0282745361328125, -0.025587081909179688, -0.022899627685546875, -0.020212173461914062, -0.01752471923828125, -0.014837265014648438, -0.012149810791015625, -0.009462356567382812, -0.00677490234375, -0.0040874481201171875, -0.001399993896484375, 0.0012874603271484375, 0.00397491455078125, 0.0066623687744140625, 0.009349822998046875, 0.012037277221679688, 0.0147247314453125, 0.017412185668945312, 0.020099639892578125, 0.022787094116210938, 0.02547454833984375, 0.028162002563476562, 0.030849456787109375, 0.03353691101074219, 0.036224365234375, 0.03891181945800781, 0.041599273681640625, 0.04428672790527344, 0.04697418212890625, 0.04966163635253906, 0.052349090576171875, 0.05503654479980469, 0.0577239990234375, 0.06041145324707031, 0.06309890747070312, 0.06578636169433594, 0.06847381591796875, 0.07116127014160156, 0.07384872436523438, 0.07653617858886719, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 15.0, 20.0, 35.0, 42.0, 90.0, 127.0, 161.0, 147.0, 92.0, 90.0, 48.0, 42.0, 23.0, 12.0, 11.0, 6.0, 5.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30805778503418e-05, -3.2009556889533997e-05, -3.0938535928726196e-05, -2.9867514967918396e-05, -2.8796494007110596e-05, -2.7725473046302795e-05, -2.6654452085494995e-05, -2.5583431124687195e-05, -2.4512410163879395e-05, -2.3441389203071594e-05, -2.2370368242263794e-05, -2.1299347281455994e-05, -2.0228326320648193e-05, -1.9157305359840393e-05, -1.8086284399032593e-05, -1.7015263438224792e-05, -1.5944242477416992e-05, -1.4873221516609192e-05, -1.3802200555801392e-05, -1.2731179594993591e-05, -1.1660158634185791e-05, -1.058913767337799e-05, -9.51811671257019e-06, -8.44709575176239e-06, -7.37607479095459e-06, -6.3050538301467896e-06, -5.234032869338989e-06, -4.163011908531189e-06, -3.0919909477233887e-06, -2.0209699869155884e-06, -9.499490261077881e-07, 1.210719347000122e-07, 1.1920928955078125e-06, 2.263113856315613e-06, 3.334134817123413e-06, 4.405155777931213e-06, 5.476176738739014e-06, 6.547197699546814e-06, 7.618218660354614e-06, 8.689239621162415e-06, 9.760260581970215e-06, 1.0831281542778015e-05, 1.1902302503585815e-05, 1.2973323464393616e-05, 1.4044344425201416e-05, 1.5115365386009216e-05, 1.6186386346817017e-05, 1.7257407307624817e-05, 1.8328428268432617e-05, 1.9399449229240417e-05, 2.0470470190048218e-05, 2.1541491150856018e-05, 2.261251211166382e-05, 2.368353307247162e-05, 2.475455403327942e-05, 2.582557499408722e-05, 2.689659595489502e-05, 2.796761691570282e-05, 2.903863787651062e-05, 3.010965883731842e-05, 3.118067979812622e-05, 3.225170075893402e-05, 3.332272171974182e-05, 3.439374268054962e-05, 3.546476364135742e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 10.0, 11.0, 16.0, 20.0, 36.0, 42.0, 85.0, 194.0, 506.0, 1609.0, 6078.0, 34298.0, 459830.0, 499920.0, 36912.0, 6448.0, 1563.0, 523.0, 192.0, 82.0, 49.0, 40.0, 24.0, 14.0, 15.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.184326171875, -0.17947769165039062, -0.17462921142578125, -0.16978073120117188, -0.1649322509765625, -0.16008377075195312, -0.15523529052734375, -0.15038681030273438, -0.145538330078125, -0.14068984985351562, -0.13584136962890625, -0.13099288940429688, -0.1261444091796875, -0.12129592895507812, -0.11644744873046875, -0.11159896850585938, -0.10675048828125, -0.10190200805664062, -0.09705352783203125, -0.09220504760742188, -0.0873565673828125, -0.08250808715820312, -0.07765960693359375, -0.07281112670898438, -0.067962646484375, -0.06311416625976562, -0.05826568603515625, -0.053417205810546875, -0.0485687255859375, -0.043720245361328125, -0.03887176513671875, -0.034023284912109375, -0.0291748046875, -0.024326324462890625, -0.01947784423828125, -0.014629364013671875, -0.0097808837890625, -0.004932403564453125, -8.392333984375e-05, 0.004764556884765625, 0.009613037109375, 0.014461517333984375, 0.01930999755859375, 0.024158477783203125, 0.0290069580078125, 0.033855438232421875, 0.03870391845703125, 0.043552398681640625, 0.04840087890625, 0.053249359130859375, 0.05809783935546875, 0.06294631958007812, 0.0677947998046875, 0.07264328002929688, 0.07749176025390625, 0.08234024047851562, 0.087188720703125, 0.09203720092773438, 0.09688568115234375, 0.10173416137695312, 0.1065826416015625, 0.11143112182617188, 0.11627960205078125, 0.12112808227539062, 0.1259765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 9.0, 4.0, 10.0, 18.0, 18.0, 28.0, 58.0, 86.0, 138.0, 168.0, 140.0, 104.0, 68.0, 41.0, 22.0, 19.0, 12.0, 7.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.027985811233520508, -0.026934146881103516, -0.025882482528686523, -0.02483081817626953, -0.02377915382385254, -0.022727489471435547, -0.021675825119018555, -0.020624160766601562, -0.01957249641418457, -0.018520832061767578, -0.017469167709350586, -0.016417503356933594, -0.015365839004516602, -0.01431417465209961, -0.013262510299682617, -0.012210845947265625, -0.011159181594848633, -0.01010751724243164, -0.009055852890014648, -0.008004188537597656, -0.006952524185180664, -0.005900859832763672, -0.00484919548034668, -0.0037975311279296875, -0.0027458667755126953, -0.0016942024230957031, -0.0006425380706787109, 0.00040912628173828125, 0.0014607906341552734, 0.0025124549865722656, 0.003564119338989258, 0.00461578369140625, 0.005667448043823242, 0.006719112396240234, 0.0077707767486572266, 0.008822441101074219, 0.009874105453491211, 0.010925769805908203, 0.011977434158325195, 0.013029098510742188, 0.01408076286315918, 0.015132427215576172, 0.016184091567993164, 0.017235755920410156, 0.01828742027282715, 0.01933908462524414, 0.020390748977661133, 0.021442413330078125, 0.022494077682495117, 0.02354574203491211, 0.0245974063873291, 0.025649070739746094, 0.026700735092163086, 0.027752399444580078, 0.02880406379699707, 0.029855728149414062, 0.030907392501831055, 0.03195905685424805, 0.03301072120666504, 0.03406238555908203, 0.03511404991149902, 0.036165714263916016, 0.03721737861633301, 0.03826904296875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 7.0, 8.0, 9.0, 19.0, 22.0, 36.0, 39.0, 54.0, 60.0, 68.0, 78.0, 70.0, 70.0, 68.0, 68.0, 53.0, 58.0, 44.0, 51.0, 23.0, 23.0, 19.0, 17.0, 12.0, 7.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2091989815235138, -0.1999453753232956, -0.1906917542219162, -0.181438148021698, -0.1721845418214798, -0.1629309356212616, -0.1536773145198822, -0.144423708319664, -0.1351701021194458, -0.1259164959192276, -0.1166628822684288, -0.10740926861763, -0.0981556624174118, -0.088902048766613, -0.07964843511581421, -0.07039482891559601, -0.061141207814216614, -0.051887597888708115, -0.042633987963199615, -0.03338037431240082, -0.02412676438689232, -0.01487315446138382, -0.005619540810585022, 0.0036340653896331787, 0.012887679040431976, 0.022141288965940475, 0.031394898891448975, 0.04064851254224777, 0.04990212246775627, 0.05915573239326477, 0.06840934604406357, 0.07766295224428177, 0.08691656589508057, 0.09617017954587936, 0.10542378574609756, 0.11467739939689636, 0.12393100559711456, 0.13318461179733276, 0.14243823289871216, 0.15169183909893036, 0.16094544529914856, 0.17019905149936676, 0.17945267260074615, 0.18870627880096436, 0.19795988500118256, 0.20721349120140076, 0.21646711230278015, 0.22572071850299835, 0.23497433960437775, 0.24422794580459595, 0.25348156690597534, 0.26273518800735474, 0.27198877930641174, 0.28124240040779114, 0.29049599170684814, 0.29974961280822754, 0.30900323390960693, 0.31825685501098633, 0.32751044631004333, 0.33676406741142273, 0.3460176885128021, 0.35527127981185913, 0.3645249009132385, 0.3737785220146179, 0.3830321133136749]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 9.0, 7.0, 7.0, 6.0, 13.0, 10.0, 12.0, 18.0, 10.0, 26.0, 25.0, 22.0, 17.0, 40.0, 35.0, 32.0, 38.0, 39.0, 41.0, 39.0, 34.0, 54.0, 41.0, 44.0, 33.0, 31.0, 35.0, 30.0, 21.0, 32.0, 27.0, 35.0, 15.0, 17.0, 16.0, 19.0, 10.0, 10.0, 15.0, 9.0, 6.0, 6.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1825002282857895, -0.1760682761669159, -0.1696363389492035, -0.1632043868303299, -0.1567724347114563, -0.1503404974937439, -0.1439085453748703, -0.1374765932559967, -0.1310446560382843, -0.1246127113699913, -0.1181807592511177, -0.11174881458282471, -0.10531686991453171, -0.09888492524623871, -0.09245297312736511, -0.08602102845907211, -0.07958907634019852, -0.07315713167190552, -0.06672517955303192, -0.06029323488473892, -0.05386129021644592, -0.047429341822862625, -0.04099739342927933, -0.03456544876098633, -0.02813350036740303, -0.021701553836464882, -0.015269606374204159, -0.008837658911943436, -0.002405712381005287, 0.004026234149932861, 0.010458182543516159, 0.01689012721180916, 0.023322075605392456, 0.029754022136330605, 0.03618596866726875, 0.04261791706085205, 0.04904986172914505, 0.05548181012272835, 0.061913758516311646, 0.06834570318460464, 0.07477764785289764, 0.08120959252119064, 0.08764154464006424, 0.09407348930835724, 0.10050543397665024, 0.10693737864494324, 0.11336933076381683, 0.11980127543210983, 0.12623322010040283, 0.13266517221927643, 0.13909710943698883, 0.14552906155586243, 0.15196101367473602, 0.15839295089244843, 0.16482490301132202, 0.17125684022903442, 0.1776888072490692, 0.1841207593679428, 0.1905526965856552, 0.1969846487045288, 0.2034166008234024, 0.2098485380411148, 0.2162804901599884, 0.2227124273777008, 0.2291443794965744]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 10.0, 6.0, 12.0, 11.0, 16.0, 25.0, 42.0, 60.0, 80.0, 135.0, 208.0, 352.0, 491.0, 844.0, 1464.0, 2724.0, 5000.0, 10060.0, 22187.0, 54963.0, 152554.0, 359600.0, 269994.0, 98953.0, 36603.0, 15651.0, 7424.0, 3900.0, 2083.0, 1182.0, 694.0, 431.0, 279.0, 189.0, 95.0, 82.0, 52.0, 28.0, 25.0, 16.0, 10.0, 3.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.2556915283203125, -0.246490478515625, -0.2372894287109375, -0.22808837890625, -0.2188873291015625, -0.209686279296875, -0.2004852294921875, -0.1912841796875, -0.1820831298828125, -0.172882080078125, -0.1636810302734375, -0.15447998046875, -0.1452789306640625, -0.136077880859375, -0.1268768310546875, -0.11767578125, -0.1084747314453125, -0.099273681640625, -0.0900726318359375, -0.08087158203125, -0.0716705322265625, -0.062469482421875, -0.0532684326171875, -0.0440673828125, -0.0348663330078125, -0.025665283203125, -0.0164642333984375, -0.00726318359375, 0.0019378662109375, 0.011138916015625, 0.0203399658203125, 0.029541015625, 0.0387420654296875, 0.047943115234375, 0.0571441650390625, 0.06634521484375, 0.0755462646484375, 0.084747314453125, 0.0939483642578125, 0.1031494140625, 0.1123504638671875, 0.121551513671875, 0.1307525634765625, 0.13995361328125, 0.1491546630859375, 0.158355712890625, 0.1675567626953125, 0.1767578125, 0.1859588623046875, 0.195159912109375, 0.2043609619140625, 0.21356201171875, 0.2227630615234375, 0.231964111328125, 0.2411651611328125, 0.2503662109375, 0.2595672607421875, 0.268768310546875, 0.2779693603515625, 0.28717041015625, 0.2963714599609375, 0.305572509765625, 0.3147735595703125, 0.323974609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 6.0, 13.0, 19.0, 9.0, 12.0, 15.0, 16.0, 23.0, 31.0, 25.0, 29.0, 36.0, 35.0, 26.0, 34.0, 34.0, 37.0, 37.0, 51.0, 40.0, 40.0, 38.0, 26.0, 31.0, 39.0, 28.0, 27.0, 31.0, 26.0, 22.0, 19.0, 16.0, 12.0, 11.0, 8.0, 13.0, 9.0, 6.0, 14.0, 6.0, 5.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.40283203125, -0.39075469970703125, -0.3786773681640625, -0.36660003662109375, -0.354522705078125, -0.34244537353515625, -0.3303680419921875, -0.31829071044921875, -0.30621337890625, -0.29413604736328125, -0.2820587158203125, -0.26998138427734375, -0.257904052734375, -0.24582672119140625, -0.2337493896484375, -0.22167205810546875, -0.2095947265625, -0.19751739501953125, -0.1854400634765625, -0.17336273193359375, -0.161285400390625, -0.14920806884765625, -0.1371307373046875, -0.12505340576171875, -0.11297607421875, -0.10089874267578125, -0.0888214111328125, -0.07674407958984375, -0.064666748046875, -0.05258941650390625, -0.0405120849609375, -0.02843475341796875, -0.016357421875, -0.00428009033203125, 0.0077972412109375, 0.01987457275390625, 0.031951904296875, 0.04402923583984375, 0.0561065673828125, 0.06818389892578125, 0.08026123046875, 0.09233856201171875, 0.1044158935546875, 0.11649322509765625, 0.128570556640625, 0.14064788818359375, 0.1527252197265625, 0.16480255126953125, 0.1768798828125, 0.18895721435546875, 0.2010345458984375, 0.21311187744140625, 0.225189208984375, 0.23726654052734375, 0.2493438720703125, 0.26142120361328125, 0.27349853515625, 0.28557586669921875, 0.2976531982421875, 0.30973052978515625, 0.321807861328125, 0.33388519287109375, 0.3459625244140625, 0.35803985595703125, 0.3701171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 5.0, 4.0, 12.0, 13.0, 14.0, 31.0, 33.0, 60.0, 94.0, 138.0, 229.0, 433.0, 946.0, 2478.0, 8420.0, 42694.0, 307530.0, 574785.0, 88875.0, 15177.0, 3907.0, 1324.0, 534.0, 302.0, 174.0, 108.0, 74.0, 33.0, 24.0, 24.0, 16.0, 11.0, 10.0, 9.0, 10.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57568359375, -0.5566177368164062, -0.5375518798828125, -0.5184860229492188, -0.499420166015625, -0.48035430908203125, -0.4612884521484375, -0.44222259521484375, -0.42315673828125, -0.40409088134765625, -0.3850250244140625, -0.36595916748046875, -0.346893310546875, -0.32782745361328125, -0.3087615966796875, -0.28969573974609375, -0.2706298828125, -0.25156402587890625, -0.2324981689453125, -0.21343231201171875, -0.194366455078125, -0.17530059814453125, -0.1562347412109375, -0.13716888427734375, -0.11810302734375, -0.09903717041015625, -0.0799713134765625, -0.06090545654296875, -0.041839599609375, -0.02277374267578125, -0.0037078857421875, 0.01535797119140625, 0.034423828125, 0.05348968505859375, 0.0725555419921875, 0.09162139892578125, 0.110687255859375, 0.12975311279296875, 0.1488189697265625, 0.16788482666015625, 0.18695068359375, 0.20601654052734375, 0.2250823974609375, 0.24414825439453125, 0.263214111328125, 0.28227996826171875, 0.3013458251953125, 0.32041168212890625, 0.3394775390625, 0.35854339599609375, 0.3776092529296875, 0.39667510986328125, 0.415740966796875, 0.43480682373046875, 0.4538726806640625, 0.47293853759765625, 0.49200439453125, 0.5110702514648438, 0.5301361083984375, 0.5492019653320312, 0.568267822265625, 0.5873336791992188, 0.6063995361328125, 0.6254653930664062, 0.64453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 5.0, 14.0, 14.0, 18.0, 20.0, 19.0, 31.0, 41.0, 49.0, 43.0, 51.0, 53.0, 60.0, 65.0, 53.0, 59.0, 61.0, 50.0, 46.0, 41.0, 45.0, 31.0, 26.0, 17.0, 23.0, 10.0, 18.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7213668823242188, -0.6990814208984375, -0.6767959594726562, -0.654510498046875, -0.6322250366210938, -0.6099395751953125, -0.5876541137695312, -0.56536865234375, -0.5430831909179688, -0.5207977294921875, -0.49851226806640625, -0.476226806640625, -0.45394134521484375, -0.4316558837890625, -0.40937042236328125, -0.3870849609375, -0.36479949951171875, -0.3425140380859375, -0.32022857666015625, -0.297943115234375, -0.27565765380859375, -0.2533721923828125, -0.23108673095703125, -0.20880126953125, -0.18651580810546875, -0.1642303466796875, -0.14194488525390625, -0.119659423828125, -0.09737396240234375, -0.0750885009765625, -0.05280303955078125, -0.030517578125, -0.00823211669921875, 0.0140533447265625, 0.03633880615234375, 0.058624267578125, 0.08090972900390625, 0.1031951904296875, 0.12548065185546875, 0.14776611328125, 0.17005157470703125, 0.1923370361328125, 0.21462249755859375, 0.236907958984375, 0.25919342041015625, 0.2814788818359375, 0.30376434326171875, 0.3260498046875, 0.34833526611328125, 0.3706207275390625, 0.39290618896484375, 0.415191650390625, 0.43747711181640625, 0.4597625732421875, 0.48204803466796875, 0.50433349609375, 0.5266189575195312, 0.5489044189453125, 0.5711898803710938, 0.593475341796875, 0.6157608032226562, 0.6380462646484375, 0.6603317260742188, 0.6826171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 7.0, 17.0, 21.0, 33.0, 63.0, 93.0, 131.0, 239.0, 542.0, 1315.0, 4337.0, 17733.0, 103942.0, 580603.0, 282580.0, 44040.0, 8724.0, 2414.0, 852.0, 334.0, 180.0, 115.0, 68.0, 35.0, 36.0, 19.0, 14.0, 4.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.141357421875, -0.13690757751464844, -0.13245773315429688, -0.1280078887939453, -0.12355804443359375, -0.11910820007324219, -0.11465835571289062, -0.11020851135253906, -0.1057586669921875, -0.10130882263183594, -0.09685897827148438, -0.09240913391113281, -0.08795928955078125, -0.08350944519042969, -0.07905960083007812, -0.07460975646972656, -0.070159912109375, -0.06571006774902344, -0.061260223388671875, -0.05681037902832031, -0.05236053466796875, -0.04791069030761719, -0.043460845947265625, -0.03901100158691406, -0.0345611572265625, -0.030111312866210938, -0.025661468505859375, -0.021211624145507812, -0.01676177978515625, -0.012311935424804688, -0.007862091064453125, -0.0034122467041015625, 0.00103759765625, 0.0054874420166015625, 0.009937286376953125, 0.014387130737304688, 0.01883697509765625, 0.023286819458007812, 0.027736663818359375, 0.03218650817871094, 0.0366363525390625, 0.04108619689941406, 0.045536041259765625, 0.04998588562011719, 0.05443572998046875, 0.05888557434082031, 0.06333541870117188, 0.06778526306152344, 0.072235107421875, 0.07668495178222656, 0.08113479614257812, 0.08558464050292969, 0.09003448486328125, 0.09448432922363281, 0.09893417358398438, 0.10338401794433594, 0.1078338623046875, 0.11228370666503906, 0.11673355102539062, 0.12118339538574219, 0.12563323974609375, 0.1300830841064453, 0.13453292846679688, 0.13898277282714844, 0.1434326171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 9.0, 7.0, 6.0, 11.0, 9.0, 16.0, 26.0, 39.0, 57.0, 70.0, 86.0, 119.0, 147.0, 99.0, 76.0, 53.0, 42.0, 33.0, 28.0, 9.0, 20.0, 16.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.8192996978759766e-05, -2.7475878596305847e-05, -2.675876021385193e-05, -2.604164183139801e-05, -2.5324523448944092e-05, -2.4607405066490173e-05, -2.3890286684036255e-05, -2.3173168301582336e-05, -2.2456049919128418e-05, -2.17389315366745e-05, -2.102181315422058e-05, -2.0304694771766663e-05, -1.9587576389312744e-05, -1.8870458006858826e-05, -1.8153339624404907e-05, -1.743622124195099e-05, -1.671910285949707e-05, -1.6001984477043152e-05, -1.5284866094589233e-05, -1.4567747712135315e-05, -1.3850629329681396e-05, -1.3133510947227478e-05, -1.241639256477356e-05, -1.1699274182319641e-05, -1.0982155799865723e-05, -1.0265037417411804e-05, -9.547919034957886e-06, -8.830800652503967e-06, -8.113682270050049e-06, -7.39656388759613e-06, -6.679445505142212e-06, -5.9623271226882935e-06, -5.245208740234375e-06, -4.5280903577804565e-06, -3.810971975326538e-06, -3.0938535928726196e-06, -2.376735210418701e-06, -1.6596168279647827e-06, -9.424984455108643e-07, -2.253800630569458e-07, 4.917383193969727e-07, 1.2088567018508911e-06, 1.9259750843048096e-06, 2.643093466758728e-06, 3.3602118492126465e-06, 4.077330231666565e-06, 4.794448614120483e-06, 5.511566996574402e-06, 6.22868537902832e-06, 6.945803761482239e-06, 7.662922143936157e-06, 8.380040526390076e-06, 9.097158908843994e-06, 9.814277291297913e-06, 1.0531395673751831e-05, 1.124851405620575e-05, 1.1965632438659668e-05, 1.2682750821113586e-05, 1.3399869203567505e-05, 1.4116987586021423e-05, 1.4834105968475342e-05, 1.555122435092926e-05, 1.626834273338318e-05, 1.6985461115837097e-05, 1.7702579498291016e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 4.0, 5.0, 8.0, 18.0, 27.0, 43.0, 87.0, 146.0, 237.0, 539.0, 1152.0, 2722.0, 7182.0, 28664.0, 198722.0, 636199.0, 140542.0, 21963.0, 5937.0, 2251.0, 983.0, 477.0, 254.0, 152.0, 82.0, 42.0, 30.0, 18.0, 9.0, 8.0, 7.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1639404296875, -0.15855026245117188, -0.15316009521484375, -0.14776992797851562, -0.1423797607421875, -0.13698959350585938, -0.13159942626953125, -0.12620925903320312, -0.120819091796875, -0.11542892456054688, -0.11003875732421875, -0.10464859008789062, -0.0992584228515625, -0.09386825561523438, -0.08847808837890625, -0.08308792114257812, -0.07769775390625, -0.07230758666992188, -0.06691741943359375, -0.061527252197265625, -0.0561370849609375, -0.050746917724609375, -0.04535675048828125, -0.039966583251953125, -0.034576416015625, -0.029186248779296875, -0.02379608154296875, -0.018405914306640625, -0.0130157470703125, -0.007625579833984375, -0.00223541259765625, 0.003154754638671875, 0.008544921875, 0.013935089111328125, 0.01932525634765625, 0.024715423583984375, 0.0301055908203125, 0.035495758056640625, 0.04088592529296875, 0.046276092529296875, 0.051666259765625, 0.057056427001953125, 0.06244659423828125, 0.06783676147460938, 0.0732269287109375, 0.07861709594726562, 0.08400726318359375, 0.08939743041992188, 0.09478759765625, 0.10017776489257812, 0.10556793212890625, 0.11095809936523438, 0.1163482666015625, 0.12173843383789062, 0.12712860107421875, 0.13251876831054688, 0.137908935546875, 0.14329910278320312, 0.14868927001953125, 0.15407943725585938, 0.1594696044921875, 0.16485977172851562, 0.17024993896484375, 0.17564010620117188, 0.1810302734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 12.0, 19.0, 26.0, 20.0, 32.0, 35.0, 65.0, 76.0, 102.0, 113.0, 91.0, 77.0, 78.0, 73.0, 54.0, 20.0, 18.0, 13.0, 15.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07049560546875, -0.0681295394897461, -0.06576347351074219, -0.06339740753173828, -0.061031341552734375, -0.05866527557373047, -0.05629920959472656, -0.053933143615722656, -0.05156707763671875, -0.049201011657714844, -0.04683494567871094, -0.04446887969970703, -0.042102813720703125, -0.03973674774169922, -0.03737068176269531, -0.035004615783691406, -0.0326385498046875, -0.030272483825683594, -0.027906417846679688, -0.02554035186767578, -0.023174285888671875, -0.02080821990966797, -0.018442153930664062, -0.016076087951660156, -0.01371002197265625, -0.011343955993652344, -0.008977890014648438, -0.006611824035644531, -0.004245758056640625, -0.0018796920776367188, 0.0004863739013671875, 0.0028524398803710938, 0.005218505859375, 0.007584571838378906, 0.009950637817382812, 0.012316703796386719, 0.014682769775390625, 0.01704883575439453, 0.019414901733398438, 0.021780967712402344, 0.02414703369140625, 0.026513099670410156, 0.028879165649414062, 0.03124523162841797, 0.033611297607421875, 0.03597736358642578, 0.03834342956542969, 0.040709495544433594, 0.0430755615234375, 0.045441627502441406, 0.04780769348144531, 0.05017375946044922, 0.052539825439453125, 0.05490589141845703, 0.05727195739746094, 0.059638023376464844, 0.06200408935546875, 0.06437015533447266, 0.06673622131347656, 0.06910228729248047, 0.07146835327148438, 0.07383441925048828, 0.07620048522949219, 0.0785665512084961, 0.0809326171875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 28.0, 98.0, 281.0, 298.0, 194.0, 81.0, 19.0, 5.0, 1.0, 2.0], "bins": [-5.024223804473877, -4.936633586883545, -4.849043369293213, -4.761453628540039, -4.673863410949707, -4.586273193359375, -4.498682975769043, -4.411092758178711, -4.323502540588379, -4.235912322998047, -4.148322105407715, -4.060732364654541, -3.973142147064209, -3.885551929473877, -3.797961711883545, -3.710371494293213, -3.622781753540039, -3.535191535949707, -3.447601556777954, -3.360011339187622, -3.272421360015869, -3.184831142425537, -3.097240924835205, -3.009650707244873, -2.92206072807312, -2.834470510482788, -2.746880531311035, -2.659290313720703, -2.571700096130371, -2.484110116958618, -2.396519899368286, -2.308929920196533, -2.2213399410247803, -2.1337497234344482, -2.0461597442626953, -1.9585695266723633, -1.8709794282913208, -1.7833893299102783, -1.6957991123199463, -1.6082090139389038, -1.5206189155578613, -1.4330288171768188, -1.3454387187957764, -1.2578485012054443, -1.1702584028244019, -1.0826683044433594, -0.9950781464576721, -0.9074879884719849, -0.8198978304862976, -0.7323076725006104, -0.6447175741195679, -0.5571274757385254, -0.46953731775283813, -0.38194718956947327, -0.2943570613861084, -0.20676690340042114, -0.11917680501937866, -0.031586676836013794, 0.056003451347351074, 0.14359357953071594, 0.2311837077140808, 0.3187738358974457, 0.40636396408081055, 0.4939541220664978, 0.5815442204475403]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 5.0, 6.0, 10.0, 9.0, 15.0, 13.0, 20.0, 25.0, 19.0, 24.0, 22.0, 32.0, 38.0, 40.0, 42.0, 31.0, 39.0, 43.0, 29.0, 36.0, 43.0, 41.0, 43.0, 44.0, 36.0, 28.0, 27.0, 27.0, 30.0, 22.0, 21.0, 19.0, 20.0, 9.0, 14.0, 12.0, 11.0, 11.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.8491976261138916, -0.8248525261878967, -0.8005074858665466, -0.7761623859405518, -0.7518173456192017, -0.7274722456932068, -0.7031271457672119, -0.6787821054458618, -0.6544370055198669, -0.6300919055938721, -0.605746865272522, -0.5814017653465271, -0.5570566654205322, -0.5327116250991821, -0.5083665251731873, -0.48402145504951477, -0.4596763849258423, -0.4353313148021698, -0.4109862446784973, -0.38664114475250244, -0.36229607462882996, -0.33795100450515747, -0.3136059045791626, -0.2892608344554901, -0.2649157643318176, -0.24057069420814514, -0.21622560918331146, -0.19188052415847778, -0.1675354540348053, -0.1431903839111328, -0.11884529888629913, -0.09450021386146545, -0.07015514373779297, -0.045810066163539886, -0.021464988589286804, 0.002880088984966278, 0.02722516655921936, 0.05157024413347244, 0.07591532170772552, 0.1002604067325592, 0.12460547685623169, 0.14895054697990417, 0.17329563200473785, 0.19764071702957153, 0.22198578715324402, 0.2463308572769165, 0.2706759572029114, 0.29502102732658386, 0.31936609745025635, 0.34371116757392883, 0.3680562376976013, 0.3924013376235962, 0.4167464077472687, 0.44109147787094116, 0.46543657779693604, 0.4897816479206085, 0.514126718044281, 0.5384718179702759, 0.562816858291626, 0.5871619582176208, 0.6115070581436157, 0.6358520984649658, 0.6601971983909607, 0.6845422983169556, 0.7088873386383057]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 2.0, 5.0, 7.0, 12.0, 12.0, 13.0, 17.0, 25.0, 25.0, 65.0, 107.0, 121.0, 187.0, 344.0, 660.0, 1255.0, 2598.0, 6072.0, 16901.0, 67490.0, 492976.0, 2282197.0, 1140394.0, 138794.0, 27570.0, 8880.0, 3680.0, 1694.0, 903.0, 466.0, 263.0, 179.0, 102.0, 86.0, 42.0, 23.0, 22.0, 17.0, 23.0, 16.0, 9.0, 9.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.494384765625, -0.4797172546386719, -0.46504974365234375, -0.4503822326660156, -0.4357147216796875, -0.4210472106933594, -0.40637969970703125, -0.3917121887207031, -0.377044677734375, -0.3623771667480469, -0.34770965576171875, -0.3330421447753906, -0.3183746337890625, -0.3037071228027344, -0.28903961181640625, -0.2743721008300781, -0.25970458984375, -0.24503707885742188, -0.23036956787109375, -0.21570205688476562, -0.2010345458984375, -0.18636703491210938, -0.17169952392578125, -0.15703201293945312, -0.142364501953125, -0.12769699096679688, -0.11302947998046875, -0.09836196899414062, -0.0836944580078125, -0.06902694702148438, -0.05435943603515625, -0.039691925048828125, -0.0250244140625, -0.010356903076171875, 0.00431060791015625, 0.018978118896484375, 0.0336456298828125, 0.048313140869140625, 0.06298065185546875, 0.07764816284179688, 0.092315673828125, 0.10698318481445312, 0.12165069580078125, 0.13631820678710938, 0.1509857177734375, 0.16565322875976562, 0.18032073974609375, 0.19498825073242188, 0.20965576171875, 0.22432327270507812, 0.23899078369140625, 0.2536582946777344, 0.2683258056640625, 0.2829933166503906, 0.29766082763671875, 0.3123283386230469, 0.326995849609375, 0.3416633605957031, 0.35633087158203125, 0.3709983825683594, 0.3856658935546875, 0.4003334045410156, 0.41500091552734375, 0.4296684265136719, 0.4443359375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 12.0, 21.0, 13.0, 16.0, 19.0, 27.0, 24.0, 35.0, 36.0, 36.0, 49.0, 53.0, 60.0, 56.0, 52.0, 50.0, 48.0, 43.0, 60.0, 40.0, 33.0, 34.0, 27.0, 25.0, 24.0, 10.0, 20.0, 12.0, 13.0, 10.0, 5.0, 9.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.342529296875, -0.3329582214355469, -0.32338714599609375, -0.3138160705566406, -0.3042449951171875, -0.2946739196777344, -0.28510284423828125, -0.2755317687988281, -0.265960693359375, -0.2563896179199219, -0.24681854248046875, -0.23724746704101562, -0.2276763916015625, -0.21810531616210938, -0.20853424072265625, -0.19896316528320312, -0.18939208984375, -0.17982101440429688, -0.17024993896484375, -0.16067886352539062, -0.1511077880859375, -0.14153671264648438, -0.13196563720703125, -0.12239456176757812, -0.112823486328125, -0.10325241088867188, -0.09368133544921875, -0.08411026000976562, -0.0745391845703125, -0.06496810913085938, -0.05539703369140625, -0.045825958251953125, -0.0362548828125, -0.026683807373046875, -0.01711273193359375, -0.007541656494140625, 0.0020294189453125, 0.011600494384765625, 0.02117156982421875, 0.030742645263671875, 0.040313720703125, 0.049884796142578125, 0.05945587158203125, 0.06902694702148438, 0.0785980224609375, 0.08816909790039062, 0.09774017333984375, 0.10731124877929688, 0.11688232421875, 0.12645339965820312, 0.13602447509765625, 0.14559555053710938, 0.1551666259765625, 0.16473770141601562, 0.17430877685546875, 0.18387985229492188, 0.193450927734375, 0.20302200317382812, 0.21259307861328125, 0.22216415405273438, 0.2317352294921875, 0.24130630493164062, 0.25087738037109375, 0.2604484558105469, 0.27001953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 18.0, 22.0, 52.0, 96.0, 271.0, 1176.0, 12572.0, 3647603.0, 526038.0, 5319.0, 746.0, 178.0, 71.0, 38.0, 17.0, 16.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9462890625, -1.89044189453125, -1.8345947265625, -1.77874755859375, -1.722900390625, -1.66705322265625, -1.6112060546875, -1.55535888671875, -1.49951171875, -1.44366455078125, -1.3878173828125, -1.33197021484375, -1.276123046875, -1.22027587890625, -1.1644287109375, -1.10858154296875, -1.052734375, -0.99688720703125, -0.9410400390625, -0.88519287109375, -0.829345703125, -0.77349853515625, -0.7176513671875, -0.66180419921875, -0.60595703125, -0.55010986328125, -0.4942626953125, -0.43841552734375, -0.382568359375, -0.32672119140625, -0.2708740234375, -0.21502685546875, -0.1591796875, -0.10333251953125, -0.0474853515625, 0.00836181640625, 0.064208984375, 0.12005615234375, 0.1759033203125, 0.23175048828125, 0.28759765625, 0.34344482421875, 0.3992919921875, 0.45513916015625, 0.510986328125, 0.56683349609375, 0.6226806640625, 0.67852783203125, 0.734375, 0.79022216796875, 0.8460693359375, 0.90191650390625, 0.957763671875, 1.01361083984375, 1.0694580078125, 1.12530517578125, 1.18115234375, 1.23699951171875, 1.2928466796875, 1.34869384765625, 1.404541015625, 1.46038818359375, 1.5162353515625, 1.57208251953125, 1.6279296875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 14.0, 23.0, 21.0, 55.0, 80.0, 127.0, 195.0, 294.0, 411.0, 546.0, 609.0, 522.0, 415.0, 261.0, 176.0, 95.0, 75.0, 31.0, 27.0, 16.0, 13.0, 7.0, 8.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2119140625, -0.2059192657470703, -0.19992446899414062, -0.19392967224121094, -0.18793487548828125, -0.18194007873535156, -0.17594528198242188, -0.1699504852294922, -0.1639556884765625, -0.1579608917236328, -0.15196609497070312, -0.14597129821777344, -0.13997650146484375, -0.13398170471191406, -0.12798690795898438, -0.12199211120605469, -0.115997314453125, -0.11000251770019531, -0.10400772094726562, -0.09801292419433594, -0.09201812744140625, -0.08602333068847656, -0.08002853393554688, -0.07403373718261719, -0.0680389404296875, -0.06204414367675781, -0.056049346923828125, -0.05005455017089844, -0.04405975341796875, -0.03806495666503906, -0.032070159912109375, -0.026075363159179688, -0.02008056640625, -0.014085769653320312, -0.008090972900390625, -0.0020961761474609375, 0.00389862060546875, 0.009893417358398438, 0.015888214111328125, 0.021883010864257812, 0.0278778076171875, 0.03387260437011719, 0.039867401123046875, 0.04586219787597656, 0.05185699462890625, 0.05785179138183594, 0.06384658813476562, 0.06984138488769531, 0.075836181640625, 0.08183097839355469, 0.08782577514648438, 0.09382057189941406, 0.09981536865234375, 0.10581016540527344, 0.11180496215820312, 0.11779975891113281, 0.1237945556640625, 0.1297893524169922, 0.13578414916992188, 0.14177894592285156, 0.14777374267578125, 0.15376853942871094, 0.15976333618164062, 0.1657581329345703, 0.1717529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 6.0, 6.0, 17.0, 10.0, 22.0, 21.0, 33.0, 33.0, 35.0, 45.0, 46.0, 49.0, 45.0, 52.0, 55.0, 60.0, 43.0, 39.0, 48.0, 42.0, 42.0, 34.0, 36.0, 28.0, 23.0, 13.0, 26.0, 17.0, 12.0, 13.0, 8.0, 12.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34196892380714417, -0.3315484821796417, -0.3211280405521393, -0.31070759892463684, -0.3002871572971344, -0.28986674547195435, -0.2794463038444519, -0.26902586221694946, -0.258605420589447, -0.24818497896194458, -0.23776453733444214, -0.2273440957069397, -0.21692366898059845, -0.206503227353096, -0.19608278572559357, -0.18566235899925232, -0.17524190247058868, -0.16482146084308624, -0.1544010192155838, -0.14398059248924255, -0.1335601508617401, -0.12313970923423767, -0.11271926760673523, -0.10229883342981339, -0.09187839180231094, -0.0814579501748085, -0.07103751599788666, -0.060617074370384216, -0.05019663646817207, -0.03977619856595993, -0.02935575693845749, -0.018935322761535645, -0.008514881134033203, 0.0019055576995015144, 0.012325996533036232, 0.022746436297893524, 0.03316687420010567, 0.04358731210231781, 0.05400775372982025, 0.0644281879067421, 0.07484862953424454, 0.08526907116174698, 0.09568950533866882, 0.10610994696617126, 0.1165303885936737, 0.12695083022117615, 0.1373712718486786, 0.14779169857501984, 0.15821214020252228, 0.16863258183002472, 0.17905302345752716, 0.1894734501838684, 0.19989389181137085, 0.2103143334388733, 0.22073477506637573, 0.23115521669387817, 0.24157565832138062, 0.25199609994888306, 0.2624165415763855, 0.27283698320388794, 0.2832574248313904, 0.2936778664588928, 0.30409830808639526, 0.3145187199115753, 0.32493916153907776]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 14.0, 9.0, 6.0, 10.0, 15.0, 11.0, 21.0, 22.0, 20.0, 17.0, 23.0, 27.0, 23.0, 25.0, 36.0, 29.0, 29.0, 28.0, 41.0, 35.0, 48.0, 29.0, 38.0, 24.0, 45.0, 35.0, 27.0, 38.0, 38.0, 34.0, 26.0, 23.0, 29.0, 20.0, 11.0, 11.0, 10.0, 12.0, 11.0, 6.0, 8.0, 6.0, 6.0, 6.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.30970630049705505, -0.30074542760849, -0.2917845547199249, -0.2828236520290375, -0.2738627791404724, -0.26490190625190735, -0.2559410333633423, -0.24698016047477722, -0.23801927268505096, -0.2290583997964859, -0.22009751200675964, -0.21113663911819458, -0.20217576622962952, -0.19321487843990326, -0.1842540055513382, -0.17529311776161194, -0.16633224487304688, -0.1573713719844818, -0.14841048419475555, -0.1394496113061905, -0.13048872351646423, -0.12152785062789917, -0.1125669777393341, -0.10360609740018845, -0.09464521706104279, -0.08568433672189713, -0.07672345638275146, -0.0677625834941864, -0.05880170315504074, -0.04984082281589508, -0.04087994620203972, -0.03191906958818436, -0.022958189249038696, -0.013997310772538185, -0.005036432296037674, 0.003924446180462837, 0.012885324656963348, 0.02184620499610901, 0.03080708160996437, 0.03976795822381973, 0.04872883856296539, 0.05768971890211105, 0.06665059924125671, 0.07561147212982178, 0.08457235246896744, 0.0935332328081131, 0.10249410569667816, 0.11145498603582382, 0.12041586637496948, 0.12937673926353455, 0.1383376270532608, 0.14729849994182587, 0.15625938773155212, 0.1652202606201172, 0.17418113350868225, 0.18314200639724731, 0.19210289418697357, 0.20106376707553864, 0.2100246548652649, 0.21898552775382996, 0.22794640064239502, 0.23690728843212128, 0.24586816132068634, 0.2548290491104126, 0.26378992199897766]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 8.0, 10.0, 10.0, 11.0, 24.0, 15.0, 23.0, 43.0, 55.0, 71.0, 94.0, 134.0, 185.0, 331.0, 550.0, 1087.0, 2088.0, 4401.0, 11603.0, 50330.0, 405098.0, 485160.0, 63924.0, 13309.0, 4881.0, 2253.0, 1098.0, 636.0, 339.0, 241.0, 158.0, 101.0, 84.0, 52.0, 38.0, 29.0, 28.0, 13.0, 14.0, 9.0, 7.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.123046875, -0.11866188049316406, -0.11427688598632812, -0.10989189147949219, -0.10550689697265625, -0.10112190246582031, -0.09673690795898438, -0.09235191345214844, -0.0879669189453125, -0.08358192443847656, -0.07919692993164062, -0.07481193542480469, -0.07042694091796875, -0.06604194641113281, -0.061656951904296875, -0.05727195739746094, -0.052886962890625, -0.04850196838378906, -0.044116973876953125, -0.03973197937011719, -0.03534698486328125, -0.030961990356445312, -0.026576995849609375, -0.022192001342773438, -0.0178070068359375, -0.013422012329101562, -0.009037017822265625, -0.0046520233154296875, -0.00026702880859375, 0.0041179656982421875, 0.008502960205078125, 0.012887954711914062, 0.01727294921875, 0.021657943725585938, 0.026042938232421875, 0.030427932739257812, 0.03481292724609375, 0.03919792175292969, 0.043582916259765625, 0.04796791076660156, 0.0523529052734375, 0.05673789978027344, 0.061122894287109375, 0.06550788879394531, 0.06989288330078125, 0.07427787780761719, 0.07866287231445312, 0.08304786682128906, 0.087432861328125, 0.09181785583496094, 0.09620285034179688, 0.10058784484863281, 0.10497283935546875, 0.10935783386230469, 0.11374282836914062, 0.11812782287597656, 0.1225128173828125, 0.12689781188964844, 0.13128280639648438, 0.1356678009033203, 0.14005279541015625, 0.1444377899169922, 0.14882278442382812, 0.15320777893066406, 0.1575927734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 14.0, 15.0, 19.0, 12.0, 16.0, 18.0, 26.0, 26.0, 26.0, 36.0, 29.0, 34.0, 43.0, 36.0, 41.0, 38.0, 43.0, 43.0, 47.0, 49.0, 42.0, 54.0, 30.0, 40.0, 22.0, 39.0, 32.0, 20.0, 15.0, 15.0, 12.0, 9.0, 9.0, 10.0, 4.0, 12.0, 4.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2392578125, -0.23257064819335938, -0.22588348388671875, -0.21919631958007812, -0.2125091552734375, -0.20582199096679688, -0.19913482666015625, -0.19244766235351562, -0.185760498046875, -0.17907333374023438, -0.17238616943359375, -0.16569900512695312, -0.1590118408203125, -0.15232467651367188, -0.14563751220703125, -0.13895034790039062, -0.13226318359375, -0.12557601928710938, -0.11888885498046875, -0.11220169067382812, -0.1055145263671875, -0.09882736206054688, -0.09214019775390625, -0.08545303344726562, -0.078765869140625, -0.07207870483398438, -0.06539154052734375, -0.058704376220703125, -0.0520172119140625, -0.045330047607421875, -0.03864288330078125, -0.031955718994140625, -0.0252685546875, -0.018581390380859375, -0.01189422607421875, -0.005207061767578125, 0.0014801025390625, 0.008167266845703125, 0.01485443115234375, 0.021541595458984375, 0.028228759765625, 0.034915924072265625, 0.04160308837890625, 0.048290252685546875, 0.0549774169921875, 0.061664581298828125, 0.06835174560546875, 0.07503890991210938, 0.08172607421875, 0.08841323852539062, 0.09510040283203125, 0.10178756713867188, 0.1084747314453125, 0.11516189575195312, 0.12184906005859375, 0.12853622436523438, 0.135223388671875, 0.14191055297851562, 0.14859771728515625, 0.15528488159179688, 0.1619720458984375, 0.16865921020507812, 0.17534637451171875, 0.18203353881835938, 0.188720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 12.0, 5.0, 5.0, 18.0, 23.0, 17.0, 29.0, 54.0, 75.0, 132.0, 207.0, 323.0, 524.0, 989.0, 1840.0, 3555.0, 7768.0, 20706.0, 70426.0, 266129.0, 435475.0, 168603.0, 44408.0, 14652.0, 6033.0, 2919.0, 1476.0, 878.0, 456.0, 279.0, 182.0, 108.0, 68.0, 44.0, 27.0, 19.0, 14.0, 23.0, 15.0, 3.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.083984375, -0.08130264282226562, -0.07862091064453125, -0.07593917846679688, -0.0732574462890625, -0.07057571411132812, -0.06789398193359375, -0.06521224975585938, -0.062530517578125, -0.059848785400390625, -0.05716705322265625, -0.054485321044921875, -0.0518035888671875, -0.049121856689453125, -0.04644012451171875, -0.043758392333984375, -0.04107666015625, -0.038394927978515625, -0.03571319580078125, -0.033031463623046875, -0.0303497314453125, -0.027667999267578125, -0.02498626708984375, -0.022304534912109375, -0.019622802734375, -0.016941070556640625, -0.01425933837890625, -0.011577606201171875, -0.0088958740234375, -0.006214141845703125, -0.00353240966796875, -0.000850677490234375, 0.0018310546875, 0.004512786865234375, 0.00719451904296875, 0.009876251220703125, 0.0125579833984375, 0.015239715576171875, 0.01792144775390625, 0.020603179931640625, 0.023284912109375, 0.025966644287109375, 0.02864837646484375, 0.031330108642578125, 0.0340118408203125, 0.036693572998046875, 0.03937530517578125, 0.042057037353515625, 0.04473876953125, 0.047420501708984375, 0.05010223388671875, 0.052783966064453125, 0.0554656982421875, 0.058147430419921875, 0.06082916259765625, 0.06351089477539062, 0.066192626953125, 0.06887435913085938, 0.07155609130859375, 0.07423782348632812, 0.0769195556640625, 0.07960128784179688, 0.08228302001953125, 0.08496475219726562, 0.087646484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 9.0, 13.0, 8.0, 12.0, 22.0, 16.0, 37.0, 37.0, 30.0, 38.0, 46.0, 49.0, 46.0, 56.0, 53.0, 46.0, 59.0, 48.0, 47.0, 44.0, 27.0, 40.0, 37.0, 25.0, 28.0, 25.0, 18.0, 19.0, 13.0, 8.0, 10.0, 3.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6264724731445312, -0.6064605712890625, -0.5864486694335938, -0.566436767578125, -0.5464248657226562, -0.5264129638671875, -0.5064010620117188, -0.48638916015625, -0.46637725830078125, -0.4463653564453125, -0.42635345458984375, -0.406341552734375, -0.38632965087890625, -0.3663177490234375, -0.34630584716796875, -0.3262939453125, -0.30628204345703125, -0.2862701416015625, -0.26625823974609375, -0.246246337890625, -0.22623443603515625, -0.2062225341796875, -0.18621063232421875, -0.16619873046875, -0.14618682861328125, -0.1261749267578125, -0.10616302490234375, -0.086151123046875, -0.06613922119140625, -0.0461273193359375, -0.02611541748046875, -0.006103515625, 0.01390838623046875, 0.0339202880859375, 0.05393218994140625, 0.073944091796875, 0.09395599365234375, 0.1139678955078125, 0.13397979736328125, 0.15399169921875, 0.17400360107421875, 0.1940155029296875, 0.21402740478515625, 0.234039306640625, 0.25405120849609375, 0.2740631103515625, 0.29407501220703125, 0.3140869140625, 0.33409881591796875, 0.3541107177734375, 0.37412261962890625, 0.394134521484375, 0.41414642333984375, 0.4341583251953125, 0.45417022705078125, 0.47418212890625, 0.49419403076171875, 0.5142059326171875, 0.5342178344726562, 0.554229736328125, 0.5742416381835938, 0.5942535400390625, 0.6142654418945312, 0.63427734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 8.0, 15.0, 15.0, 13.0, 38.0, 47.0, 67.0, 126.0, 198.0, 359.0, 561.0, 966.0, 1940.0, 4551.0, 13746.0, 59661.0, 413862.0, 460067.0, 67647.0, 15195.0, 4877.0, 2074.0, 1028.0, 557.0, 336.0, 190.0, 127.0, 70.0, 55.0, 44.0, 20.0, 16.0, 8.0, 11.0, 7.0, 11.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056427001953125, -0.054665565490722656, -0.05290412902832031, -0.05114269256591797, -0.049381256103515625, -0.04761981964111328, -0.04585838317871094, -0.044096946716308594, -0.04233551025390625, -0.040574073791503906, -0.03881263732910156, -0.03705120086669922, -0.035289764404296875, -0.03352832794189453, -0.03176689147949219, -0.030005455017089844, -0.0282440185546875, -0.026482582092285156, -0.024721145629882812, -0.02295970916748047, -0.021198272705078125, -0.01943683624267578, -0.017675399780273438, -0.015913963317871094, -0.01415252685546875, -0.012391090393066406, -0.010629653930664062, -0.008868217468261719, -0.007106781005859375, -0.005345344543457031, -0.0035839080810546875, -0.0018224716186523438, -6.103515625e-05, 0.0017004013061523438, 0.0034618377685546875, 0.005223274230957031, 0.006984710693359375, 0.008746147155761719, 0.010507583618164062, 0.012269020080566406, 0.01403045654296875, 0.015791893005371094, 0.017553329467773438, 0.01931476593017578, 0.021076202392578125, 0.02283763885498047, 0.024599075317382812, 0.026360511779785156, 0.0281219482421875, 0.029883384704589844, 0.03164482116699219, 0.03340625762939453, 0.035167694091796875, 0.03692913055419922, 0.03869056701660156, 0.040452003479003906, 0.04221343994140625, 0.043974876403808594, 0.04573631286621094, 0.04749774932861328, 0.049259185791015625, 0.05102062225341797, 0.05278205871582031, 0.054543495178222656, 0.056304931640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 8.0, 13.0, 18.0, 15.0, 27.0, 41.0, 49.0, 87.0, 116.0, 103.0, 98.0, 104.0, 99.0, 60.0, 44.0, 28.0, 28.0, 19.0, 11.0, 5.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5422701835632324e-05, -1.481175422668457e-05, -1.4200806617736816e-05, -1.3589859008789062e-05, -1.2978911399841309e-05, -1.2367963790893555e-05, -1.17570161819458e-05, -1.1146068572998047e-05, -1.0535120964050293e-05, -9.924173355102539e-06, -9.313225746154785e-06, -8.702278137207031e-06, -8.091330528259277e-06, -7.4803829193115234e-06, -6.8694353103637695e-06, -6.258487701416016e-06, -5.647540092468262e-06, -5.036592483520508e-06, -4.425644874572754e-06, -3.814697265625e-06, -3.203749656677246e-06, -2.592802047729492e-06, -1.9818544387817383e-06, -1.3709068298339844e-06, -7.599592208862305e-07, -1.4901161193847656e-07, 4.6193599700927734e-07, 1.0728836059570312e-06, 1.6838312149047852e-06, 2.294778823852539e-06, 2.905726432800293e-06, 3.516674041748047e-06, 4.127621650695801e-06, 4.738569259643555e-06, 5.349516868591309e-06, 5.9604644775390625e-06, 6.571412086486816e-06, 7.18235969543457e-06, 7.793307304382324e-06, 8.404254913330078e-06, 9.015202522277832e-06, 9.626150131225586e-06, 1.023709774017334e-05, 1.0848045349121094e-05, 1.1458992958068848e-05, 1.2069940567016602e-05, 1.2680888175964355e-05, 1.329183578491211e-05, 1.3902783393859863e-05, 1.4513731002807617e-05, 1.5124678611755371e-05, 1.5735626220703125e-05, 1.634657382965088e-05, 1.6957521438598633e-05, 1.7568469047546387e-05, 1.817941665649414e-05, 1.8790364265441895e-05, 1.940131187438965e-05, 2.0012259483337402e-05, 2.0623207092285156e-05, 2.123415470123291e-05, 2.1845102310180664e-05, 2.2456049919128418e-05, 2.3066997528076172e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 11.0, 16.0, 20.0, 32.0, 49.0, 69.0, 120.0, 195.0, 344.0, 633.0, 1291.0, 2835.0, 6393.0, 16304.0, 48022.0, 173572.0, 442151.0, 251014.0, 68669.0, 21411.0, 8379.0, 3521.0, 1632.0, 796.0, 429.0, 222.0, 152.0, 89.0, 66.0, 41.0, 15.0, 13.0, 13.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037506103515625, -0.03628206253051758, -0.035058021545410156, -0.033833980560302734, -0.03260993957519531, -0.03138589859008789, -0.03016185760498047, -0.028937816619873047, -0.027713775634765625, -0.026489734649658203, -0.02526569366455078, -0.02404165267944336, -0.022817611694335938, -0.021593570709228516, -0.020369529724121094, -0.019145488739013672, -0.01792144775390625, -0.016697406768798828, -0.015473365783691406, -0.014249324798583984, -0.013025283813476562, -0.01180124282836914, -0.010577201843261719, -0.009353160858154297, -0.008129119873046875, -0.006905078887939453, -0.005681037902832031, -0.004456996917724609, -0.0032329559326171875, -0.0020089149475097656, -0.0007848739624023438, 0.0004391670227050781, 0.0016632080078125, 0.002887248992919922, 0.004111289978027344, 0.005335330963134766, 0.0065593719482421875, 0.007783412933349609, 0.009007453918457031, 0.010231494903564453, 0.011455535888671875, 0.012679576873779297, 0.013903617858886719, 0.01512765884399414, 0.016351699829101562, 0.017575740814208984, 0.018799781799316406, 0.020023822784423828, 0.02124786376953125, 0.022471904754638672, 0.023695945739746094, 0.024919986724853516, 0.026144027709960938, 0.02736806869506836, 0.02859210968017578, 0.029816150665283203, 0.031040191650390625, 0.03226423263549805, 0.03348827362060547, 0.03471231460571289, 0.03593635559082031, 0.037160396575927734, 0.038384437561035156, 0.03960847854614258, 0.04083251953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 1.0, 6.0, 6.0, 13.0, 20.0, 19.0, 27.0, 38.0, 60.0, 52.0, 98.0, 119.0, 116.0, 113.0, 80.0, 60.0, 53.0, 23.0, 22.0, 15.0, 11.0, 11.0, 10.0, 4.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157928466796875, -0.015286445617675781, -0.014780044555664062, -0.014273643493652344, -0.013767242431640625, -0.013260841369628906, -0.012754440307617188, -0.012248039245605469, -0.01174163818359375, -0.011235237121582031, -0.010728836059570312, -0.010222434997558594, -0.009716033935546875, -0.009209632873535156, -0.008703231811523438, -0.008196830749511719, -0.0076904296875, -0.007184028625488281, -0.0066776275634765625, -0.006171226501464844, -0.005664825439453125, -0.005158424377441406, -0.0046520233154296875, -0.004145622253417969, -0.00363922119140625, -0.0031328201293945312, -0.0026264190673828125, -0.0021200180053710938, -0.001613616943359375, -0.0011072158813476562, -0.0006008148193359375, -9.441375732421875e-05, 0.0004119873046875, 0.0009183883666992188, 0.0014247894287109375, 0.0019311904907226562, 0.002437591552734375, 0.0029439926147460938, 0.0034503936767578125, 0.003956794738769531, 0.00446319580078125, 0.004969596862792969, 0.0054759979248046875, 0.005982398986816406, 0.006488800048828125, 0.006995201110839844, 0.0075016021728515625, 0.008008003234863281, 0.008514404296875, 0.009020805358886719, 0.009527206420898438, 0.010033607482910156, 0.010540008544921875, 0.011046409606933594, 0.011552810668945312, 0.012059211730957031, 0.01256561279296875, 0.013072013854980469, 0.013578414916992188, 0.014084815979003906, 0.014591217041015625, 0.015097618103027344, 0.015604019165039062, 0.01611042022705078, 0.0166168212890625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 5.0, 7.0, 9.0, 4.0, 11.0, 14.0, 21.0, 14.0, 25.0, 33.0, 46.0, 36.0, 61.0, 52.0, 50.0, 48.0, 65.0, 61.0, 45.0, 64.0, 37.0, 49.0, 41.0, 26.0, 37.0, 25.0, 27.0, 16.0, 16.0, 18.0, 9.0, 7.0, 6.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.18595542013645172, -0.1792585700750351, -0.17256172001361847, -0.16586488485336304, -0.1591680347919464, -0.15247118473052979, -0.14577433466911316, -0.13907748460769653, -0.1323806494474411, -0.12568379938602448, -0.11898695677518845, -0.11229010671377182, -0.10559326410293579, -0.09889641404151917, -0.09219956398010254, -0.08550272136926651, -0.07880587130784988, -0.07210902124643326, -0.06541217863559723, -0.0587153285741806, -0.052018485963344574, -0.04532163590192795, -0.03862478956580162, -0.03192794322967529, -0.025231096893548965, -0.018534250557422638, -0.011837403289973736, -0.005140556022524834, 0.0015562903136014938, 0.00825313851237297, 0.014949984848499298, 0.021646831184625626, 0.028343677520751953, 0.03504052385687828, 0.04173737019300461, 0.048434220254421234, 0.05513106286525726, 0.06182791292667389, 0.06852476298809052, 0.07522160559892654, 0.08191844820976257, 0.0886152982711792, 0.09531214088201523, 0.10200899094343185, 0.10870583355426788, 0.11540268361568451, 0.12209953367710114, 0.12879636883735657, 0.1354932188987732, 0.14219006896018982, 0.14888691902160645, 0.15558375418186188, 0.1622806042432785, 0.16897745430469513, 0.17567430436611176, 0.1823711395263672, 0.189068004488945, 0.19576485455036163, 0.20246170461177826, 0.2091585397720337, 0.21585538983345032, 0.22255223989486694, 0.22924908995628357, 0.2359459400177002, 0.24264277517795563]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 14.0, 10.0, 7.0, 16.0, 8.0, 23.0, 18.0, 25.0, 25.0, 15.0, 17.0, 40.0, 34.0, 21.0, 30.0, 25.0, 46.0, 42.0, 29.0, 42.0, 36.0, 37.0, 35.0, 36.0, 44.0, 35.0, 34.0, 30.0, 28.0, 35.0, 23.0, 21.0, 12.0, 17.0, 10.0, 9.0, 12.0, 6.0, 6.0, 7.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.19242826104164124, -0.18686546385288239, -0.18130266666412354, -0.1757398545742035, -0.17017705738544464, -0.1646142601966858, -0.15905144810676575, -0.1534886509180069, -0.14792585372924805, -0.1423630565404892, -0.13680025935173035, -0.1312374472618103, -0.12567465007305145, -0.1201118528842926, -0.11454904824495316, -0.10898624360561371, -0.10342344641685486, -0.09786064922809601, -0.09229784458875656, -0.08673503994941711, -0.08117224276065826, -0.07560944557189941, -0.07004664093255997, -0.06448383629322052, -0.05892103910446167, -0.05335823819041252, -0.04779543727636337, -0.042232636362314224, -0.036669835448265076, -0.031107034534215927, -0.02554423362016678, -0.01998143270611763, -0.014418631792068481, -0.008855830878019333, -0.0032930299639701843, 0.0022697709500789642, 0.007832571864128113, 0.013395372778177261, 0.01895817369222641, 0.02452097460627556, 0.030083775520324707, 0.035646576434373856, 0.041209377348423004, 0.04677217826247215, 0.0523349791765213, 0.05789778009057045, 0.0634605810046196, 0.06902338564395905, 0.0745861828327179, 0.08014898002147675, 0.08571178466081619, 0.09127458930015564, 0.09683738648891449, 0.10240018367767334, 0.10796298831701279, 0.11352579295635223, 0.11908859014511108, 0.12465138733386993, 0.13021418452262878, 0.13577699661254883, 0.14133979380130768, 0.14690259099006653, 0.15246540307998657, 0.15802820026874542, 0.16359099745750427]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 20.0, 32.0, 40.0, 60.0, 82.0, 159.0, 260.0, 484.0, 1023.0, 2061.0, 4781.0, 11512.0, 28786.0, 77900.0, 264970.0, 433249.0, 143351.0, 47324.0, 18756.0, 7437.0, 3291.0, 1406.0, 664.0, 360.0, 213.0, 125.0, 66.0, 43.0, 27.0, 23.0, 14.0, 12.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.3177146911621094, -0.30461883544921875, -0.2915229797363281, -0.2784271240234375, -0.2653312683105469, -0.25223541259765625, -0.23913955688476562, -0.226043701171875, -0.21294784545898438, -0.19985198974609375, -0.18675613403320312, -0.1736602783203125, -0.16056442260742188, -0.14746856689453125, -0.13437271118164062, -0.12127685546875, -0.10818099975585938, -0.09508514404296875, -0.08198928833007812, -0.0688934326171875, -0.055797576904296875, -0.04270172119140625, -0.029605865478515625, -0.016510009765625, -0.003414154052734375, 0.00968170166015625, 0.022777557373046875, 0.0358734130859375, 0.048969268798828125, 0.06206512451171875, 0.07516098022460938, 0.0882568359375, 0.10135269165039062, 0.11444854736328125, 0.12754440307617188, 0.1406402587890625, 0.15373611450195312, 0.16683197021484375, 0.17992782592773438, 0.193023681640625, 0.20611953735351562, 0.21921539306640625, 0.23231124877929688, 0.2454071044921875, 0.2585029602050781, 0.27159881591796875, 0.2846946716308594, 0.29779052734375, 0.3108863830566406, 0.32398223876953125, 0.3370780944824219, 0.3501739501953125, 0.3632698059082031, 0.37636566162109375, 0.3894615173339844, 0.402557373046875, 0.4156532287597656, 0.42874908447265625, 0.4418449401855469, 0.4549407958984375, 0.4680366516113281, 0.48113250732421875, 0.4942283630371094, 0.50732421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 17.0, 10.0, 16.0, 30.0, 22.0, 26.0, 33.0, 27.0, 45.0, 39.0, 51.0, 51.0, 50.0, 53.0, 58.0, 57.0, 45.0, 47.0, 53.0, 44.0, 36.0, 31.0, 27.0, 24.0, 26.0, 13.0, 13.0, 17.0, 7.0, 3.0, 13.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3087348937988281, -0.29544830322265625, -0.2821617126464844, -0.2688751220703125, -0.2555885314941406, -0.24230194091796875, -0.22901535034179688, -0.215728759765625, -0.20244216918945312, -0.18915557861328125, -0.17586898803710938, -0.1625823974609375, -0.14929580688476562, -0.13600921630859375, -0.12272262573242188, -0.10943603515625, -0.09614944458007812, -0.08286285400390625, -0.06957626342773438, -0.0562896728515625, -0.043003082275390625, -0.02971649169921875, -0.016429901123046875, -0.003143310546875, 0.010143280029296875, 0.02342987060546875, 0.036716461181640625, 0.0500030517578125, 0.06328964233398438, 0.07657623291015625, 0.08986282348632812, 0.1031494140625, 0.11643600463867188, 0.12972259521484375, 0.14300918579101562, 0.1562957763671875, 0.16958236694335938, 0.18286895751953125, 0.19615554809570312, 0.209442138671875, 0.22272872924804688, 0.23601531982421875, 0.24930191040039062, 0.2625885009765625, 0.2758750915527344, 0.28916168212890625, 0.3024482727050781, 0.31573486328125, 0.3290214538574219, 0.34230804443359375, 0.3555946350097656, 0.3688812255859375, 0.3821678161621094, 0.39545440673828125, 0.4087409973144531, 0.422027587890625, 0.4353141784667969, 0.44860076904296875, 0.4618873596191406, 0.4751739501953125, 0.4884605407714844, 0.5017471313476562, 0.5150337219238281, 0.5283203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 10.0, 14.0, 16.0, 21.0, 31.0, 47.0, 67.0, 102.0, 127.0, 210.0, 318.0, 462.0, 751.0, 1226.0, 2271.0, 4340.0, 8361.0, 16956.0, 36460.0, 84401.0, 209919.0, 349483.0, 190281.0, 76371.0, 33579.0, 15562.0, 7790.0, 3909.0, 2191.0, 1157.0, 720.0, 446.0, 290.0, 195.0, 140.0, 106.0, 65.0, 45.0, 27.0, 26.0, 15.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.331787109375, -0.32123565673828125, -0.3106842041015625, -0.30013275146484375, -0.289581298828125, -0.27902984619140625, -0.2684783935546875, -0.25792694091796875, -0.24737548828125, -0.23682403564453125, -0.2262725830078125, -0.21572113037109375, -0.205169677734375, -0.19461822509765625, -0.1840667724609375, -0.17351531982421875, -0.1629638671875, -0.15241241455078125, -0.1418609619140625, -0.13130950927734375, -0.120758056640625, -0.11020660400390625, -0.0996551513671875, -0.08910369873046875, -0.07855224609375, -0.06800079345703125, -0.0574493408203125, -0.04689788818359375, -0.036346435546875, -0.02579498291015625, -0.0152435302734375, -0.00469207763671875, 0.005859375, 0.01641082763671875, 0.0269622802734375, 0.03751373291015625, 0.048065185546875, 0.05861663818359375, 0.0691680908203125, 0.07971954345703125, 0.09027099609375, 0.10082244873046875, 0.1113739013671875, 0.12192535400390625, 0.132476806640625, 0.14302825927734375, 0.1535797119140625, 0.16413116455078125, 0.1746826171875, 0.18523406982421875, 0.1957855224609375, 0.20633697509765625, 0.216888427734375, 0.22743988037109375, 0.2379913330078125, 0.24854278564453125, 0.25909423828125, 0.26964569091796875, 0.2801971435546875, 0.29074859619140625, 0.301300048828125, 0.31185150146484375, 0.3224029541015625, 0.33295440673828125, 0.343505859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 9.0, 9.0, 11.0, 13.0, 21.0, 25.0, 28.0, 34.0, 31.0, 26.0, 37.0, 39.0, 37.0, 45.0, 36.0, 49.0, 34.0, 50.0, 44.0, 55.0, 38.0, 56.0, 26.0, 37.0, 28.0, 23.0, 26.0, 18.0, 18.0, 15.0, 12.0, 12.0, 13.0, 6.0, 3.0, 2.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3447265625, -0.33228302001953125, -0.3198394775390625, -0.30739593505859375, -0.294952392578125, -0.28250885009765625, -0.2700653076171875, -0.25762176513671875, -0.24517822265625, -0.23273468017578125, -0.2202911376953125, -0.20784759521484375, -0.195404052734375, -0.18296051025390625, -0.1705169677734375, -0.15807342529296875, -0.1456298828125, -0.13318634033203125, -0.1207427978515625, -0.10829925537109375, -0.095855712890625, -0.08341217041015625, -0.0709686279296875, -0.05852508544921875, -0.04608154296875, -0.03363800048828125, -0.0211944580078125, -0.00875091552734375, 0.003692626953125, 0.01613616943359375, 0.0285797119140625, 0.04102325439453125, 0.053466796875, 0.06591033935546875, 0.0783538818359375, 0.09079742431640625, 0.103240966796875, 0.11568450927734375, 0.1281280517578125, 0.14057159423828125, 0.15301513671875, 0.16545867919921875, 0.1779022216796875, 0.19034576416015625, 0.202789306640625, 0.21523284912109375, 0.2276763916015625, 0.24011993408203125, 0.2525634765625, 0.26500701904296875, 0.2774505615234375, 0.28989410400390625, 0.302337646484375, 0.31478118896484375, 0.3272247314453125, 0.33966827392578125, 0.35211181640625, 0.36455535888671875, 0.3769989013671875, 0.38944244384765625, 0.401885986328125, 0.41432952880859375, 0.4267730712890625, 0.43921661376953125, 0.45166015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 18.0, 39.0, 47.0, 54.0, 98.0, 178.0, 258.0, 380.0, 676.0, 1105.0, 1718.0, 3065.0, 5275.0, 10558.0, 24961.0, 82931.0, 319982.0, 436616.0, 104924.0, 29604.0, 11705.0, 5949.0, 3310.0, 1969.0, 1153.0, 704.0, 471.0, 296.0, 201.0, 106.0, 69.0, 34.0, 30.0, 15.0, 9.0, 6.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.10669898986816406, -0.10347366333007812, -0.10024833679199219, -0.09702301025390625, -0.09379768371582031, -0.09057235717773438, -0.08734703063964844, -0.0841217041015625, -0.08089637756347656, -0.07767105102539062, -0.07444572448730469, -0.07122039794921875, -0.06799507141113281, -0.06476974487304688, -0.06154441833496094, -0.058319091796875, -0.05509376525878906, -0.051868438720703125, -0.04864311218261719, -0.04541778564453125, -0.04219245910644531, -0.038967132568359375, -0.03574180603027344, -0.0325164794921875, -0.029291152954101562, -0.026065826416015625, -0.022840499877929688, -0.01961517333984375, -0.016389846801757812, -0.013164520263671875, -0.009939193725585938, -0.0067138671875, -0.0034885406494140625, -0.000263214111328125, 0.0029621124267578125, 0.00618743896484375, 0.009412765502929688, 0.012638092041015625, 0.015863418579101562, 0.0190887451171875, 0.022314071655273438, 0.025539398193359375, 0.028764724731445312, 0.03199005126953125, 0.03521537780761719, 0.038440704345703125, 0.04166603088378906, 0.044891357421875, 0.04811668395996094, 0.051342010498046875, 0.05456733703613281, 0.05779266357421875, 0.06101799011230469, 0.06424331665039062, 0.06746864318847656, 0.0706939697265625, 0.07391929626464844, 0.07714462280273438, 0.08036994934082031, 0.08359527587890625, 0.08682060241699219, 0.09004592895507812, 0.09327125549316406, 0.09649658203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 11.0, 17.0, 18.0, 31.0, 48.0, 80.0, 115.0, 181.0, 174.0, 110.0, 76.0, 35.0, 34.0, 21.0, 14.0, 7.0, 5.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.618001937866211e-05, -3.5113655030727386e-05, -3.4047290682792664e-05, -3.298092633485794e-05, -3.191456198692322e-05, -3.0848197638988495e-05, -2.9781833291053772e-05, -2.871546894311905e-05, -2.7649104595184326e-05, -2.6582740247249603e-05, -2.551637589931488e-05, -2.4450011551380157e-05, -2.3383647203445435e-05, -2.231728285551071e-05, -2.125091850757599e-05, -2.0184554159641266e-05, -1.9118189811706543e-05, -1.805182546377182e-05, -1.6985461115837097e-05, -1.5919096767902374e-05, -1.4852732419967651e-05, -1.3786368072032928e-05, -1.2720003724098206e-05, -1.1653639376163483e-05, -1.058727502822876e-05, -9.520910680294037e-06, -8.454546332359314e-06, -7.388181984424591e-06, -6.321817636489868e-06, -5.255453288555145e-06, -4.189088940620422e-06, -3.1227245926856995e-06, -2.0563602447509766e-06, -9.899958968162537e-07, 7.636845111846924e-08, 1.1427327990531921e-06, 2.209097146987915e-06, 3.275461494922638e-06, 4.341825842857361e-06, 5.408190190792084e-06, 6.474554538726807e-06, 7.5409188866615295e-06, 8.607283234596252e-06, 9.673647582530975e-06, 1.0740011930465698e-05, 1.1806376278400421e-05, 1.2872740626335144e-05, 1.3939104974269867e-05, 1.500546932220459e-05, 1.6071833670139313e-05, 1.7138198018074036e-05, 1.820456236600876e-05, 1.927092671394348e-05, 2.0337291061878204e-05, 2.1403655409812927e-05, 2.247001975774765e-05, 2.3536384105682373e-05, 2.4602748453617096e-05, 2.566911280155182e-05, 2.6735477149486542e-05, 2.7801841497421265e-05, 2.8868205845355988e-05, 2.993457019329071e-05, 3.100093454122543e-05, 3.2067298889160156e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 13.0, 6.0, 9.0, 10.0, 13.0, 20.0, 32.0, 40.0, 59.0, 63.0, 86.0, 133.0, 186.0, 231.0, 335.0, 482.0, 703.0, 1134.0, 1925.0, 3315.0, 6256.0, 13794.0, 40828.0, 206052.0, 593882.0, 125408.0, 29312.0, 11185.0, 5344.0, 2814.0, 1675.0, 999.0, 659.0, 465.0, 292.0, 207.0, 159.0, 102.0, 77.0, 58.0, 45.0, 35.0, 34.0, 22.0, 17.0, 7.0, 9.0, 11.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1611328125, -0.15582656860351562, -0.15052032470703125, -0.14521408081054688, -0.1399078369140625, -0.13460159301757812, -0.12929534912109375, -0.12398910522460938, -0.118682861328125, -0.11337661743164062, -0.10807037353515625, -0.10276412963867188, -0.0974578857421875, -0.09215164184570312, -0.08684539794921875, -0.08153915405273438, -0.07623291015625, -0.07092666625976562, -0.06562042236328125, -0.060314178466796875, -0.0550079345703125, -0.049701690673828125, -0.04439544677734375, -0.039089202880859375, -0.033782958984375, -0.028476715087890625, -0.02317047119140625, -0.017864227294921875, -0.0125579833984375, -0.007251739501953125, -0.00194549560546875, 0.003360748291015625, 0.0086669921875, 0.013973236083984375, 0.01927947998046875, 0.024585723876953125, 0.0298919677734375, 0.035198211669921875, 0.04050445556640625, 0.045810699462890625, 0.051116943359375, 0.056423187255859375, 0.06172943115234375, 0.06703567504882812, 0.0723419189453125, 0.07764816284179688, 0.08295440673828125, 0.08826065063476562, 0.09356689453125, 0.09887313842773438, 0.10417938232421875, 0.10948562622070312, 0.1147918701171875, 0.12009811401367188, 0.12540435791015625, 0.13071060180664062, 0.136016845703125, 0.14132308959960938, 0.14662933349609375, 0.15193557739257812, 0.1572418212890625, 0.16254806518554688, 0.16785430908203125, 0.17316055297851562, 0.178466796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 4.0, 5.0, 9.0, 8.0, 12.0, 16.0, 24.0, 47.0, 55.0, 61.0, 143.0, 175.0, 105.0, 81.0, 63.0, 54.0, 28.0, 31.0, 17.0, 12.0, 9.0, 6.0, 6.0, 2.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07918643951416016, -0.07609748840332031, -0.07300853729248047, -0.06991958618164062, -0.06683063507080078, -0.06374168395996094, -0.060652732849121094, -0.05756378173828125, -0.054474830627441406, -0.05138587951660156, -0.04829692840576172, -0.045207977294921875, -0.04211902618408203, -0.03903007507324219, -0.035941123962402344, -0.0328521728515625, -0.029763221740722656, -0.026674270629882812, -0.02358531951904297, -0.020496368408203125, -0.01740741729736328, -0.014318466186523438, -0.011229515075683594, -0.00814056396484375, -0.005051612854003906, -0.0019626617431640625, 0.0011262893676757812, 0.004215240478515625, 0.007304191589355469, 0.010393142700195312, 0.013482093811035156, 0.016571044921875, 0.019659996032714844, 0.022748947143554688, 0.02583789825439453, 0.028926849365234375, 0.03201580047607422, 0.03510475158691406, 0.038193702697753906, 0.04128265380859375, 0.044371604919433594, 0.04746055603027344, 0.05054950714111328, 0.053638458251953125, 0.05672740936279297, 0.05981636047363281, 0.06290531158447266, 0.0659942626953125, 0.06908321380615234, 0.07217216491699219, 0.07526111602783203, 0.07835006713867188, 0.08143901824951172, 0.08452796936035156, 0.0876169204711914, 0.09070587158203125, 0.0937948226928711, 0.09688377380371094, 0.09997272491455078, 0.10306167602539062, 0.10615062713623047, 0.10923957824707031, 0.11232852935791016, 0.11541748046875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 9.0, 17.0, 23.0, 35.0, 36.0, 55.0, 65.0, 80.0, 74.0, 76.0, 85.0, 90.0, 52.0, 69.0, 51.0, 45.0, 32.0, 21.0, 19.0, 17.0, 10.0, 3.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7494366765022278, -0.7291948795318604, -0.7089530825614929, -0.6887112855911255, -0.6684694290161133, -0.6482276320457458, -0.6279858350753784, -0.607744038105011, -0.5875022411346436, -0.5672604441642761, -0.5470186471939087, -0.5267768502235413, -0.5065350532531738, -0.486293226480484, -0.4660513997077942, -0.44580960273742676, -0.4255678057670593, -0.4053260087966919, -0.38508421182632446, -0.36484238505363464, -0.3446005880832672, -0.3243587911128998, -0.30411696434020996, -0.28387516736984253, -0.2636333703994751, -0.24339157342910767, -0.22314976155757904, -0.20290794968605042, -0.18266615271568298, -0.16242435574531555, -0.14218254387378693, -0.1219407320022583, -0.10169899463653564, -0.08145719021558762, -0.06121538579463959, -0.04097358137369156, -0.02073177695274353, -0.0004899725317955017, 0.019751831889152527, 0.03999364376068115, 0.060235440731048584, 0.08047724515199661, 0.10071904957294464, 0.12096085399389267, 0.1412026584148407, 0.16144445538520813, 0.18168626725673676, 0.20192807912826538, 0.2221698760986328, 0.24241167306900024, 0.2626534700393677, 0.2828952968120575, 0.3031370937824249, 0.32337889075279236, 0.3436207175254822, 0.3638625144958496, 0.38410431146621704, 0.4043461084365845, 0.4245879054069519, 0.4448297321796417, 0.46507152915000916, 0.4853133261203766, 0.5055551528930664, 0.5257969498634338, 0.5460387468338013]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 5.0, 8.0, 6.0, 15.0, 9.0, 16.0, 15.0, 17.0, 26.0, 25.0, 23.0, 18.0, 33.0, 40.0, 36.0, 37.0, 48.0, 46.0, 47.0, 48.0, 40.0, 39.0, 33.0, 38.0, 41.0, 30.0, 38.0, 38.0, 22.0, 22.0, 24.0, 18.0, 16.0, 17.0, 11.0, 10.0, 13.0, 8.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.647750735282898, -0.6275076866149902, -0.6072646379470825, -0.58702152967453, -0.5667784810066223, -0.5465354323387146, -0.5262923836708069, -0.5060493350028992, -0.48580625653266907, -0.46556320786476135, -0.44532012939453125, -0.42507708072662354, -0.4048340320587158, -0.3845909535884857, -0.364347904920578, -0.3441048264503479, -0.3238617777824402, -0.30361872911453247, -0.28337565064430237, -0.26313260197639465, -0.24288953840732574, -0.22264647483825684, -0.20240342617034912, -0.1821603626012802, -0.1619172990322113, -0.1416742354631424, -0.12143117934465408, -0.10118812322616577, -0.08094505965709686, -0.060701996088027954, -0.04045893996953964, -0.02021588385105133, 2.7120113372802734e-05, 0.020270179957151413, 0.04051323980093002, 0.06075629964470863, 0.08099935948848724, 0.10124242305755615, 0.12148547917604446, 0.14172853529453278, 0.16197159886360168, 0.1822146624326706, 0.2024577260017395, 0.22270077466964722, 0.24294383823871613, 0.26318690180778503, 0.28342995047569275, 0.30367302894592285, 0.32391607761383057, 0.3441591262817383, 0.3644022047519684, 0.3846452534198761, 0.4048883318901062, 0.4251313805580139, 0.44537442922592163, 0.46561747789382935, 0.48586055636405945, 0.5061036348342896, 0.5263466835021973, 0.546589732170105, 0.5668327808380127, 0.5870758295059204, 0.6073189377784729, 0.6275619864463806, 0.6478050351142883]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 6.0, 11.0, 8.0, 14.0, 20.0, 25.0, 39.0, 47.0, 87.0, 84.0, 105.0, 152.0, 206.0, 240.0, 314.0, 444.0, 536.0, 715.0, 904.0, 1154.0, 1575.0, 2059.0, 2820.0, 1026950.0, 2983.0, 2195.0, 1578.0, 1250.0, 967.0, 726.0, 562.0, 417.0, 342.0, 279.0, 188.0, 135.0, 116.0, 66.0, 76.0, 54.0, 45.0, 26.0, 23.0, 19.0, 15.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0], "bins": [-0.6502943634986877, -0.6314799785614014, -0.6126656532287598, -0.5938512682914734, -0.575036883354187, -0.5562224984169006, -0.537408173084259, -0.5185937881469727, -0.4997794032096863, -0.4809650480747223, -0.4621506631374359, -0.4433363080024719, -0.42452192306518555, -0.40570756793022156, -0.38689321279525757, -0.3680788278579712, -0.3492644727230072, -0.3304501175880432, -0.31163573265075684, -0.29282137751579285, -0.27400699257850647, -0.2551926374435425, -0.2363782674074173, -0.21756389737129211, -0.19874952733516693, -0.17993515729904175, -0.16112078726291656, -0.14230641722679138, -0.1234920546412468, -0.10467768460512161, -0.08586332201957703, -0.06704895198345184, -0.04823458194732666, -0.029420213773846626, -0.010605845600366592, 0.008208520710468292, 0.027022890746593475, 0.04583726078271866, 0.06465162336826324, 0.08346599340438843, 0.10228036344051361, 0.1210947334766388, 0.13990910351276398, 0.15872347354888916, 0.17753782868385315, 0.19635221362113953, 0.21516656875610352, 0.2339809387922287, 0.2527953088283539, 0.27160966396331787, 0.29042404890060425, 0.30923840403556824, 0.3280527889728546, 0.3468671441078186, 0.365681529045105, 0.38449588418006897, 0.40331023931503296, 0.42212459444999695, 0.4409389793872833, 0.4597533345222473, 0.4785677194595337, 0.4973820745944977, 0.5161964297294617, 0.535010814666748, 0.5538251996040344]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 38.0, 52.0, 90.0, 172.0, 538.0, 2376.0, 10497.0, 51408328.0, 38773.0, 7689.0, 1898.0, 499.0, 173.0, 68.0, 46.0, 23.0, 15.0, 6.0, 7.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.745380401611328, -4.591394424438477, -4.437408924102783, -4.283422946929932, -4.129437446594238, -3.9754514694213867, -3.821465492248535, -3.6674797534942627, -3.5134940147399902, -3.3595082759857178, -3.2055225372314453, -3.0515365600585938, -2.8975508213043213, -2.743565082550049, -2.5895791053771973, -2.435593366622925, -2.2816076278686523, -2.12762188911438, -1.9736360311508179, -1.8196501731872559, -1.6656644344329834, -1.511678695678711, -1.357692837715149, -1.203706979751587, -1.0497212409973145, -0.8957354426383972, -0.74174964427948, -0.5877638459205627, -0.4337780475616455, -0.27979224920272827, -0.12580645084381104, 0.028179407119750977, 0.18216562271118164, 0.3361514210700989, 0.4901372194290161, 0.6441230177879333, 0.7981088161468506, 0.9520946145057678, 1.106080412864685, 1.260066270828247, 1.4140520095825195, 1.568037748336792, 1.722023606300354, 1.876009464263916, 2.0299952030181885, 2.183980941772461, 2.3379669189453125, 2.491952657699585, 2.6459383964538574, 2.79992413520813, 2.9539098739624023, 3.107895851135254, 3.2618815898895264, 3.415867328643799, 3.5698533058166504, 3.723839044570923, 3.8778247833251953, 4.031810760498047, 4.18579626083374, 4.339782238006592, 4.493767738342285, 4.647753715515137, 4.801739692687988, 4.95572566986084, 5.109711170196533]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 9.0, 27.0, 46.0, 51.0, 82.0, 122.0, 193.0, 278.0, 419.0, 588.0, 939.0, 1494.0, 2423.0, 3776.0, 5903.0, 9787.0, 16188.0, 27570.0, 46782.0, 78155.0, 127759.0, 199437.0, 287856.0, 405032.0, 2099396.0, 1796344.0, 392559.0, 281750.0, 193065.0, 123994.0, 76288.0, 45417.0, 26655.0, 15840.0, 9379.0, 5793.0, 3617.0, 2183.0, 1494.0, 943.0, 608.0, 405.0, 272.0, 165.0, 116.0, 98.0, 43.0, 31.0, 18.0, 19.0, 12.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.4375, -0.423370361328125, -0.40924072265625, -0.395111083984375, -0.3809814453125, -0.366851806640625, -0.35272216796875, -0.338592529296875, -0.324462890625, -0.310333251953125, -0.29620361328125, -0.282073974609375, -0.2679443359375, -0.253814697265625, -0.23968505859375, -0.225555419921875, -0.21142578125, -0.197296142578125, -0.18316650390625, -0.169036865234375, -0.1549072265625, -0.140777587890625, -0.12664794921875, -0.112518310546875, -0.098388671875, -0.084259033203125, -0.07012939453125, -0.055999755859375, -0.0418701171875, -0.027740478515625, -0.01361083984375, 0.000518798828125, 0.0146484375, 0.028778076171875, 0.04290771484375, 0.057037353515625, 0.0711669921875, 0.085296630859375, 0.09942626953125, 0.113555908203125, 0.127685546875, 0.141815185546875, 0.15594482421875, 0.170074462890625, 0.1842041015625, 0.198333740234375, 0.21246337890625, 0.226593017578125, 0.24072265625, 0.254852294921875, 0.26898193359375, 0.283111572265625, 0.2972412109375, 0.311370849609375, 0.32550048828125, 0.339630126953125, 0.353759765625, 0.367889404296875, 0.38201904296875, 0.396148681640625, 0.4102783203125, 0.424407958984375, 0.43853759765625, 0.452667236328125, 0.466796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 6.0, 7.0, 4.0, 3.0, 11.0, 16.0, 16.0, 13.0, 13.0, 18.0, 21.0, 33.0, 38.0, 36.0, 35.0, 36.0, 39.0, 42.0, 39.0, 167.0, 837.0, 125.0, 40.0, 43.0, 31.0, 59.0, 38.0, 29.0, 27.0, 23.0, 24.0, 22.0, 20.0, 23.0, 14.0, 11.0, 14.0, 8.0, 7.0, 5.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.328125, -3.234100341796875, -3.14007568359375, -3.046051025390625, -2.9520263671875, -2.858001708984375, -2.76397705078125, -2.669952392578125, -2.575927734375, -2.481903076171875, -2.38787841796875, -2.293853759765625, -2.1998291015625, -2.105804443359375, -2.01177978515625, -1.917755126953125, -1.82373046875, -1.729705810546875, -1.63568115234375, -1.541656494140625, -1.4476318359375, -1.353607177734375, -1.25958251953125, -1.165557861328125, -1.071533203125, -0.977508544921875, -0.88348388671875, -0.789459228515625, -0.6954345703125, -0.601409912109375, -0.50738525390625, -0.413360595703125, -0.3193359375, -0.225311279296875, -0.13128662109375, -0.037261962890625, 0.0567626953125, 0.150787353515625, 0.24481201171875, 0.338836669921875, 0.432861328125, 0.526885986328125, 0.62091064453125, 0.714935302734375, 0.8089599609375, 0.902984619140625, 0.99700927734375, 1.091033935546875, 1.18505859375, 1.279083251953125, 1.37310791015625, 1.467132568359375, 1.5611572265625, 1.655181884765625, 1.74920654296875, 1.843231201171875, 1.937255859375, 2.031280517578125, 2.12530517578125, 2.219329833984375, 2.3133544921875, 2.407379150390625, 2.50140380859375, 2.595428466796875, 2.689453125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 6.0, 4.0, 10.0, 17.0, 21.0, 32.0, 35.0, 80.0, 123.0, 192.0, 348.0, 546.0, 958.0, 1584.0, 2712.0, 4438.0, 7514.0, 12289.0, 20129.0, 31990.0, 49235.0, 73589.0, 106276.0, 146225.0, 191202.0, 236494.0, 290545.0, 926580.0, 2559152.0, 544639.0, 271067.0, 223278.0, 178481.0, 133432.0, 96011.0, 66066.0, 43378.0, 28233.0, 17563.0, 10717.0, 6456.0, 3913.0, 2351.0, 1393.0, 851.0, 496.0, 318.0, 181.0, 122.0, 71.0, 48.0, 16.0, 17.0, 7.0, 4.0, 6.0, 7.0, 1.0], "bins": [-0.291259765625, -0.28278350830078125, -0.2743072509765625, -0.26583099365234375, -0.257354736328125, -0.24887847900390625, -0.2404022216796875, -0.23192596435546875, -0.22344970703125, -0.21497344970703125, -0.2064971923828125, -0.19802093505859375, -0.189544677734375, -0.18106842041015625, -0.1725921630859375, -0.16411590576171875, -0.1556396484375, -0.14716339111328125, -0.1386871337890625, -0.13021087646484375, -0.121734619140625, -0.11325836181640625, -0.1047821044921875, -0.09630584716796875, -0.08782958984375, -0.07935333251953125, -0.0708770751953125, -0.06240081787109375, -0.053924560546875, -0.04544830322265625, -0.0369720458984375, -0.02849578857421875, -0.02001953125, -0.01154327392578125, -0.0030670166015625, 0.00540924072265625, 0.013885498046875, 0.02236175537109375, 0.0308380126953125, 0.03931427001953125, 0.04779052734375, 0.05626678466796875, 0.0647430419921875, 0.07321929931640625, 0.081695556640625, 0.09017181396484375, 0.0986480712890625, 0.10712432861328125, 0.1156005859375, 0.12407684326171875, 0.1325531005859375, 0.14102935791015625, 0.149505615234375, 0.15798187255859375, 0.1664581298828125, 0.17493438720703125, 0.18341064453125, 0.19188690185546875, 0.2003631591796875, 0.20883941650390625, 0.217315673828125, 0.22579193115234375, 0.2342681884765625, 0.24274444580078125, 0.251220703125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 12.0, 9.0, 7.0, 9.0, 8.0, 9.0, 21.0, 20.0, 33.0, 21.0, 36.0, 34.0, 34.0, 32.0, 43.0, 43.0, 39.0, 29.0, 77.0, 571.0, 468.0, 66.0, 34.0, 34.0, 31.0, 30.0, 36.0, 28.0, 29.0, 27.0, 31.0, 24.0, 17.0, 14.0, 15.0, 11.0, 11.0, 10.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.982421875, -1.913787841796875, -1.84515380859375, -1.776519775390625, -1.7078857421875, -1.639251708984375, -1.57061767578125, -1.501983642578125, -1.433349609375, -1.364715576171875, -1.29608154296875, -1.227447509765625, -1.1588134765625, -1.090179443359375, -1.02154541015625, -0.952911376953125, -0.88427734375, -0.815643310546875, -0.74700927734375, -0.678375244140625, -0.6097412109375, -0.541107177734375, -0.47247314453125, -0.403839111328125, -0.335205078125, -0.266571044921875, -0.19793701171875, -0.129302978515625, -0.0606689453125, 0.007965087890625, 0.07659912109375, 0.145233154296875, 0.2138671875, 0.282501220703125, 0.35113525390625, 0.419769287109375, 0.4884033203125, 0.557037353515625, 0.62567138671875, 0.694305419921875, 0.762939453125, 0.831573486328125, 0.90020751953125, 0.968841552734375, 1.0374755859375, 1.106109619140625, 1.17474365234375, 1.243377685546875, 1.31201171875, 1.380645751953125, 1.44927978515625, 1.517913818359375, 1.5865478515625, 1.655181884765625, 1.72381591796875, 1.792449951171875, 1.861083984375, 1.929718017578125, 1.99835205078125, 2.066986083984375, 2.1356201171875, 2.204254150390625, 2.27288818359375, 2.341522216796875, 2.41015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 0.0, 12.0, 17.0, 28.0, 44.0, 79.0, 100.0, 144.0, 223.0, 341.0, 526.0, 789.0, 1181.0, 2060.0, 4443.0, 11523.0, 38096.0, 135976.0, 415798.0, 1473015.0, 3447260.0, 508050.0, 176376.0, 49562.0, 14682.0, 5099.0, 2290.0, 1309.0, 789.0, 523.0, 368.0, 254.0, 145.0, 115.0, 73.0, 52.0, 27.0, 15.0, 18.0, 14.0, 4.0, 3.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.74169921875, -0.718597412109375, -0.69549560546875, -0.672393798828125, -0.6492919921875, -0.626190185546875, -0.60308837890625, -0.579986572265625, -0.556884765625, -0.533782958984375, -0.51068115234375, -0.487579345703125, -0.4644775390625, -0.441375732421875, -0.41827392578125, -0.395172119140625, -0.3720703125, -0.348968505859375, -0.32586669921875, -0.302764892578125, -0.2796630859375, -0.256561279296875, -0.23345947265625, -0.210357666015625, -0.187255859375, -0.164154052734375, -0.14105224609375, -0.117950439453125, -0.0948486328125, -0.071746826171875, -0.04864501953125, -0.025543212890625, -0.00244140625, 0.020660400390625, 0.04376220703125, 0.066864013671875, 0.0899658203125, 0.113067626953125, 0.13616943359375, 0.159271240234375, 0.182373046875, 0.205474853515625, 0.22857666015625, 0.251678466796875, 0.2747802734375, 0.297882080078125, 0.32098388671875, 0.344085693359375, 0.3671875, 0.390289306640625, 0.41339111328125, 0.436492919921875, 0.4595947265625, 0.482696533203125, 0.50579833984375, 0.528900146484375, 0.552001953125, 0.575103759765625, 0.59820556640625, 0.621307373046875, 0.6444091796875, 0.667510986328125, 0.69061279296875, 0.713714599609375, 0.73681640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 3.0, 12.0, 8.0, 11.0, 19.0, 18.0, 17.0, 15.0, 18.0, 32.0, 42.0, 31.0, 52.0, 53.0, 42.0, 49.0, 158.0, 808.0, 206.0, 55.0, 48.0, 36.0, 40.0, 37.0, 39.0, 26.0, 32.0, 26.0, 19.0, 18.0, 13.0, 10.0, 6.0, 5.0, 12.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7065277099609375, -1.644500732421875, -1.5824737548828125, -1.52044677734375, -1.4584197998046875, -1.396392822265625, -1.3343658447265625, -1.2723388671875, -1.2103118896484375, -1.148284912109375, -1.0862579345703125, -1.02423095703125, -0.9622039794921875, -0.900177001953125, -0.8381500244140625, -0.776123046875, -0.7140960693359375, -0.652069091796875, -0.5900421142578125, -0.52801513671875, -0.4659881591796875, -0.403961181640625, -0.3419342041015625, -0.2799072265625, -0.2178802490234375, -0.155853271484375, -0.0938262939453125, -0.03179931640625, 0.0302276611328125, 0.092254638671875, 0.1542816162109375, 0.21630859375, 0.2783355712890625, 0.340362548828125, 0.4023895263671875, 0.46441650390625, 0.5264434814453125, 0.588470458984375, 0.6504974365234375, 0.7125244140625, 0.7745513916015625, 0.836578369140625, 0.8986053466796875, 0.96063232421875, 1.0226593017578125, 1.084686279296875, 1.1467132568359375, 1.208740234375, 1.2707672119140625, 1.332794189453125, 1.3948211669921875, 1.45684814453125, 1.5188751220703125, 1.580902099609375, 1.6429290771484375, 1.7049560546875, 1.7669830322265625, 1.829010009765625, 1.8910369873046875, 1.95306396484375, 2.0150909423828125, 2.077117919921875, 2.1391448974609375, 2.201171875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 8.0, 32.0, 60.0, 115.0, 153.0, 202.0, 173.0, 97.0, 59.0, 32.0, 29.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6002211570739746, -2.449687957763672, -2.29915452003479, -2.1486213207244873, -1.998088002204895, -1.8475546836853027, -1.697021484375, -1.5464881658554077, -1.3959548473358154, -1.2454215288162231, -1.0948882102966309, -0.9443550109863281, -0.7938216924667358, -0.6432883739471436, -0.49275511503219604, -0.34222185611724854, -0.19168853759765625, -0.04115524888038635, 0.10937803983688354, 0.25991132855415344, 0.41044461727142334, 0.5609779357910156, 0.7115111947059631, 0.8620444536209106, 1.012577772140503, 1.1631110906600952, 1.3136444091796875, 1.4641776084899902, 1.6147109270095825, 1.7652442455291748, 1.9157774448394775, 2.0663108825683594, 2.2168445587158203, 2.367377758026123, 2.517911195755005, 2.6684443950653076, 2.8189778327941895, 2.969511032104492, 3.120044231414795, 3.2705774307250977, 3.4211108684539795, 3.5716440677642822, 3.722177505493164, 3.872710704803467, 4.0232439041137695, 4.1737775802612305, 4.324310779571533, 4.474843978881836, 4.625377178192139, 4.775910377502441, 4.926443576812744, 5.076977252960205, 5.227510452270508, 5.3780436515808105, 5.528576850891113, 5.679110050201416, 5.829643249511719, 5.9801764488220215, 6.130709648132324, 6.281243324279785, 6.431776523590088, 6.582309722900391, 6.732842922210693, 6.883376121520996, 7.033909797668457]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 4.0, 6.0, 5.0, 10.0, 8.0, 20.0, 10.0, 14.0, 13.0, 24.0, 20.0, 33.0, 23.0, 29.0, 38.0, 44.0, 36.0, 37.0, 46.0, 40.0, 43.0, 50.0, 43.0, 28.0, 36.0, 30.0, 33.0, 30.0, 32.0, 24.0, 32.0, 25.0, 16.0, 12.0, 11.0, 12.0, 17.0, 8.0, 11.0, 6.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.8203513622283936, -2.733710765838623, -2.6470701694488525, -2.560429573059082, -2.4737892150878906, -2.38714861869812, -2.3005080223083496, -2.213867425918579, -2.1272268295288086, -2.040586233139038, -1.9539457559585571, -1.8673051595687866, -1.7806646823883057, -1.6940240859985352, -1.6073834896087646, -1.5207428932189941, -1.4341025352478027, -1.3474619388580322, -1.2608214616775513, -1.1741808652877808, -1.0875403881072998, -1.0008997917175293, -0.9142591953277588, -0.8276186585426331, -0.7409781217575073, -0.6543375849723816, -0.5676970481872559, -0.48105645179748535, -0.3944159150123596, -0.3077753782272339, -0.22113478183746338, -0.13449424505233765, -0.04785346984863281, 0.038787081837654114, 0.12542763352394104, 0.21206820011138916, 0.2987087368965149, 0.3853492736816406, 0.47198987007141113, 0.5586304068565369, 0.6452709436416626, 0.7319114804267883, 0.8185520172119141, 0.9051926136016846, 0.9918331503868103, 1.078473687171936, 1.1651142835617065, 1.2517547607421875, 1.338395357131958, 1.4250359535217285, 1.5116764307022095, 1.59831702709198, 1.684957504272461, 1.7715981006622314, 1.858238697052002, 1.9448792934417725, 2.031519889831543, 2.1181604862213135, 2.204801082611084, 2.2914414405822754, 2.378082036972046, 2.4647226333618164, 2.551363229751587, 2.6380038261413574, 2.724644184112549]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 10.0, 8.0, 11.0, 13.0, 26.0, 35.0, 60.0, 101.0, 178.0, 358.0, 738.0, 1600.0, 3821.0, 10280.0, 31025.0, 225844.0, 2966823.0, 864763.0, 60431.0, 16224.0, 6715.0, 2708.0, 1255.0, 592.0, 304.0, 138.0, 65.0, 45.0, 23.0, 25.0, 18.0, 9.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.142333984375, -0.13834857940673828, -0.13436317443847656, -0.13037776947021484, -0.12639236450195312, -0.1224069595336914, -0.11842155456542969, -0.11443614959716797, -0.11045074462890625, -0.10646533966064453, -0.10247993469238281, -0.0984945297241211, -0.09450912475585938, -0.09052371978759766, -0.08653831481933594, -0.08255290985107422, -0.0785675048828125, -0.07458209991455078, -0.07059669494628906, -0.06661128997802734, -0.06262588500976562, -0.058640480041503906, -0.05465507507324219, -0.05066967010498047, -0.04668426513671875, -0.04269886016845703, -0.03871345520019531, -0.034728050231933594, -0.030742645263671875, -0.026757240295410156, -0.022771835327148438, -0.01878643035888672, -0.014801025390625, -0.010815620422363281, -0.0068302154541015625, -0.0028448104858398438, 0.001140594482421875, 0.005125999450683594, 0.009111404418945312, 0.013096809387207031, 0.01708221435546875, 0.02106761932373047, 0.025053024291992188, 0.029038429260253906, 0.033023834228515625, 0.037009239196777344, 0.04099464416503906, 0.04498004913330078, 0.0489654541015625, 0.05295085906982422, 0.05693626403808594, 0.060921669006347656, 0.06490707397460938, 0.0688924789428711, 0.07287788391113281, 0.07686328887939453, 0.08084869384765625, 0.08483409881591797, 0.08881950378417969, 0.0928049087524414, 0.09679031372070312, 0.10077571868896484, 0.10476112365722656, 0.10874652862548828, 0.11273193359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 12.0, 9.0, 18.0, 17.0, 32.0, 33.0, 31.0, 34.0, 35.0, 59.0, 66.0, 68.0, 58.0, 59.0, 67.0, 49.0, 35.0, 44.0, 55.0, 39.0, 23.0, 16.0, 18.0, 22.0, 25.0, 6.0, 6.0, 7.0, 7.0, 2.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06146526336669922, -0.05969810485839844, -0.057930946350097656, -0.056163787841796875, -0.054396629333496094, -0.05262947082519531, -0.05086231231689453, -0.04909515380859375, -0.04732799530029297, -0.04556083679199219, -0.043793678283691406, -0.042026519775390625, -0.040259361267089844, -0.03849220275878906, -0.03672504425048828, -0.0349578857421875, -0.03319072723388672, -0.03142356872558594, -0.029656410217285156, -0.027889251708984375, -0.026122093200683594, -0.024354934692382812, -0.02258777618408203, -0.02082061767578125, -0.01905345916748047, -0.017286300659179688, -0.015519142150878906, -0.013751983642578125, -0.011984825134277344, -0.010217666625976562, -0.008450508117675781, -0.006683349609375, -0.004916191101074219, -0.0031490325927734375, -0.0013818740844726562, 0.000385284423828125, 0.0021524429321289062, 0.0039196014404296875, 0.005686759948730469, 0.00745391845703125, 0.009221076965332031, 0.010988235473632812, 0.012755393981933594, 0.014522552490234375, 0.016289710998535156, 0.018056869506835938, 0.01982402801513672, 0.0215911865234375, 0.02335834503173828, 0.025125503540039062, 0.026892662048339844, 0.028659820556640625, 0.030426979064941406, 0.03219413757324219, 0.03396129608154297, 0.03572845458984375, 0.03749561309814453, 0.03926277160644531, 0.041029930114746094, 0.042797088623046875, 0.044564247131347656, 0.04633140563964844, 0.04809856414794922, 0.04986572265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 11.0, 8.0, 10.0, 8.0, 13.0, 20.0, 43.0, 44.0, 75.0, 130.0, 348.0, 1266.0, 6396.0, 54846.0, 1291728.0, 2703583.0, 121614.0, 11193.0, 1971.0, 492.0, 172.0, 85.0, 51.0, 28.0, 25.0, 23.0, 13.0, 13.0, 10.0, 5.0, 7.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.09572029113769531, -0.09231948852539062, -0.08891868591308594, -0.08551788330078125, -0.08211708068847656, -0.07871627807617188, -0.07531547546386719, -0.0719146728515625, -0.06851387023925781, -0.06511306762695312, -0.06171226501464844, -0.05831146240234375, -0.05491065979003906, -0.051509857177734375, -0.04810905456542969, -0.044708251953125, -0.04130744934082031, -0.037906646728515625, -0.03450584411621094, -0.03110504150390625, -0.027704238891601562, -0.024303436279296875, -0.020902633666992188, -0.0175018310546875, -0.014101028442382812, -0.010700225830078125, -0.0072994232177734375, -0.00389862060546875, -0.0004978179931640625, 0.002902984619140625, 0.0063037872314453125, 0.00970458984375, 0.013105392456054688, 0.016506195068359375, 0.019906997680664062, 0.02330780029296875, 0.026708602905273438, 0.030109405517578125, 0.03351020812988281, 0.0369110107421875, 0.04031181335449219, 0.043712615966796875, 0.04711341857910156, 0.05051422119140625, 0.05391502380371094, 0.057315826416015625, 0.06071662902832031, 0.064117431640625, 0.06751823425292969, 0.07091903686523438, 0.07431983947753906, 0.07772064208984375, 0.08112144470214844, 0.08452224731445312, 0.08792304992675781, 0.0913238525390625, 0.09472465515136719, 0.09812545776367188, 0.10152626037597656, 0.10492706298828125, 0.10832786560058594, 0.11172866821289062, 0.11512947082519531, 0.1185302734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 9.0, 15.0, 18.0, 28.0, 50.0, 86.0, 123.0, 164.0, 295.0, 398.0, 560.0, 598.0, 520.0, 423.0, 239.0, 174.0, 100.0, 83.0, 38.0, 36.0, 21.0, 17.0, 10.0, 15.0, 10.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06787109375, -0.0660099983215332, -0.0641489028930664, -0.06228780746459961, -0.06042671203613281, -0.058565616607666016, -0.05670452117919922, -0.05484342575073242, -0.052982330322265625, -0.05112123489379883, -0.04926013946533203, -0.047399044036865234, -0.04553794860839844, -0.04367685317993164, -0.041815757751464844, -0.03995466232299805, -0.03809356689453125, -0.03623247146606445, -0.034371376037597656, -0.03251028060913086, -0.030649185180664062, -0.028788089752197266, -0.02692699432373047, -0.025065898895263672, -0.023204803466796875, -0.021343708038330078, -0.01948261260986328, -0.017621517181396484, -0.015760421752929688, -0.01389932632446289, -0.012038230895996094, -0.010177135467529297, -0.0083160400390625, -0.006454944610595703, -0.004593849182128906, -0.0027327537536621094, -0.0008716583251953125, 0.0009894371032714844, 0.0028505325317382812, 0.004711627960205078, 0.006572723388671875, 0.008433818817138672, 0.010294914245605469, 0.012156009674072266, 0.014017105102539062, 0.01587820053100586, 0.017739295959472656, 0.019600391387939453, 0.02146148681640625, 0.023322582244873047, 0.025183677673339844, 0.02704477310180664, 0.028905868530273438, 0.030766963958740234, 0.03262805938720703, 0.03448915481567383, 0.036350250244140625, 0.03821134567260742, 0.04007244110107422, 0.041933536529541016, 0.04379463195800781, 0.04565572738647461, 0.047516822814941406, 0.0493779182434082, 0.051239013671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 22.0, 18.0, 32.0, 34.0, 55.0, 86.0, 80.0, 106.0, 100.0, 94.0, 84.0, 80.0, 69.0, 42.0, 24.0, 29.0, 10.0, 8.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18100687861442566, -0.17542582750320435, -0.16984479129314423, -0.1642637550830841, -0.1586827039718628, -0.15310165286064148, -0.14752061665058136, -0.14193958044052124, -0.13635852932929993, -0.1307774782180786, -0.1251964420080185, -0.11961539834737778, -0.11403435468673706, -0.10845331102609634, -0.10287226736545563, -0.09729122370481491, -0.0917101800441742, -0.08612913638353348, -0.08054809272289276, -0.07496704906225204, -0.06938600540161133, -0.06380496174097061, -0.058223918080329895, -0.05264287441968918, -0.04706183075904846, -0.041480787098407745, -0.03589974343776703, -0.030318699777126312, -0.024737656116485596, -0.01915661245584488, -0.013575568795204163, -0.007994525134563446, -0.0024134814739227295, 0.003167562186717987, 0.008748605847358704, 0.01432964950799942, 0.019910693168640137, 0.025491736829280853, 0.03107278048992157, 0.036653824150562286, 0.042234867811203, 0.04781591147184372, 0.053396955132484436, 0.05897799879312515, 0.06455904245376587, 0.07014008611440659, 0.0757211297750473, 0.08130217343568802, 0.08688321709632874, 0.09246426075696945, 0.09804530441761017, 0.10362634807825089, 0.1092073917388916, 0.11478843539953232, 0.12036947906017303, 0.12595051527023315, 0.13153156638145447, 0.13711261749267578, 0.1426936537027359, 0.14827468991279602, 0.15385574102401733, 0.15943679213523865, 0.16501782834529877, 0.1705988645553589, 0.1761799156665802]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 10.0, 10.0, 13.0, 9.0, 22.0, 25.0, 19.0, 18.0, 32.0, 32.0, 33.0, 41.0, 39.0, 31.0, 40.0, 39.0, 37.0, 58.0, 43.0, 40.0, 43.0, 35.0, 34.0, 41.0, 39.0, 26.0, 32.0, 18.0, 29.0, 24.0, 20.0, 11.0, 13.0, 13.0, 7.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11744862794876099, -0.11380114406347275, -0.11015366017818451, -0.10650617629289627, -0.10285869240760803, -0.09921121597290039, -0.09556373208761215, -0.09191624820232391, -0.08826876431703568, -0.08462128043174744, -0.0809737965464592, -0.07732631266117096, -0.07367883622646332, -0.07003134489059448, -0.06638386845588684, -0.0627363845705986, -0.059088900685310364, -0.055441416800022125, -0.05179393291473389, -0.04814645275473595, -0.04449896886944771, -0.04085148498415947, -0.03720400482416153, -0.03355652093887329, -0.029909037053585052, -0.026261553168296814, -0.022614071145653725, -0.018966589123010635, -0.015319105237722397, -0.011671621352434158, -0.008024139329791069, -0.00437665730714798, -0.0007291734218597412, 0.0029183095321059227, 0.006565792486071587, 0.01021327544003725, 0.013860758394002914, 0.017508242279291153, 0.021155724301934242, 0.02480320632457733, 0.02845069020986557, 0.03209817409515381, 0.03574565798044205, 0.03939313814043999, 0.043040622025728226, 0.046688105911016464, 0.050335586071014404, 0.05398306995630264, 0.05763055384159088, 0.06127803772687912, 0.06492552161216736, 0.0685730054974556, 0.07222048938274384, 0.07586796581745148, 0.07951544970273972, 0.08316293358802795, 0.08681041747331619, 0.09045790135860443, 0.09410538524389267, 0.09775286912918091, 0.10140034556388855, 0.10504783689975739, 0.10869531333446503, 0.11234279721975327, 0.1159902811050415]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 8.0, 12.0, 23.0, 18.0, 37.0, 48.0, 80.0, 111.0, 179.0, 310.0, 590.0, 1094.0, 2608.0, 6886.0, 24523.0, 138929.0, 612189.0, 212291.0, 33910.0, 8648.0, 3078.0, 1324.0, 658.0, 355.0, 232.0, 136.0, 77.0, 72.0, 26.0, 32.0, 19.0, 9.0, 11.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1331787109375, -0.1294384002685547, -0.12569808959960938, -0.12195777893066406, -0.11821746826171875, -0.11447715759277344, -0.11073684692382812, -0.10699653625488281, -0.1032562255859375, -0.09951591491699219, -0.09577560424804688, -0.09203529357910156, -0.08829498291015625, -0.08455467224121094, -0.08081436157226562, -0.07707405090332031, -0.073333740234375, -0.06959342956542969, -0.06585311889648438, -0.06211280822753906, -0.05837249755859375, -0.05463218688964844, -0.050891876220703125, -0.04715156555175781, -0.0434112548828125, -0.03967094421386719, -0.035930633544921875, -0.03219032287597656, -0.02845001220703125, -0.024709701538085938, -0.020969390869140625, -0.017229080200195312, -0.01348876953125, -0.009748458862304688, -0.006008148193359375, -0.0022678375244140625, 0.00147247314453125, 0.0052127838134765625, 0.008953094482421875, 0.012693405151367188, 0.0164337158203125, 0.020174026489257812, 0.023914337158203125, 0.027654647827148438, 0.03139495849609375, 0.03513526916503906, 0.038875579833984375, 0.04261589050292969, 0.046356201171875, 0.05009651184082031, 0.053836822509765625, 0.05757713317871094, 0.06131744384765625, 0.06505775451660156, 0.06879806518554688, 0.07253837585449219, 0.0762786865234375, 0.08001899719238281, 0.08375930786132812, 0.08749961853027344, 0.09123992919921875, 0.09498023986816406, 0.09872055053710938, 0.10246086120605469, 0.106201171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 8.0, 9.0, 12.0, 6.0, 12.0, 15.0, 18.0, 23.0, 20.0, 23.0, 37.0, 40.0, 49.0, 48.0, 67.0, 62.0, 49.0, 63.0, 57.0, 56.0, 50.0, 40.0, 28.0, 30.0, 35.0, 20.0, 22.0, 23.0, 15.0, 9.0, 10.0, 12.0, 3.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054534912109375, -0.052861690521240234, -0.05118846893310547, -0.0495152473449707, -0.04784202575683594, -0.04616880416870117, -0.044495582580566406, -0.04282236099243164, -0.041149139404296875, -0.03947591781616211, -0.037802696228027344, -0.03612947463989258, -0.03445625305175781, -0.03278303146362305, -0.03110980987548828, -0.029436588287353516, -0.02776336669921875, -0.026090145111083984, -0.02441692352294922, -0.022743701934814453, -0.021070480346679688, -0.019397258758544922, -0.017724037170410156, -0.01605081558227539, -0.014377593994140625, -0.01270437240600586, -0.011031150817871094, -0.009357929229736328, -0.0076847076416015625, -0.006011486053466797, -0.004338264465332031, -0.0026650428771972656, -0.0009918212890625, 0.0006814002990722656, 0.0023546218872070312, 0.004027843475341797, 0.0057010650634765625, 0.007374286651611328, 0.009047508239746094, 0.01072072982788086, 0.012393951416015625, 0.01406717300415039, 0.015740394592285156, 0.017413616180419922, 0.019086837768554688, 0.020760059356689453, 0.02243328094482422, 0.024106502532958984, 0.02577972412109375, 0.027452945709228516, 0.02912616729736328, 0.030799388885498047, 0.03247261047363281, 0.03414583206176758, 0.035819053649902344, 0.03749227523803711, 0.039165496826171875, 0.04083871841430664, 0.042511940002441406, 0.04418516159057617, 0.04585838317871094, 0.0475316047668457, 0.04920482635498047, 0.050878047943115234, 0.05255126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 10.0, 10.0, 19.0, 16.0, 17.0, 34.0, 38.0, 45.0, 74.0, 129.0, 382.0, 829.0, 2424.0, 7267.0, 23740.0, 76916.0, 216706.0, 360603.0, 234774.0, 85533.0, 26538.0, 7995.0, 2615.0, 956.0, 378.0, 194.0, 97.0, 58.0, 34.0, 23.0, 18.0, 14.0, 13.0, 9.0, 4.0, 11.0, 3.0, 4.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061187744140625, -0.05911684036254883, -0.057045936584472656, -0.054975032806396484, -0.05290412902832031, -0.05083322525024414, -0.04876232147216797, -0.0466914176940918, -0.044620513916015625, -0.04254961013793945, -0.04047870635986328, -0.03840780258178711, -0.03633689880371094, -0.034265995025634766, -0.032195091247558594, -0.030124187469482422, -0.02805328369140625, -0.025982379913330078, -0.023911476135253906, -0.021840572357177734, -0.019769668579101562, -0.01769876480102539, -0.01562786102294922, -0.013556957244873047, -0.011486053466796875, -0.009415149688720703, -0.007344245910644531, -0.005273342132568359, -0.0032024383544921875, -0.0011315345764160156, 0.0009393692016601562, 0.003010272979736328, 0.0050811767578125, 0.007152080535888672, 0.009222984313964844, 0.011293888092041016, 0.013364791870117188, 0.01543569564819336, 0.01750659942626953, 0.019577503204345703, 0.021648406982421875, 0.023719310760498047, 0.02579021453857422, 0.02786111831665039, 0.029932022094726562, 0.032002925872802734, 0.034073829650878906, 0.03614473342895508, 0.03821563720703125, 0.04028654098510742, 0.042357444763183594, 0.044428348541259766, 0.04649925231933594, 0.04857015609741211, 0.05064105987548828, 0.05271196365356445, 0.054782867431640625, 0.0568537712097168, 0.05892467498779297, 0.06099557876586914, 0.06306648254394531, 0.06513738632202148, 0.06720829010009766, 0.06927919387817383, 0.07135009765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 9.0, 13.0, 11.0, 19.0, 16.0, 23.0, 26.0, 28.0, 22.0, 32.0, 29.0, 32.0, 41.0, 31.0, 42.0, 46.0, 32.0, 34.0, 47.0, 43.0, 42.0, 31.0, 31.0, 32.0, 33.0, 28.0, 35.0, 22.0, 14.0, 19.0, 14.0, 23.0, 17.0, 13.0, 12.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.1107177734375, -0.1074228286743164, -0.10412788391113281, -0.10083293914794922, -0.09753799438476562, -0.09424304962158203, -0.09094810485839844, -0.08765316009521484, -0.08435821533203125, -0.08106327056884766, -0.07776832580566406, -0.07447338104248047, -0.07117843627929688, -0.06788349151611328, -0.06458854675292969, -0.061293601989746094, -0.0579986572265625, -0.054703712463378906, -0.05140876770019531, -0.04811382293701172, -0.044818878173828125, -0.04152393341064453, -0.03822898864746094, -0.034934043884277344, -0.03163909912109375, -0.028344154357910156, -0.025049209594726562, -0.02175426483154297, -0.018459320068359375, -0.015164375305175781, -0.011869430541992188, -0.008574485778808594, -0.005279541015625, -0.0019845962524414062, 0.0013103485107421875, 0.004605293273925781, 0.007900238037109375, 0.011195182800292969, 0.014490127563476562, 0.017785072326660156, 0.02108001708984375, 0.024374961853027344, 0.027669906616210938, 0.03096485137939453, 0.034259796142578125, 0.03755474090576172, 0.04084968566894531, 0.044144630432128906, 0.0474395751953125, 0.050734519958496094, 0.05402946472167969, 0.05732440948486328, 0.060619354248046875, 0.06391429901123047, 0.06720924377441406, 0.07050418853759766, 0.07379913330078125, 0.07709407806396484, 0.08038902282714844, 0.08368396759033203, 0.08697891235351562, 0.09027385711669922, 0.09356880187988281, 0.0968637466430664, 0.10015869140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 6.0, 5.0, 10.0, 14.0, 18.0, 26.0, 52.0, 72.0, 153.0, 276.0, 602.0, 1120.0, 2644.0, 6975.0, 25793.0, 140635.0, 521971.0, 279940.0, 50031.0, 11332.0, 3734.0, 1564.0, 726.0, 330.0, 213.0, 124.0, 63.0, 32.0, 19.0, 18.0, 11.0, 11.0, 8.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.030364990234375, -0.02937602996826172, -0.028387069702148438, -0.027398109436035156, -0.026409149169921875, -0.025420188903808594, -0.024431228637695312, -0.02344226837158203, -0.02245330810546875, -0.02146434783935547, -0.020475387573242188, -0.019486427307128906, -0.018497467041015625, -0.017508506774902344, -0.016519546508789062, -0.015530586242675781, -0.0145416259765625, -0.013552665710449219, -0.012563705444335938, -0.011574745178222656, -0.010585784912109375, -0.009596824645996094, -0.008607864379882812, -0.007618904113769531, -0.00662994384765625, -0.005640983581542969, -0.0046520233154296875, -0.0036630630493164062, -0.002674102783203125, -0.0016851425170898438, -0.0006961822509765625, 0.00029277801513671875, 0.00128173828125, 0.0022706985473632812, 0.0032596588134765625, 0.004248619079589844, 0.005237579345703125, 0.006226539611816406, 0.0072154998779296875, 0.008204460144042969, 0.00919342041015625, 0.010182380676269531, 0.011171340942382812, 0.012160301208496094, 0.013149261474609375, 0.014138221740722656, 0.015127182006835938, 0.01611614227294922, 0.0171051025390625, 0.01809406280517578, 0.019083023071289062, 0.020071983337402344, 0.021060943603515625, 0.022049903869628906, 0.023038864135742188, 0.02402782440185547, 0.02501678466796875, 0.02600574493408203, 0.026994705200195312, 0.027983665466308594, 0.028972625732421875, 0.029961585998535156, 0.030950546264648438, 0.03193950653076172, 0.032928466796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 10.0, 15.0, 25.0, 32.0, 45.0, 49.0, 89.0, 98.0, 118.0, 113.0, 96.0, 110.0, 51.0, 46.0, 28.0, 23.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2099742889404297e-05, -1.1682510375976562e-05, -1.1265277862548828e-05, -1.0848045349121094e-05, -1.043081283569336e-05, -1.0013580322265625e-05, -9.59634780883789e-06, -9.179115295410156e-06, -8.761882781982422e-06, -8.344650268554688e-06, -7.927417755126953e-06, -7.510185241699219e-06, -7.092952728271484e-06, -6.67572021484375e-06, -6.258487701416016e-06, -5.841255187988281e-06, -5.424022674560547e-06, -5.0067901611328125e-06, -4.589557647705078e-06, -4.172325134277344e-06, -3.7550926208496094e-06, -3.337860107421875e-06, -2.9206275939941406e-06, -2.5033950805664062e-06, -2.086162567138672e-06, -1.6689300537109375e-06, -1.2516975402832031e-06, -8.344650268554688e-07, -4.172325134277344e-07, 0.0, 4.172325134277344e-07, 8.344650268554688e-07, 1.2516975402832031e-06, 1.6689300537109375e-06, 2.086162567138672e-06, 2.5033950805664062e-06, 2.9206275939941406e-06, 3.337860107421875e-06, 3.7550926208496094e-06, 4.172325134277344e-06, 4.589557647705078e-06, 5.0067901611328125e-06, 5.424022674560547e-06, 5.841255187988281e-06, 6.258487701416016e-06, 6.67572021484375e-06, 7.092952728271484e-06, 7.510185241699219e-06, 7.927417755126953e-06, 8.344650268554688e-06, 8.761882781982422e-06, 9.179115295410156e-06, 9.59634780883789e-06, 1.0013580322265625e-05, 1.043081283569336e-05, 1.0848045349121094e-05, 1.1265277862548828e-05, 1.1682510375976562e-05, 1.2099742889404297e-05, 1.2516975402832031e-05, 1.2934207916259766e-05, 1.33514404296875e-05, 1.3768672943115234e-05, 1.4185905456542969e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 6.0, 11.0, 13.0, 22.0, 22.0, 34.0, 56.0, 78.0, 113.0, 148.0, 266.0, 388.0, 703.0, 1106.0, 1866.0, 3639.0, 8008.0, 21828.0, 72600.0, 262066.0, 433176.0, 168766.0, 45635.0, 15075.0, 6081.0, 2861.0, 1510.0, 926.0, 565.0, 313.0, 216.0, 144.0, 92.0, 70.0, 41.0, 36.0, 21.0, 9.0, 13.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02606201171875, -0.025255680084228516, -0.02444934844970703, -0.023643016815185547, -0.022836685180664062, -0.022030353546142578, -0.021224021911621094, -0.02041769027709961, -0.019611358642578125, -0.01880502700805664, -0.017998695373535156, -0.017192363739013672, -0.016386032104492188, -0.015579700469970703, -0.014773368835449219, -0.013967037200927734, -0.01316070556640625, -0.012354373931884766, -0.011548042297363281, -0.010741710662841797, -0.009935379028320312, -0.009129047393798828, -0.008322715759277344, -0.007516384124755859, -0.006710052490234375, -0.005903720855712891, -0.005097389221191406, -0.004291057586669922, -0.0034847259521484375, -0.002678394317626953, -0.0018720626831054688, -0.0010657310485839844, -0.0002593994140625, 0.0005469322204589844, 0.0013532638549804688, 0.002159595489501953, 0.0029659271240234375, 0.003772258758544922, 0.004578590393066406, 0.005384922027587891, 0.006191253662109375, 0.006997585296630859, 0.007803916931152344, 0.008610248565673828, 0.009416580200195312, 0.010222911834716797, 0.011029243469238281, 0.011835575103759766, 0.01264190673828125, 0.013448238372802734, 0.014254570007324219, 0.015060901641845703, 0.015867233276367188, 0.016673564910888672, 0.017479896545410156, 0.01828622817993164, 0.019092559814453125, 0.01989889144897461, 0.020705223083496094, 0.021511554718017578, 0.022317886352539062, 0.023124217987060547, 0.02393054962158203, 0.024736881256103516, 0.025543212890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 11.0, 11.0, 14.0, 7.0, 14.0, 22.0, 34.0, 41.0, 48.0, 62.0, 74.0, 79.0, 88.0, 88.0, 67.0, 76.0, 49.0, 41.0, 36.0, 27.0, 19.0, 16.0, 15.0, 15.0, 2.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0259552001953125, -0.025131702423095703, -0.024308204650878906, -0.02348470687866211, -0.022661209106445312, -0.021837711334228516, -0.02101421356201172, -0.020190715789794922, -0.019367218017578125, -0.018543720245361328, -0.01772022247314453, -0.016896724700927734, -0.016073226928710938, -0.01524972915649414, -0.014426231384277344, -0.013602733612060547, -0.01277923583984375, -0.011955738067626953, -0.011132240295410156, -0.01030874252319336, -0.009485244750976562, -0.008661746978759766, -0.007838249206542969, -0.007014751434326172, -0.006191253662109375, -0.005367755889892578, -0.004544258117675781, -0.0037207603454589844, -0.0028972625732421875, -0.0020737648010253906, -0.0012502670288085938, -0.0004267692565917969, 0.000396728515625, 0.0012202262878417969, 0.0020437240600585938, 0.0028672218322753906, 0.0036907196044921875, 0.004514217376708984, 0.005337715148925781, 0.006161212921142578, 0.006984710693359375, 0.007808208465576172, 0.008631706237792969, 0.009455204010009766, 0.010278701782226562, 0.01110219955444336, 0.011925697326660156, 0.012749195098876953, 0.01357269287109375, 0.014396190643310547, 0.015219688415527344, 0.01604318618774414, 0.016866683959960938, 0.017690181732177734, 0.01851367950439453, 0.019337177276611328, 0.020160675048828125, 0.020984172821044922, 0.02180767059326172, 0.022631168365478516, 0.023454666137695312, 0.02427816390991211, 0.025101661682128906, 0.025925159454345703, 0.0267486572265625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 26.0, 47.0, 88.0, 138.0, 199.0, 200.0, 129.0, 79.0, 48.0, 20.0, 9.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0309042930603027, -1.0102287530899048, -0.9895532131195068, -0.9688776135444641, -0.9482020735740662, -0.9275265336036682, -0.9068509340286255, -0.8861753940582275, -0.8654998540878296, -0.8448243141174316, -0.8241487741470337, -0.803473174571991, -0.782797634601593, -0.7621220946311951, -0.7414464950561523, -0.7207709550857544, -0.7000954151153564, -0.6794198751449585, -0.6587443351745605, -0.6380687355995178, -0.6173931956291199, -0.5967176556587219, -0.5760420560836792, -0.5553665161132812, -0.5346909761428833, -0.5140154361724854, -0.493339866399765, -0.4726642966270447, -0.45198875665664673, -0.4313132166862488, -0.41063764691352844, -0.3899620771408081, -0.36928659677505493, -0.348611056804657, -0.32793548703193665, -0.3072599172592163, -0.28658437728881836, -0.2659088373184204, -0.24523326754570007, -0.22455771267414093, -0.2038821578025818, -0.18320660293102264, -0.1625310480594635, -0.14185549318790436, -0.12117993831634521, -0.10050438344478607, -0.07982882857322693, -0.059153273701667786, -0.03847771883010864, -0.0178021639585495, 0.0028733909130096436, 0.023548945784568787, 0.04422450065612793, 0.06490005552768707, 0.08557561039924622, 0.10625116527080536, 0.1269267201423645, 0.14760227501392365, 0.1682778298854828, 0.18895338475704193, 0.20962893962860107, 0.23030449450016022, 0.25098004937171936, 0.2716556191444397, 0.29233115911483765]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 10.0, 6.0, 14.0, 12.0, 12.0, 10.0, 28.0, 27.0, 35.0, 35.0, 36.0, 43.0, 39.0, 40.0, 43.0, 45.0, 46.0, 55.0, 53.0, 38.0, 56.0, 37.0, 37.0, 23.0, 35.0, 21.0, 28.0, 17.0, 16.0, 20.0, 17.0, 16.0, 11.0, 10.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.7101544141769409, -0.6902002692222595, -0.6702460646629333, -0.650291919708252, -0.6303377151489258, -0.6103835701942444, -0.5904293656349182, -0.5704752206802368, -0.5505210161209106, -0.5305668711662292, -0.5106126666069031, -0.4906584918498993, -0.4707043170928955, -0.4507501423358917, -0.43079596757888794, -0.41084182262420654, -0.39088764786720276, -0.370933473110199, -0.3509792983531952, -0.3310251235961914, -0.3110709488391876, -0.29111677408218384, -0.27116262912750244, -0.25120842456817627, -0.23125426471233368, -0.2113000899553299, -0.1913459151983261, -0.17139175534248352, -0.15143758058547974, -0.13148340582847595, -0.11152923107147217, -0.09157505631446838, -0.0716208815574646, -0.051666706800460815, -0.03171253576874733, -0.011758364737033844, 0.00819581001996994, 0.028149984776973724, 0.04810415208339691, 0.0680583268404007, 0.08801250159740448, 0.10796667635440826, 0.12792085111141205, 0.14787501096725464, 0.16782918572425842, 0.1877833604812622, 0.207737535238266, 0.22769170999526978, 0.24764588475227356, 0.26760005950927734, 0.28755423426628113, 0.3075084090232849, 0.3274625837802887, 0.3474167585372925, 0.3673709034919739, 0.38732510805130005, 0.40727925300598145, 0.42723342776298523, 0.447187602519989, 0.4671417772769928, 0.4870959520339966, 0.507050096988678, 0.5270043015480042, 0.5469584465026855, 0.5669126510620117]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 6.0, 17.0, 17.0, 29.0, 39.0, 51.0, 103.0, 159.0, 320.0, 823.0, 2550.0, 12117.0, 156439.0, 3832636.0, 172656.0, 12475.0, 2372.0, 752.0, 312.0, 131.0, 75.0, 54.0, 32.0, 21.0, 25.0, 11.0, 9.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29515838623046875, -0.2866058349609375, -0.27805328369140625, -0.269500732421875, -0.26094818115234375, -0.2523956298828125, -0.24384307861328125, -0.23529052734375, -0.22673797607421875, -0.2181854248046875, -0.20963287353515625, -0.201080322265625, -0.19252777099609375, -0.1839752197265625, -0.17542266845703125, -0.1668701171875, -0.15831756591796875, -0.1497650146484375, -0.14121246337890625, -0.132659912109375, -0.12410736083984375, -0.1155548095703125, -0.10700225830078125, -0.09844970703125, -0.08989715576171875, -0.0813446044921875, -0.07279205322265625, -0.064239501953125, -0.05568695068359375, -0.0471343994140625, -0.03858184814453125, -0.030029296875, -0.02147674560546875, -0.0129241943359375, -0.00437164306640625, 0.004180908203125, 0.01273345947265625, 0.0212860107421875, 0.02983856201171875, 0.03839111328125, 0.04694366455078125, 0.0554962158203125, 0.06404876708984375, 0.072601318359375, 0.08115386962890625, 0.0897064208984375, 0.09825897216796875, 0.1068115234375, 0.11536407470703125, 0.1239166259765625, 0.13246917724609375, 0.141021728515625, 0.14957427978515625, 0.1581268310546875, 0.16667938232421875, 0.17523193359375, 0.18378448486328125, 0.1923370361328125, 0.20088958740234375, 0.209442138671875, 0.21799468994140625, 0.2265472412109375, 0.23509979248046875, 0.24365234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 4.0, 10.0, 5.0, 8.0, 18.0, 17.0, 21.0, 28.0, 34.0, 33.0, 48.0, 46.0, 66.0, 68.0, 70.0, 69.0, 69.0, 52.0, 51.0, 58.0, 40.0, 37.0, 34.0, 21.0, 16.0, 21.0, 12.0, 7.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0823974609375, -0.08034896850585938, -0.07830047607421875, -0.07625198364257812, -0.0742034912109375, -0.07215499877929688, -0.07010650634765625, -0.06805801391601562, -0.066009521484375, -0.06396102905273438, -0.06191253662109375, -0.059864044189453125, -0.0578155517578125, -0.055767059326171875, -0.05371856689453125, -0.051670074462890625, -0.04962158203125, -0.047573089599609375, -0.04552459716796875, -0.043476104736328125, -0.0414276123046875, -0.039379119873046875, -0.03733062744140625, -0.035282135009765625, -0.033233642578125, -0.031185150146484375, -0.02913665771484375, -0.027088165283203125, -0.0250396728515625, -0.022991180419921875, -0.02094268798828125, -0.018894195556640625, -0.016845703125, -0.014797210693359375, -0.01274871826171875, -0.010700225830078125, -0.0086517333984375, -0.006603240966796875, -0.00455474853515625, -0.002506256103515625, -0.000457763671875, 0.001590728759765625, 0.00363922119140625, 0.005687713623046875, 0.0077362060546875, 0.009784698486328125, 0.01183319091796875, 0.013881683349609375, 0.01593017578125, 0.017978668212890625, 0.02002716064453125, 0.022075653076171875, 0.0241241455078125, 0.026172637939453125, 0.02822113037109375, 0.030269622802734375, 0.032318115234375, 0.034366607666015625, 0.03641510009765625, 0.038463592529296875, 0.0405120849609375, 0.042560577392578125, 0.04460906982421875, 0.046657562255859375, 0.0487060546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 7.0, 8.0, 20.0, 22.0, 46.0, 61.0, 95.0, 198.0, 382.0, 734.0, 1508.0, 3667.0, 8910.0, 24323.0, 78673.0, 299637.0, 1382216.0, 1827941.0, 412369.0, 103099.0, 31026.0, 11069.0, 4454.0, 1951.0, 868.0, 443.0, 250.0, 125.0, 72.0, 40.0, 14.0, 20.0, 11.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09185791015625, -0.08870220184326172, -0.08554649353027344, -0.08239078521728516, -0.07923507690429688, -0.0760793685913086, -0.07292366027832031, -0.06976795196533203, -0.06661224365234375, -0.06345653533935547, -0.06030082702636719, -0.057145118713378906, -0.053989410400390625, -0.050833702087402344, -0.04767799377441406, -0.04452228546142578, -0.0413665771484375, -0.03821086883544922, -0.03505516052246094, -0.031899452209472656, -0.028743743896484375, -0.025588035583496094, -0.022432327270507812, -0.01927661895751953, -0.01612091064453125, -0.012965202331542969, -0.009809494018554688, -0.006653785705566406, -0.003498077392578125, -0.00034236907958984375, 0.0028133392333984375, 0.005969047546386719, 0.009124755859375, 0.012280464172363281, 0.015436172485351562, 0.018591880798339844, 0.021747589111328125, 0.024903297424316406, 0.028059005737304688, 0.03121471405029297, 0.03437042236328125, 0.03752613067626953, 0.04068183898925781, 0.043837547302246094, 0.046993255615234375, 0.050148963928222656, 0.05330467224121094, 0.05646038055419922, 0.0596160888671875, 0.06277179718017578, 0.06592750549316406, 0.06908321380615234, 0.07223892211914062, 0.0753946304321289, 0.07855033874511719, 0.08170604705810547, 0.08486175537109375, 0.08801746368408203, 0.09117317199707031, 0.0943288803100586, 0.09748458862304688, 0.10064029693603516, 0.10379600524902344, 0.10695171356201172, 0.110107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 8.0, 7.0, 21.0, 19.0, 33.0, 42.0, 52.0, 81.0, 141.0, 222.0, 326.0, 514.0, 755.0, 598.0, 432.0, 271.0, 158.0, 108.0, 96.0, 54.0, 32.0, 25.0, 25.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0732421875, -0.07077598571777344, -0.06830978393554688, -0.06584358215332031, -0.06337738037109375, -0.06091117858886719, -0.058444976806640625, -0.05597877502441406, -0.0535125732421875, -0.05104637145996094, -0.048580169677734375, -0.04611396789550781, -0.04364776611328125, -0.04118156433105469, -0.038715362548828125, -0.03624916076660156, -0.033782958984375, -0.03131675720214844, -0.028850555419921875, -0.026384353637695312, -0.02391815185546875, -0.021451950073242188, -0.018985748291015625, -0.016519546508789062, -0.0140533447265625, -0.011587142944335938, -0.009120941162109375, -0.0066547393798828125, -0.00418853759765625, -0.0017223358154296875, 0.000743865966796875, 0.0032100677490234375, 0.00567626953125, 0.008142471313476562, 0.010608673095703125, 0.013074874877929688, 0.01554107666015625, 0.018007278442382812, 0.020473480224609375, 0.022939682006835938, 0.0254058837890625, 0.027872085571289062, 0.030338287353515625, 0.03280448913574219, 0.03527069091796875, 0.03773689270019531, 0.040203094482421875, 0.04266929626464844, 0.045135498046875, 0.04760169982910156, 0.050067901611328125, 0.05253410339355469, 0.05500030517578125, 0.05746650695800781, 0.059932708740234375, 0.06239891052246094, 0.0648651123046875, 0.06733131408691406, 0.06979751586914062, 0.07226371765136719, 0.07472991943359375, 0.07719612121582031, 0.07966232299804688, 0.08212852478027344, 0.0845947265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 17.0, 16.0, 32.0, 51.0, 111.0, 94.0, 140.0, 132.0, 124.0, 76.0, 82.0, 50.0, 31.0, 13.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3740333616733551, -0.36342811584472656, -0.3528228998184204, -0.34221765398979187, -0.33161240816116333, -0.3210071921348572, -0.31040194630622864, -0.2997967004776001, -0.28919148445129395, -0.2785862386226654, -0.26798102259635925, -0.2573757767677307, -0.24677053093910217, -0.23616530001163483, -0.22556006908416748, -0.21495482325553894, -0.2043495774269104, -0.19374434649944305, -0.18313910067081451, -0.17253386974334717, -0.16192862391471863, -0.15132339298725128, -0.14071816205978394, -0.1301129162311554, -0.11950768530368805, -0.1089024469256401, -0.09829720854759216, -0.08769197762012482, -0.07708673924207687, -0.06648150086402893, -0.055876269936561584, -0.04527103155851364, -0.034665822982788086, -0.024060586467385292, -0.013455349951982498, -0.0028501152992248535, 0.00775512307882309, 0.018360361456871033, 0.02896559238433838, 0.03957083076238632, 0.050176069140434265, 0.06078130751848221, 0.07138654589653015, 0.0819917768239975, 0.09259701520204544, 0.10320225358009338, 0.11380748450756073, 0.12441272288560867, 0.13501796126365662, 0.14562319219112396, 0.1562284380197525, 0.16683366894721985, 0.1774389147758484, 0.18804414570331573, 0.19864937663078308, 0.20925462245941162, 0.21985985338687897, 0.2304650843143463, 0.24107033014297485, 0.251675546169281, 0.26228079199790955, 0.2728860378265381, 0.28349125385284424, 0.2940964996814728, 0.3047017455101013]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 8.0, 12.0, 12.0, 19.0, 17.0, 26.0, 44.0, 44.0, 42.0, 51.0, 58.0, 56.0, 58.0, 72.0, 52.0, 59.0, 48.0, 52.0, 48.0, 48.0, 26.0, 35.0, 26.0, 18.0, 23.0, 10.0, 6.0, 6.0, 11.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.3357384204864502, -0.3276660442352295, -0.3195936679840088, -0.3115212917327881, -0.3034489154815674, -0.2953765392303467, -0.287304162979126, -0.2792317867279053, -0.27115941047668457, -0.26308703422546387, -0.25501465797424316, -0.24694228172302246, -0.23886990547180176, -0.23079752922058105, -0.22272516787052155, -0.21465279161930084, -0.20658043026924133, -0.19850805401802063, -0.19043567776679993, -0.18236330151557922, -0.17429092526435852, -0.16621854901313782, -0.1581461876630783, -0.1500738114118576, -0.1420014351606369, -0.1339290589094162, -0.1258566826581955, -0.11778431385755539, -0.10971193760633469, -0.10163956135511398, -0.09356719255447388, -0.08549481630325317, -0.07742244005203247, -0.06935006380081177, -0.06127769127488136, -0.05320531874895096, -0.045132942497730255, -0.03706056624650955, -0.028988193720579147, -0.020915821194648743, -0.01284344494342804, -0.004771070554852486, 0.0033013038337230682, 0.011373678222298622, 0.019446052610874176, 0.02751842886209488, 0.035590801388025284, 0.04366317391395569, 0.05173555016517639, 0.059807926416397095, 0.0678803026676178, 0.0759526714682579, 0.08402504771947861, 0.09209742397069931, 0.10016979277133942, 0.10824216902256012, 0.11631454527378082, 0.12438692152500153, 0.13245929777622223, 0.14053167402744293, 0.14860403537750244, 0.15667641162872314, 0.16474878787994385, 0.17282116413116455, 0.18089354038238525]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 9.0, 9.0, 20.0, 23.0, 50.0, 60.0, 96.0, 149.0, 224.0, 325.0, 552.0, 897.0, 1577.0, 2956.0, 5736.0, 11203.0, 24052.0, 54527.0, 131845.0, 281421.0, 288133.0, 137928.0, 56992.0, 24749.0, 11758.0, 5898.0, 3153.0, 1738.0, 911.0, 587.0, 330.0, 233.0, 151.0, 90.0, 67.0, 36.0, 28.0, 16.0, 13.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08868408203125, -0.08607769012451172, -0.08347129821777344, -0.08086490631103516, -0.07825851440429688, -0.0756521224975586, -0.07304573059082031, -0.07043933868408203, -0.06783294677734375, -0.06522655487060547, -0.06262016296386719, -0.060013771057128906, -0.057407379150390625, -0.054800987243652344, -0.05219459533691406, -0.04958820343017578, -0.0469818115234375, -0.04437541961669922, -0.04176902770996094, -0.039162635803222656, -0.036556243896484375, -0.033949851989746094, -0.03134346008300781, -0.02873706817626953, -0.02613067626953125, -0.02352428436279297, -0.020917892456054688, -0.018311500549316406, -0.015705108642578125, -0.013098716735839844, -0.010492324829101562, -0.007885932922363281, -0.005279541015625, -0.0026731491088867188, -6.67572021484375e-05, 0.0025396347045898438, 0.005146026611328125, 0.007752418518066406, 0.010358810424804688, 0.012965202331542969, 0.01557159423828125, 0.01817798614501953, 0.020784378051757812, 0.023390769958496094, 0.025997161865234375, 0.028603553771972656, 0.031209945678710938, 0.03381633758544922, 0.0364227294921875, 0.03902912139892578, 0.04163551330566406, 0.044241905212402344, 0.046848297119140625, 0.049454689025878906, 0.05206108093261719, 0.05466747283935547, 0.05727386474609375, 0.05988025665283203, 0.06248664855957031, 0.0650930404663086, 0.06769943237304688, 0.07030582427978516, 0.07291221618652344, 0.07551860809326172, 0.078125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 4.0, 8.0, 3.0, 14.0, 14.0, 11.0, 7.0, 16.0, 14.0, 26.0, 21.0, 27.0, 26.0, 43.0, 52.0, 53.0, 56.0, 53.0, 53.0, 50.0, 53.0, 51.0, 46.0, 38.0, 38.0, 35.0, 25.0, 34.0, 27.0, 19.0, 14.0, 13.0, 12.0, 12.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.062255859375, -0.0606536865234375, -0.059051513671875, -0.0574493408203125, -0.05584716796875, -0.0542449951171875, -0.052642822265625, -0.0510406494140625, -0.0494384765625, -0.0478363037109375, -0.046234130859375, -0.0446319580078125, -0.04302978515625, -0.0414276123046875, -0.039825439453125, -0.0382232666015625, -0.03662109375, -0.0350189208984375, -0.033416748046875, -0.0318145751953125, -0.03021240234375, -0.0286102294921875, -0.027008056640625, -0.0254058837890625, -0.0238037109375, -0.0222015380859375, -0.020599365234375, -0.0189971923828125, -0.01739501953125, -0.0157928466796875, -0.014190673828125, -0.0125885009765625, -0.010986328125, -0.0093841552734375, -0.007781982421875, -0.0061798095703125, -0.00457763671875, -0.0029754638671875, -0.001373291015625, 0.0002288818359375, 0.0018310546875, 0.0034332275390625, 0.005035400390625, 0.0066375732421875, 0.00823974609375, 0.0098419189453125, 0.011444091796875, 0.0130462646484375, 0.0146484375, 0.0162506103515625, 0.017852783203125, 0.0194549560546875, 0.02105712890625, 0.0226593017578125, 0.024261474609375, 0.0258636474609375, 0.0274658203125, 0.0290679931640625, 0.030670166015625, 0.0322723388671875, 0.03387451171875, 0.0354766845703125, 0.037078857421875, 0.0386810302734375, 0.040283203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 13.0, 7.0, 8.0, 14.0, 13.0, 15.0, 15.0, 29.0, 31.0, 32.0, 37.0, 37.0, 46.0, 77.0, 182.0, 501.0, 3859.0, 90089.0, 894774.0, 54969.0, 2832.0, 457.0, 132.0, 65.0, 44.0, 39.0, 21.0, 31.0, 22.0, 18.0, 16.0, 16.0, 14.0, 16.0, 12.0, 10.0, 11.0, 10.0, 9.0, 1.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.436279296875, -0.42282867431640625, -0.4093780517578125, -0.39592742919921875, -0.382476806640625, -0.36902618408203125, -0.3555755615234375, -0.34212493896484375, -0.32867431640625, -0.31522369384765625, -0.3017730712890625, -0.28832244873046875, -0.274871826171875, -0.26142120361328125, -0.2479705810546875, -0.23451995849609375, -0.2210693359375, -0.20761871337890625, -0.1941680908203125, -0.18071746826171875, -0.167266845703125, -0.15381622314453125, -0.1403656005859375, -0.12691497802734375, -0.11346435546875, -0.10001373291015625, -0.0865631103515625, -0.07311248779296875, -0.059661865234375, -0.04621124267578125, -0.0327606201171875, -0.01930999755859375, -0.005859375, 0.00759124755859375, 0.0210418701171875, 0.03449249267578125, 0.047943115234375, 0.06139373779296875, 0.0748443603515625, 0.08829498291015625, 0.10174560546875, 0.11519622802734375, 0.1286468505859375, 0.14209747314453125, 0.155548095703125, 0.16899871826171875, 0.1824493408203125, 0.19589996337890625, 0.2093505859375, 0.22280120849609375, 0.2362518310546875, 0.24970245361328125, 0.263153076171875, 0.27660369873046875, 0.2900543212890625, 0.30350494384765625, 0.31695556640625, 0.33040618896484375, 0.3438568115234375, 0.35730743408203125, 0.370758056640625, 0.38420867919921875, 0.3976593017578125, 0.41110992431640625, 0.424560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 14.0, 8.0, 13.0, 4.0, 16.0, 18.0, 19.0, 24.0, 35.0, 31.0, 36.0, 40.0, 36.0, 46.0, 42.0, 45.0, 43.0, 47.0, 59.0, 45.0, 46.0, 44.0, 30.0, 28.0, 37.0, 26.0, 26.0, 20.0, 15.0, 16.0, 15.0, 14.0, 16.0, 10.0, 12.0, 2.0, 3.0, 8.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1048583984375, -0.10162162780761719, -0.09838485717773438, -0.09514808654785156, -0.09191131591796875, -0.08867454528808594, -0.08543777465820312, -0.08220100402832031, -0.0789642333984375, -0.07572746276855469, -0.07249069213867188, -0.06925392150878906, -0.06601715087890625, -0.06278038024902344, -0.059543609619140625, -0.05630683898925781, -0.053070068359375, -0.04983329772949219, -0.046596527099609375, -0.04335975646972656, -0.04012298583984375, -0.03688621520996094, -0.033649444580078125, -0.030412673950195312, -0.0271759033203125, -0.023939132690429688, -0.020702362060546875, -0.017465591430664062, -0.01422882080078125, -0.010992050170898438, -0.007755279541015625, -0.0045185089111328125, -0.00128173828125, 0.0019550323486328125, 0.005191802978515625, 0.008428573608398438, 0.01166534423828125, 0.014902114868164062, 0.018138885498046875, 0.021375656127929688, 0.0246124267578125, 0.027849197387695312, 0.031085968017578125, 0.03432273864746094, 0.03755950927734375, 0.04079627990722656, 0.044033050537109375, 0.04726982116699219, 0.050506591796875, 0.05374336242675781, 0.056980133056640625, 0.06021690368652344, 0.06345367431640625, 0.06669044494628906, 0.06992721557617188, 0.07316398620605469, 0.0764007568359375, 0.07963752746582031, 0.08287429809570312, 0.08611106872558594, 0.08934783935546875, 0.09258460998535156, 0.09582138061523438, 0.09905815124511719, 0.102294921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 9.0, 21.0, 31.0, 38.0, 52.0, 72.0, 101.0, 167.0, 269.0, 376.0, 688.0, 1312.0, 2648.0, 5247.0, 11622.0, 28140.0, 81442.0, 243267.0, 385320.0, 186739.0, 60322.0, 22011.0, 9363.0, 4278.0, 2182.0, 1166.0, 610.0, 380.0, 202.0, 136.0, 86.0, 62.0, 32.0, 35.0, 25.0, 17.0, 13.0, 12.0, 3.0, 4.0, 6.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.04815673828125, -0.04666900634765625, -0.0451812744140625, -0.04369354248046875, -0.042205810546875, -0.04071807861328125, -0.0392303466796875, -0.03774261474609375, -0.0362548828125, -0.03476715087890625, -0.0332794189453125, -0.03179168701171875, -0.030303955078125, -0.02881622314453125, -0.0273284912109375, -0.02584075927734375, -0.02435302734375, -0.02286529541015625, -0.0213775634765625, -0.01988983154296875, -0.018402099609375, -0.01691436767578125, -0.0154266357421875, -0.01393890380859375, -0.012451171875, -0.01096343994140625, -0.0094757080078125, -0.00798797607421875, -0.006500244140625, -0.00501251220703125, -0.0035247802734375, -0.00203704833984375, -0.00054931640625, 0.00093841552734375, 0.0024261474609375, 0.00391387939453125, 0.005401611328125, 0.00688934326171875, 0.0083770751953125, 0.00986480712890625, 0.0113525390625, 0.01284027099609375, 0.0143280029296875, 0.01581573486328125, 0.017303466796875, 0.01879119873046875, 0.0202789306640625, 0.02176666259765625, 0.02325439453125, 0.02474212646484375, 0.0262298583984375, 0.02771759033203125, 0.029205322265625, 0.03069305419921875, 0.0321807861328125, 0.03366851806640625, 0.03515625, 0.03664398193359375, 0.0381317138671875, 0.03961944580078125, 0.041107177734375, 0.04259490966796875, 0.0440826416015625, 0.04557037353515625, 0.04705810546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 16.0, 19.0, 25.0, 38.0, 83.0, 183.0, 173.0, 196.0, 111.0, 46.0, 28.0, 23.0, 9.0, 10.0, 10.0, 7.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5703182220458984e-05, -3.464147448539734e-05, -3.357976675033569e-05, -3.251805901527405e-05, -3.14563512802124e-05, -3.0394643545150757e-05, -2.933293581008911e-05, -2.8271228075027466e-05, -2.720952033996582e-05, -2.6147812604904175e-05, -2.508610486984253e-05, -2.4024397134780884e-05, -2.2962689399719238e-05, -2.1900981664657593e-05, -2.0839273929595947e-05, -1.9777566194534302e-05, -1.8715858459472656e-05, -1.765415072441101e-05, -1.6592442989349365e-05, -1.553073525428772e-05, -1.4469027519226074e-05, -1.3407319784164429e-05, -1.2345612049102783e-05, -1.1283904314041138e-05, -1.0222196578979492e-05, -9.160488843917847e-06, -8.098781108856201e-06, -7.037073373794556e-06, -5.97536563873291e-06, -4.913657903671265e-06, -3.851950168609619e-06, -2.7902424335479736e-06, -1.7285346984863281e-06, -6.668269634246826e-07, 3.948807716369629e-07, 1.4565885066986084e-06, 2.518296241760254e-06, 3.5800039768218994e-06, 4.641711711883545e-06, 5.7034194469451904e-06, 6.765127182006836e-06, 7.826834917068481e-06, 8.888542652130127e-06, 9.950250387191772e-06, 1.1011958122253418e-05, 1.2073665857315063e-05, 1.3135373592376709e-05, 1.4197081327438354e-05, 1.52587890625e-05, 1.6320496797561646e-05, 1.738220453262329e-05, 1.8443912267684937e-05, 1.9505620002746582e-05, 2.0567327737808228e-05, 2.1629035472869873e-05, 2.269074320793152e-05, 2.3752450942993164e-05, 2.481415867805481e-05, 2.5875866413116455e-05, 2.69375741481781e-05, 2.7999281883239746e-05, 2.906098961830139e-05, 3.0122697353363037e-05, 3.118440508842468e-05, 3.224611282348633e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 3.0, 3.0, 4.0, 10.0, 10.0, 14.0, 24.0, 21.0, 33.0, 54.0, 80.0, 268.0, 1281.0, 14965.0, 359704.0, 638935.0, 30242.0, 2261.0, 363.0, 90.0, 45.0, 36.0, 26.0, 21.0, 15.0, 12.0, 8.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10601806640625, -0.10261154174804688, -0.09920501708984375, -0.09579849243164062, -0.0923919677734375, -0.08898544311523438, -0.08557891845703125, -0.08217239379882812, -0.078765869140625, -0.07535934448242188, -0.07195281982421875, -0.06854629516601562, -0.0651397705078125, -0.061733245849609375, -0.05832672119140625, -0.054920196533203125, -0.051513671875, -0.048107147216796875, -0.04470062255859375, -0.041294097900390625, -0.0378875732421875, -0.034481048583984375, -0.03107452392578125, -0.027667999267578125, -0.024261474609375, -0.020854949951171875, -0.01744842529296875, -0.014041900634765625, -0.0106353759765625, -0.007228851318359375, -0.00382232666015625, -0.000415802001953125, 0.00299072265625, 0.006397247314453125, 0.00980377197265625, 0.013210296630859375, 0.0166168212890625, 0.020023345947265625, 0.02342987060546875, 0.026836395263671875, 0.030242919921875, 0.033649444580078125, 0.03705596923828125, 0.040462493896484375, 0.0438690185546875, 0.047275543212890625, 0.05068206787109375, 0.054088592529296875, 0.0574951171875, 0.060901641845703125, 0.06430816650390625, 0.06771469116210938, 0.0711212158203125, 0.07452774047851562, 0.07793426513671875, 0.08134078979492188, 0.084747314453125, 0.08815383911132812, 0.09156036376953125, 0.09496688842773438, 0.0983734130859375, 0.10177993774414062, 0.10518646240234375, 0.10859298706054688, 0.11199951171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 3.0, 11.0, 10.0, 16.0, 24.0, 15.0, 36.0, 39.0, 47.0, 66.0, 60.0, 57.0, 78.0, 71.0, 82.0, 85.0, 72.0, 49.0, 36.0, 26.0, 26.0, 25.0, 17.0, 10.0, 6.0, 6.0, 7.0, 0.0, 7.0, 2.0, 0.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0217437744140625, -0.021045684814453125, -0.02034759521484375, -0.019649505615234375, -0.018951416015625, -0.018253326416015625, -0.01755523681640625, -0.016857147216796875, -0.0161590576171875, -0.015460968017578125, -0.01476287841796875, -0.014064788818359375, -0.01336669921875, -0.012668609619140625, -0.01197052001953125, -0.011272430419921875, -0.0105743408203125, -0.009876251220703125, -0.00917816162109375, -0.008480072021484375, -0.007781982421875, -0.007083892822265625, -0.00638580322265625, -0.005687713623046875, -0.0049896240234375, -0.004291534423828125, -0.00359344482421875, -0.002895355224609375, -0.002197265625, -0.001499176025390625, -0.00080108642578125, -0.000102996826171875, 0.0005950927734375, 0.001293182373046875, 0.00199127197265625, 0.002689361572265625, 0.003387451171875, 0.004085540771484375, 0.00478363037109375, 0.005481719970703125, 0.0061798095703125, 0.006877899169921875, 0.00757598876953125, 0.008274078369140625, 0.00897216796875, 0.009670257568359375, 0.01036834716796875, 0.011066436767578125, 0.0117645263671875, 0.012462615966796875, 0.01316070556640625, 0.013858795166015625, 0.014556884765625, 0.015254974365234375, 0.01595306396484375, 0.016651153564453125, 0.0173492431640625, 0.018047332763671875, 0.01874542236328125, 0.019443511962890625, 0.0201416015625, 0.020839691162109375, 0.02153778076171875, 0.022235870361328125, 0.0229339599609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 45.0, 192.0, 465.0, 248.0, 41.0, 12.0, 2.0], "bins": [-2.3391597270965576, -2.2998971939086914, -2.260634422302246, -2.22137188911438, -2.1821093559265137, -2.1428468227386475, -2.1035842895507812, -2.064321517944336, -2.0250589847564697, -1.9857964515686035, -1.9465337991714478, -1.907271146774292, -1.8680086135864258, -1.8287460803985596, -1.7894834280014038, -1.750220775604248, -1.7109582424163818, -1.6716957092285156, -1.6324330568313599, -1.593170404434204, -1.553907871246338, -1.5146453380584717, -1.475382685661316, -1.4361200332641602, -1.396857500076294, -1.3575949668884277, -1.318332314491272, -1.2790696620941162, -1.23980712890625, -1.2005445957183838, -1.161281943321228, -1.1220192909240723, -1.0827568769454956, -1.0434942245483398, -1.0042316913604736, -0.9649690985679626, -0.9257065057754517, -0.8864439129829407, -0.8471813201904297, -0.8079187273979187, -0.7686561346054077, -0.7293935418128967, -0.6901309490203857, -0.6508683562278748, -0.6116057634353638, -0.5723431706428528, -0.5330805778503418, -0.4938179850578308, -0.45455536246299744, -0.41529276967048645, -0.37603017687797546, -0.3367675840854645, -0.2975049912929535, -0.2582423985004425, -0.21897980570793152, -0.17971721291542053, -0.14045462012290955, -0.10119202733039856, -0.06192943453788757, -0.022666841745376587, 0.0165957510471344, 0.055858343839645386, 0.09512093663215637, 0.13438352942466736, 0.17364612221717834]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 9.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 13.0, 15.0, 26.0, 25.0, 24.0, 28.0, 31.0, 33.0, 41.0, 43.0, 38.0, 50.0, 35.0, 50.0, 58.0, 47.0, 56.0, 43.0, 37.0, 37.0, 32.0, 32.0, 28.0, 24.0, 20.0, 14.0, 16.0, 10.0, 9.0, 9.0, 6.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33036017417907715, -0.3180713653564453, -0.3057825565338135, -0.29349371790885925, -0.2812049090862274, -0.2689161002635956, -0.25662729144096375, -0.24433846771717072, -0.23204964399337769, -0.21976083517074585, -0.20747201144695282, -0.19518320262432098, -0.18289437890052795, -0.17060557007789612, -0.15831676125526428, -0.14602793753147125, -0.13373912870883942, -0.12145031243562698, -0.10916149616241455, -0.09687268733978271, -0.08458386361598969, -0.07229505479335785, -0.060006238520145416, -0.04771742224693298, -0.03542860597372055, -0.023139789700508118, -0.010850975289940834, 0.0014378391206264496, 0.013726655393838882, 0.026015471667051315, 0.03830428421497345, 0.05059310048818588, 0.06288191676139832, 0.07517073303461075, 0.08745954930782318, 0.09974835813045502, 0.11203718185424805, 0.12432599067687988, 0.13661479949951172, 0.14890362322330475, 0.16119244694709778, 0.17348125576972961, 0.18577007949352264, 0.19805888831615448, 0.2103477120399475, 0.22263652086257935, 0.23492532968521118, 0.2472141534090042, 0.25950294733047485, 0.2717917561531067, 0.2840805649757385, 0.29636940360069275, 0.3086582124233246, 0.3209470212459564, 0.33323583006858826, 0.3455246686935425, 0.3578134775161743, 0.37010228633880615, 0.382391095161438, 0.3946799337863922, 0.40696874260902405, 0.4192575514316559, 0.4315463602542877, 0.44383519887924194, 0.4561240077018738]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 6.0, 4.0, 18.0, 15.0, 11.0, 21.0, 38.0, 49.0, 88.0, 109.0, 185.0, 234.0, 399.0, 636.0, 1189.0, 2182.0, 4361.0, 9465.0, 23436.0, 68337.0, 286096.0, 2156691.0, 1360666.0, 197205.0, 50989.0, 17820.0, 7116.0, 3237.0, 1565.0, 833.0, 439.0, 296.0, 177.0, 120.0, 77.0, 50.0, 30.0, 28.0, 13.0, 21.0, 11.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12890625, -0.1254110336303711, -0.12191581726074219, -0.11842060089111328, -0.11492538452148438, -0.11143016815185547, -0.10793495178222656, -0.10443973541259766, -0.10094451904296875, -0.09744930267333984, -0.09395408630371094, -0.09045886993408203, -0.08696365356445312, -0.08346843719482422, -0.07997322082519531, -0.0764780044555664, -0.0729827880859375, -0.0694875717163086, -0.06599235534667969, -0.06249713897705078, -0.059001922607421875, -0.05550670623779297, -0.05201148986816406, -0.048516273498535156, -0.04502105712890625, -0.041525840759277344, -0.03803062438964844, -0.03453540802001953, -0.031040191650390625, -0.02754497528076172, -0.024049758911132812, -0.020554542541503906, -0.017059326171875, -0.013564109802246094, -0.010068893432617188, -0.006573677062988281, -0.003078460693359375, 0.00041675567626953125, 0.0039119720458984375, 0.007407188415527344, 0.01090240478515625, 0.014397621154785156, 0.017892837524414062, 0.02138805389404297, 0.024883270263671875, 0.02837848663330078, 0.03187370300292969, 0.035368919372558594, 0.0388641357421875, 0.042359352111816406, 0.04585456848144531, 0.04934978485107422, 0.052845001220703125, 0.05634021759033203, 0.05983543395996094, 0.06333065032958984, 0.06682586669921875, 0.07032108306884766, 0.07381629943847656, 0.07731151580810547, 0.08080673217773438, 0.08430194854736328, 0.08779716491699219, 0.0912923812866211, 0.09478759765625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 15.0, 9.0, 16.0, 18.0, 12.0, 19.0, 24.0, 35.0, 34.0, 33.0, 38.0, 35.0, 50.0, 48.0, 52.0, 64.0, 46.0, 49.0, 40.0, 43.0, 32.0, 41.0, 24.0, 21.0, 27.0, 23.0, 28.0, 22.0, 19.0, 12.0, 7.0, 12.0, 3.0, 1.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.056640625, -0.05509138107299805, -0.053542137145996094, -0.05199289321899414, -0.05044364929199219, -0.048894405364990234, -0.04734516143798828, -0.04579591751098633, -0.044246673583984375, -0.04269742965698242, -0.04114818572998047, -0.039598941802978516, -0.03804969787597656, -0.03650045394897461, -0.034951210021972656, -0.0334019660949707, -0.03185272216796875, -0.030303478240966797, -0.028754234313964844, -0.02720499038696289, -0.025655746459960938, -0.024106502532958984, -0.02255725860595703, -0.021008014678955078, -0.019458770751953125, -0.017909526824951172, -0.01636028289794922, -0.014811038970947266, -0.013261795043945312, -0.01171255111694336, -0.010163307189941406, -0.008614063262939453, -0.0070648193359375, -0.005515575408935547, -0.003966331481933594, -0.0024170875549316406, -0.0008678436279296875, 0.0006814002990722656, 0.0022306442260742188, 0.003779888153076172, 0.005329132080078125, 0.006878376007080078, 0.008427619934082031, 0.009976863861083984, 0.011526107788085938, 0.01307535171508789, 0.014624595642089844, 0.016173839569091797, 0.01772308349609375, 0.019272327423095703, 0.020821571350097656, 0.02237081527709961, 0.023920059204101562, 0.025469303131103516, 0.02701854705810547, 0.028567790985107422, 0.030117034912109375, 0.03166627883911133, 0.03321552276611328, 0.034764766693115234, 0.03631401062011719, 0.03786325454711914, 0.039412498474121094, 0.04096174240112305, 0.042510986328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 4.0, 17.0, 16.0, 25.0, 44.0, 59.0, 103.0, 183.0, 382.0, 764.0, 2067.0, 5920.0, 19618.0, 78549.0, 371648.0, 1952005.0, 1411416.0, 269201.0, 58986.0, 15411.0, 4629.0, 1741.0, 702.0, 337.0, 166.0, 98.0, 57.0, 41.0, 27.0, 11.0, 10.0, 16.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11160659790039062, -0.10712432861328125, -0.10264205932617188, -0.0981597900390625, -0.09367752075195312, -0.08919525146484375, -0.08471298217773438, -0.080230712890625, -0.07574844360351562, -0.07126617431640625, -0.06678390502929688, -0.0623016357421875, -0.057819366455078125, -0.05333709716796875, -0.048854827880859375, -0.04437255859375, -0.039890289306640625, -0.03540802001953125, -0.030925750732421875, -0.0264434814453125, -0.021961212158203125, -0.01747894287109375, -0.012996673583984375, -0.008514404296875, -0.004032135009765625, 0.00045013427734375, 0.004932403564453125, 0.0094146728515625, 0.013896942138671875, 0.01837921142578125, 0.022861480712890625, 0.02734375, 0.031826019287109375, 0.03630828857421875, 0.040790557861328125, 0.0452728271484375, 0.049755096435546875, 0.05423736572265625, 0.058719635009765625, 0.063201904296875, 0.06768417358398438, 0.07216644287109375, 0.07664871215820312, 0.0811309814453125, 0.08561325073242188, 0.09009552001953125, 0.09457778930664062, 0.09906005859375, 0.10354232788085938, 0.10802459716796875, 0.11250686645507812, 0.1169891357421875, 0.12147140502929688, 0.12595367431640625, 0.13043594360351562, 0.134918212890625, 0.13940048217773438, 0.14388275146484375, 0.14836502075195312, 0.1528472900390625, 0.15732955932617188, 0.16181182861328125, 0.16629409790039062, 0.1707763671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 10.0, 11.0, 15.0, 17.0, 31.0, 31.0, 70.0, 94.0, 113.0, 149.0, 257.0, 371.0, 587.0, 735.0, 495.0, 354.0, 237.0, 155.0, 111.0, 70.0, 44.0, 36.0, 22.0, 16.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09309577941894531, -0.08981704711914062, -0.08653831481933594, -0.08325958251953125, -0.07998085021972656, -0.07670211791992188, -0.07342338562011719, -0.0701446533203125, -0.06686592102050781, -0.06358718872070312, -0.06030845642089844, -0.05702972412109375, -0.05375099182128906, -0.050472259521484375, -0.04719352722167969, -0.043914794921875, -0.04063606262207031, -0.037357330322265625, -0.03407859802246094, -0.03079986572265625, -0.027521133422851562, -0.024242401123046875, -0.020963668823242188, -0.0176849365234375, -0.014406204223632812, -0.011127471923828125, -0.007848739624023438, -0.00457000732421875, -0.0012912750244140625, 0.001987457275390625, 0.0052661895751953125, 0.008544921875, 0.011823654174804688, 0.015102386474609375, 0.018381118774414062, 0.02165985107421875, 0.024938583374023438, 0.028217315673828125, 0.03149604797363281, 0.0347747802734375, 0.03805351257324219, 0.041332244873046875, 0.04461097717285156, 0.04788970947265625, 0.05116844177246094, 0.054447174072265625, 0.05772590637207031, 0.061004638671875, 0.06428337097167969, 0.06756210327148438, 0.07084083557128906, 0.07411956787109375, 0.07739830017089844, 0.08067703247070312, 0.08395576477050781, 0.0872344970703125, 0.09051322937011719, 0.09379196166992188, 0.09707069396972656, 0.10034942626953125, 0.10362815856933594, 0.10690689086914062, 0.11018562316894531, 0.11346435546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 9.0, 56.0, 167.0, 368.0, 284.0, 104.0, 12.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.422279715538025, -1.3846240043640137, -1.3469682931900024, -1.3093125820159912, -1.27165687084198, -1.2340011596679688, -1.196345329284668, -1.1586896181106567, -1.1210339069366455, -1.0833781957626343, -1.045722484588623, -1.0080667734146118, -0.9704110026359558, -0.9327552914619446, -0.8950995802879333, -0.8574438095092773, -0.8197881579399109, -0.7821324467658997, -0.7444767355918884, -0.7068209648132324, -0.6691652536392212, -0.63150954246521, -0.5938538312911987, -0.5561981201171875, -0.5185424089431763, -0.48088669776916504, -0.4432309567928314, -0.4055752456188202, -0.3679195046424866, -0.33026379346847534, -0.2926080822944641, -0.2549523413181305, -0.21729660034179688, -0.17964087426662445, -0.14198514819145203, -0.1043294370174408, -0.06667371094226837, -0.029017984867095947, 0.008637726306915283, 0.0462934672832489, 0.08394917845726013, 0.12160490453243256, 0.15926063060760498, 0.1969163417816162, 0.23457206785678864, 0.27222779393196106, 0.3098835051059723, 0.3475392460823059, 0.38519495725631714, 0.42285066843032837, 0.460506409406662, 0.4981621205806732, 0.5358178615570068, 0.5734735727310181, 0.6111292839050293, 0.6487849950790405, 0.6864407062530518, 0.724096417427063, 0.7617521286010742, 0.7994078397750854, 0.8370636105537415, 0.8747193217277527, 0.9123750329017639, 0.9500308036804199, 0.9876865148544312]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 8.0, 10.0, 8.0, 10.0, 14.0, 14.0, 10.0, 23.0, 21.0, 23.0, 27.0, 31.0, 42.0, 32.0, 44.0, 39.0, 53.0, 65.0, 54.0, 64.0, 51.0, 49.0, 36.0, 42.0, 33.0, 32.0, 28.0, 34.0, 19.0, 20.0, 9.0, 12.0, 7.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2994953989982605, -0.2902734875679016, -0.2810515761375427, -0.2718296945095062, -0.26260778307914734, -0.25338587164878845, -0.24416397511959076, -0.23494207859039307, -0.22572016716003418, -0.2164982557296753, -0.2072763592004776, -0.1980544626712799, -0.18883255124092102, -0.17961063981056213, -0.17038874328136444, -0.16116684675216675, -0.15194493532180786, -0.14272302389144897, -0.13350112736225128, -0.12427922338247299, -0.1150573194026947, -0.10583541542291641, -0.09661351144313812, -0.08739160746335983, -0.07816970348358154, -0.06894779950380325, -0.05972589552402496, -0.050503991544246674, -0.041282087564468384, -0.032060183584690094, -0.022838279604911804, -0.013616375625133514, -0.004394471645355225, 0.004827432334423065, 0.014049336314201355, 0.023271240293979645, 0.032493144273757935, 0.041715048253536224, 0.050936952233314514, 0.060158856213092804, 0.0693807601928711, 0.07860266417264938, 0.08782456815242767, 0.09704647213220596, 0.10626837611198425, 0.11549028009176254, 0.12471218407154083, 0.13393408060073853, 0.1431559920310974, 0.1523779034614563, 0.161599799990654, 0.17082169651985168, 0.18004360795021057, 0.18926551938056946, 0.19848741590976715, 0.20770931243896484, 0.21693122386932373, 0.22615313529968262, 0.2353750318288803, 0.244596928358078, 0.2538188397884369, 0.2630407512187958, 0.2722626328468323, 0.28148454427719116, 0.29070645570755005]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 18.0, 29.0, 28.0, 55.0, 94.0, 114.0, 211.0, 322.0, 464.0, 810.0, 1278.0, 2079.0, 3422.0, 5856.0, 10656.0, 21151.0, 47566.0, 117544.0, 258314.0, 300184.0, 156302.0, 63863.0, 27147.0, 13239.0, 7175.0, 4090.0, 2530.0, 1457.0, 929.0, 612.0, 375.0, 231.0, 167.0, 78.0, 49.0, 39.0, 29.0, 15.0, 18.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09857177734375, -0.09519195556640625, -0.0918121337890625, -0.08843231201171875, -0.085052490234375, -0.08167266845703125, -0.0782928466796875, -0.07491302490234375, -0.071533203125, -0.06815338134765625, -0.0647735595703125, -0.06139373779296875, -0.058013916015625, -0.05463409423828125, -0.0512542724609375, -0.04787445068359375, -0.04449462890625, -0.04111480712890625, -0.0377349853515625, -0.03435516357421875, -0.030975341796875, -0.02759552001953125, -0.0242156982421875, -0.02083587646484375, -0.0174560546875, -0.01407623291015625, -0.0106964111328125, -0.00731658935546875, -0.003936767578125, -0.00055694580078125, 0.0028228759765625, 0.00620269775390625, 0.00958251953125, 0.01296234130859375, 0.0163421630859375, 0.01972198486328125, 0.023101806640625, 0.02648162841796875, 0.0298614501953125, 0.03324127197265625, 0.03662109375, 0.04000091552734375, 0.0433807373046875, 0.04676055908203125, 0.050140380859375, 0.05352020263671875, 0.0569000244140625, 0.06027984619140625, 0.06365966796875, 0.06703948974609375, 0.0704193115234375, 0.07379913330078125, 0.077178955078125, 0.08055877685546875, 0.0839385986328125, 0.08731842041015625, 0.0906982421875, 0.09407806396484375, 0.0974578857421875, 0.10083770751953125, 0.104217529296875, 0.10759735107421875, 0.1109771728515625, 0.11435699462890625, 0.11773681640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 1.0, 4.0, 4.0, 5.0, 8.0, 3.0, 10.0, 14.0, 15.0, 13.0, 16.0, 15.0, 25.0, 30.0, 31.0, 37.0, 46.0, 40.0, 41.0, 45.0, 44.0, 63.0, 54.0, 48.0, 52.0, 43.0, 45.0, 29.0, 33.0, 31.0, 20.0, 23.0, 16.0, 16.0, 16.0, 18.0, 13.0, 10.0, 5.0, 4.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.050567626953125, -0.04915046691894531, -0.047733306884765625, -0.04631614685058594, -0.04489898681640625, -0.04348182678222656, -0.042064666748046875, -0.04064750671386719, -0.0392303466796875, -0.03781318664550781, -0.036396026611328125, -0.03497886657714844, -0.03356170654296875, -0.03214454650878906, -0.030727386474609375, -0.029310226440429688, -0.02789306640625, -0.026475906372070312, -0.025058746337890625, -0.023641586303710938, -0.02222442626953125, -0.020807266235351562, -0.019390106201171875, -0.017972946166992188, -0.0165557861328125, -0.015138626098632812, -0.013721466064453125, -0.012304306030273438, -0.01088714599609375, -0.009469985961914062, -0.008052825927734375, -0.0066356658935546875, -0.005218505859375, -0.0038013458251953125, -0.002384185791015625, -0.0009670257568359375, 0.00045013427734375, 0.0018672943115234375, 0.003284454345703125, 0.0047016143798828125, 0.0061187744140625, 0.0075359344482421875, 0.008953094482421875, 0.010370254516601562, 0.01178741455078125, 0.013204574584960938, 0.014621734619140625, 0.016038894653320312, 0.0174560546875, 0.018873214721679688, 0.020290374755859375, 0.021707534790039062, 0.02312469482421875, 0.024541854858398438, 0.025959014892578125, 0.027376174926757812, 0.0287933349609375, 0.030210494995117188, 0.031627655029296875, 0.03304481506347656, 0.03446197509765625, 0.03587913513183594, 0.037296295166015625, 0.03871345520019531, 0.040130615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 11.0, 12.0, 11.0, 15.0, 23.0, 31.0, 31.0, 52.0, 77.0, 95.0, 188.0, 316.0, 568.0, 1103.0, 2342.0, 5167.0, 12264.0, 30561.0, 89680.0, 281411.0, 388304.0, 154168.0, 48808.0, 18573.0, 7759.0, 3409.0, 1568.0, 795.0, 473.0, 234.0, 141.0, 110.0, 61.0, 38.0, 24.0, 33.0, 16.0, 14.0, 15.0, 11.0, 11.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.138671875, -0.13408470153808594, -0.12949752807617188, -0.12491035461425781, -0.12032318115234375, -0.11573600769042969, -0.11114883422851562, -0.10656166076660156, -0.1019744873046875, -0.09738731384277344, -0.09280014038085938, -0.08821296691894531, -0.08362579345703125, -0.07903861999511719, -0.07445144653320312, -0.06986427307128906, -0.065277099609375, -0.06068992614746094, -0.056102752685546875, -0.05151557922363281, -0.04692840576171875, -0.04234123229980469, -0.037754058837890625, -0.03316688537597656, -0.0285797119140625, -0.023992538452148438, -0.019405364990234375, -0.014818191528320312, -0.01023101806640625, -0.0056438446044921875, -0.001056671142578125, 0.0035305023193359375, 0.00811767578125, 0.012704849243164062, 0.017292022705078125, 0.021879196166992188, 0.02646636962890625, 0.031053543090820312, 0.035640716552734375, 0.04022789001464844, 0.0448150634765625, 0.04940223693847656, 0.053989410400390625, 0.05857658386230469, 0.06316375732421875, 0.06775093078613281, 0.07233810424804688, 0.07692527770996094, 0.081512451171875, 0.08609962463378906, 0.09068679809570312, 0.09527397155761719, 0.09986114501953125, 0.10444831848144531, 0.10903549194335938, 0.11362266540527344, 0.1182098388671875, 0.12279701232910156, 0.12738418579101562, 0.1319713592529297, 0.13655853271484375, 0.1411457061767578, 0.14573287963867188, 0.15032005310058594, 0.1549072265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 4.0, 7.0, 9.0, 6.0, 7.0, 11.0, 18.0, 10.0, 16.0, 14.0, 19.0, 24.0, 29.0, 40.0, 40.0, 25.0, 34.0, 37.0, 48.0, 43.0, 48.0, 38.0, 32.0, 44.0, 40.0, 44.0, 39.0, 32.0, 31.0, 28.0, 31.0, 22.0, 21.0, 17.0, 12.0, 15.0, 19.0, 9.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10107421875, -0.09801197052001953, -0.09494972229003906, -0.0918874740600586, -0.08882522583007812, -0.08576297760009766, -0.08270072937011719, -0.07963848114013672, -0.07657623291015625, -0.07351398468017578, -0.07045173645019531, -0.06738948822021484, -0.06432723999023438, -0.061264991760253906, -0.05820274353027344, -0.05514049530029297, -0.0520782470703125, -0.04901599884033203, -0.04595375061035156, -0.042891502380371094, -0.039829254150390625, -0.036767005920410156, -0.03370475769042969, -0.03064250946044922, -0.02758026123046875, -0.02451801300048828, -0.021455764770507812, -0.018393516540527344, -0.015331268310546875, -0.012269020080566406, -0.009206771850585938, -0.006144523620605469, -0.003082275390625, -2.002716064453125e-05, 0.0030422210693359375, 0.006104469299316406, 0.009166717529296875, 0.012228965759277344, 0.015291213989257812, 0.01835346221923828, 0.02141571044921875, 0.02447795867919922, 0.027540206909179688, 0.030602455139160156, 0.033664703369140625, 0.036726951599121094, 0.03978919982910156, 0.04285144805908203, 0.0459136962890625, 0.04897594451904297, 0.05203819274902344, 0.055100440979003906, 0.058162689208984375, 0.061224937438964844, 0.06428718566894531, 0.06734943389892578, 0.07041168212890625, 0.07347393035888672, 0.07653617858886719, 0.07959842681884766, 0.08266067504882812, 0.0857229232788086, 0.08878517150878906, 0.09184741973876953, 0.09490966796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 2.0, 7.0, 18.0, 13.0, 39.0, 65.0, 82.0, 150.0, 266.0, 417.0, 642.0, 1023.0, 1826.0, 4362.0, 18997.0, 333192.0, 644777.0, 31841.0, 5698.0, 2142.0, 1105.0, 695.0, 389.0, 265.0, 189.0, 106.0, 86.0, 50.0, 34.0, 20.0, 14.0, 13.0, 9.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2257080078125, -0.21889305114746094, -0.21207809448242188, -0.2052631378173828, -0.19844818115234375, -0.1916332244873047, -0.18481826782226562, -0.17800331115722656, -0.1711883544921875, -0.16437339782714844, -0.15755844116210938, -0.1507434844970703, -0.14392852783203125, -0.1371135711669922, -0.13029861450195312, -0.12348365783691406, -0.116668701171875, -0.10985374450683594, -0.10303878784179688, -0.09622383117675781, -0.08940887451171875, -0.08259391784667969, -0.07577896118164062, -0.06896400451660156, -0.0621490478515625, -0.05533409118652344, -0.048519134521484375, -0.04170417785644531, -0.03488922119140625, -0.028074264526367188, -0.021259307861328125, -0.014444351196289062, -0.00762939453125, -0.0008144378662109375, 0.006000518798828125, 0.012815475463867188, 0.01963043212890625, 0.026445388793945312, 0.033260345458984375, 0.04007530212402344, 0.0468902587890625, 0.05370521545410156, 0.060520172119140625, 0.06733512878417969, 0.07415008544921875, 0.08096504211425781, 0.08777999877929688, 0.09459495544433594, 0.101409912109375, 0.10822486877441406, 0.11503982543945312, 0.12185478210449219, 0.12866973876953125, 0.1354846954345703, 0.14229965209960938, 0.14911460876464844, 0.1559295654296875, 0.16274452209472656, 0.16955947875976562, 0.1763744354248047, 0.18318939208984375, 0.1900043487548828, 0.19681930541992188, 0.20363426208496094, 0.21044921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 14.0, 12.0, 24.0, 28.0, 51.0, 80.0, 105.0, 127.0, 150.0, 121.0, 87.0, 67.0, 38.0, 20.0, 20.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9669532775878906e-05, -1.8967315554618835e-05, -1.8265098333358765e-05, -1.7562881112098694e-05, -1.6860663890838623e-05, -1.6158446669578552e-05, -1.545622944831848e-05, -1.475401222705841e-05, -1.405179500579834e-05, -1.3349577784538269e-05, -1.2647360563278198e-05, -1.1945143342018127e-05, -1.1242926120758057e-05, -1.0540708899497986e-05, -9.838491678237915e-06, -9.136274456977844e-06, -8.434057235717773e-06, -7.731840014457703e-06, -7.029622793197632e-06, -6.327405571937561e-06, -5.62518835067749e-06, -4.9229711294174194e-06, -4.220753908157349e-06, -3.518536686897278e-06, -2.816319465637207e-06, -2.1141022443771362e-06, -1.4118850231170654e-06, -7.096678018569946e-07, -7.450580596923828e-09, 6.94766640663147e-07, 1.3969838619232178e-06, 2.0992010831832886e-06, 2.8014183044433594e-06, 3.50363552570343e-06, 4.205852746963501e-06, 4.908069968223572e-06, 5.610287189483643e-06, 6.312504410743713e-06, 7.014721632003784e-06, 7.716938853263855e-06, 8.419156074523926e-06, 9.121373295783997e-06, 9.823590517044067e-06, 1.0525807738304138e-05, 1.1228024959564209e-05, 1.193024218082428e-05, 1.263245940208435e-05, 1.3334676623344421e-05, 1.4036893844604492e-05, 1.4739111065864563e-05, 1.5441328287124634e-05, 1.6143545508384705e-05, 1.6845762729644775e-05, 1.7547979950904846e-05, 1.8250197172164917e-05, 1.8952414393424988e-05, 1.965463161468506e-05, 2.035684883594513e-05, 2.10590660572052e-05, 2.176128327846527e-05, 2.2463500499725342e-05, 2.3165717720985413e-05, 2.3867934942245483e-05, 2.4570152163505554e-05, 2.5272369384765625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 5.0, 13.0, 22.0, 32.0, 58.0, 58.0, 127.0, 205.0, 318.0, 497.0, 981.0, 2021.0, 4668.0, 12773.0, 42317.0, 166277.0, 443261.0, 272936.0, 70001.0, 19637.0, 6710.0, 2683.0, 1248.0, 672.0, 393.0, 222.0, 137.0, 82.0, 73.0, 36.0, 30.0, 16.0, 9.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.0670766830444336, -0.06481742858886719, -0.06255817413330078, -0.060298919677734375, -0.05803966522216797, -0.05578041076660156, -0.053521156311035156, -0.05126190185546875, -0.049002647399902344, -0.04674339294433594, -0.04448413848876953, -0.042224884033203125, -0.03996562957763672, -0.03770637512207031, -0.035447120666503906, -0.0331878662109375, -0.030928611755371094, -0.028669357299804688, -0.02641010284423828, -0.024150848388671875, -0.02189159393310547, -0.019632339477539062, -0.017373085021972656, -0.01511383056640625, -0.012854576110839844, -0.010595321655273438, -0.008336067199707031, -0.006076812744140625, -0.0038175582885742188, -0.0015583038330078125, 0.0007009506225585938, 0.002960205078125, 0.005219459533691406, 0.0074787139892578125, 0.009737968444824219, 0.011997222900390625, 0.014256477355957031, 0.016515731811523438, 0.018774986267089844, 0.02103424072265625, 0.023293495178222656, 0.025552749633789062, 0.02781200408935547, 0.030071258544921875, 0.03233051300048828, 0.03458976745605469, 0.036849021911621094, 0.0391082763671875, 0.041367530822753906, 0.04362678527832031, 0.04588603973388672, 0.048145294189453125, 0.05040454864501953, 0.05266380310058594, 0.054923057556152344, 0.05718231201171875, 0.059441566467285156, 0.06170082092285156, 0.06396007537841797, 0.06621932983398438, 0.06847858428955078, 0.07073783874511719, 0.0729970932006836, 0.07525634765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 12.0, 12.0, 15.0, 21.0, 35.0, 30.0, 44.0, 47.0, 63.0, 80.0, 53.0, 66.0, 67.0, 89.0, 58.0, 53.0, 39.0, 39.0, 40.0, 26.0, 24.0, 16.0, 10.0, 14.0, 12.0, 7.0, 13.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033905029296875, -0.03288459777832031, -0.031864166259765625, -0.030843734741210938, -0.02982330322265625, -0.028802871704101562, -0.027782440185546875, -0.026762008666992188, -0.0257415771484375, -0.024721145629882812, -0.023700714111328125, -0.022680282592773438, -0.02165985107421875, -0.020639419555664062, -0.019618988037109375, -0.018598556518554688, -0.017578125, -0.016557693481445312, -0.015537261962890625, -0.014516830444335938, -0.01349639892578125, -0.012475967407226562, -0.011455535888671875, -0.010435104370117188, -0.0094146728515625, -0.008394241333007812, -0.007373809814453125, -0.0063533782958984375, -0.00533294677734375, -0.0043125152587890625, -0.003292083740234375, -0.0022716522216796875, -0.001251220703125, -0.0002307891845703125, 0.000789642333984375, 0.0018100738525390625, 0.00283050537109375, 0.0038509368896484375, 0.004871368408203125, 0.0058917999267578125, 0.0069122314453125, 0.007932662963867188, 0.008953094482421875, 0.009973526000976562, 0.01099395751953125, 0.012014389038085938, 0.013034820556640625, 0.014055252075195312, 0.01507568359375, 0.016096115112304688, 0.017116546630859375, 0.018136978149414062, 0.01915740966796875, 0.020177841186523438, 0.021198272705078125, 0.022218704223632812, 0.0232391357421875, 0.024259567260742188, 0.025279998779296875, 0.026300430297851562, 0.02732086181640625, 0.028341293334960938, 0.029361724853515625, 0.030382156372070312, 0.031402587890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 16.0, 72.0, 198.0, 321.0, 272.0, 85.0, 27.0, 11.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8004120588302612, -1.7662330865859985, -1.7320539951324463, -1.6978750228881836, -1.663696050643921, -1.6295170783996582, -1.595337986946106, -1.5611590147018433, -1.526979923248291, -1.4928009510040283, -1.458621859550476, -1.4244428873062134, -1.3902639150619507, -1.3560848236083984, -1.3219058513641357, -1.287726879119873, -1.2535479068756104, -1.2193689346313477, -1.1851898431777954, -1.1510108709335327, -1.11683189868927, -1.0826528072357178, -1.048473834991455, -1.0142948627471924, -0.9801158308982849, -0.9459367990493774, -0.9117578268051147, -0.8775787949562073, -0.8433997631072998, -0.8092207908630371, -0.7750417590141296, -0.7408627271652222, -0.7066836357116699, -0.6725046038627625, -0.6383256316184998, -0.6041465997695923, -0.5699676275253296, -0.5357885956764221, -0.5016095638275146, -0.46743056178092957, -0.43325158953666687, -0.3990725874900818, -0.3648935556411743, -0.33071455359458923, -0.29653555154800415, -0.26235654950141907, -0.2281775325536728, -0.1939985156059265, -0.15981951355934143, -0.12564051151275635, -0.09146149456501007, -0.05728248506784439, -0.02310347557067871, 0.011075526475906372, 0.04525454342365265, 0.07943356037139893, 0.11361256241798401, 0.1477915644645691, 0.18197058141231537, 0.21614959836006165, 0.25032860040664673, 0.2845076024532318, 0.3186866044998169, 0.35286563634872437, 0.38704463839530945]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 9.0, 4.0, 4.0, 8.0, 7.0, 16.0, 16.0, 19.0, 16.0, 22.0, 28.0, 32.0, 32.0, 40.0, 41.0, 42.0, 39.0, 39.0, 35.0, 32.0, 39.0, 37.0, 44.0, 40.0, 35.0, 42.0, 32.0, 29.0, 26.0, 29.0, 21.0, 20.0, 30.0, 12.0, 12.0, 21.0, 6.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23649901151657104, -0.22865955531597137, -0.2208200842142105, -0.21298062801361084, -0.20514117181301117, -0.1973017156124115, -0.18946224451065063, -0.18162278831005096, -0.1737833321094513, -0.16594387590885162, -0.15810440480709076, -0.1502649486064911, -0.14242549240589142, -0.13458603620529175, -0.12674656510353088, -0.11890710890293121, -0.11106763780117035, -0.10322817414999008, -0.09538871794939041, -0.08754925429821014, -0.07970979809761047, -0.0718703344464302, -0.06403087079524994, -0.05619141086935997, -0.04835195094347, -0.04051249101758003, -0.032673031091690063, -0.024833567440509796, -0.016994107514619827, -0.009154647588729858, -0.001315183937549591, 0.006524275988340378, 0.014363735914230347, 0.022203195840120316, 0.030042657628655434, 0.03788211941719055, 0.04572157934308052, 0.05356103926897049, 0.06140050292015076, 0.06923995912075043, 0.0770794227719307, 0.08491888642311096, 0.09275834262371063, 0.1005978062748909, 0.10843726992607117, 0.11627672612667084, 0.1241161897778511, 0.13195565342903137, 0.13979510962963104, 0.1476345658302307, 0.15547403693199158, 0.16331349313259125, 0.17115294933319092, 0.17899242043495178, 0.18683187663555145, 0.19467133283615112, 0.202510803937912, 0.21035026013851166, 0.21818973124027252, 0.2260291874408722, 0.23386864364147186, 0.24170809984207153, 0.2495475709438324, 0.25738704204559326, 0.26522648334503174]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 4.0, 13.0, 11.0, 27.0, 26.0, 62.0, 67.0, 107.0, 190.0, 370.0, 648.0, 1408.0, 3378.0, 8162.0, 23470.0, 82779.0, 395380.0, 1900879.0, 1431296.0, 258985.0, 58841.0, 17499.0, 6081.0, 2434.0, 1061.0, 471.0, 237.0, 144.0, 90.0, 60.0, 37.0, 14.0, 20.0, 11.0, 11.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09649658203125, -0.09356117248535156, -0.09062576293945312, -0.08769035339355469, -0.08475494384765625, -0.08181953430175781, -0.07888412475585938, -0.07594871520996094, -0.0730133056640625, -0.07007789611816406, -0.06714248657226562, -0.06420707702636719, -0.06127166748046875, -0.05833625793457031, -0.055400848388671875, -0.05246543884277344, -0.049530029296875, -0.04659461975097656, -0.043659210205078125, -0.04072380065917969, -0.03778839111328125, -0.03485298156738281, -0.031917572021484375, -0.028982162475585938, -0.0260467529296875, -0.023111343383789062, -0.020175933837890625, -0.017240524291992188, -0.01430511474609375, -0.011369705200195312, -0.008434295654296875, -0.0054988861083984375, -0.0025634765625, 0.0003719329833984375, 0.003307342529296875, 0.0062427520751953125, 0.00917816162109375, 0.012113571166992188, 0.015048980712890625, 0.017984390258789062, 0.0209197998046875, 0.023855209350585938, 0.026790618896484375, 0.029726028442382812, 0.03266143798828125, 0.03559684753417969, 0.038532257080078125, 0.04146766662597656, 0.044403076171875, 0.04733848571777344, 0.050273895263671875, 0.05320930480957031, 0.05614471435546875, 0.05908012390136719, 0.062015533447265625, 0.06495094299316406, 0.0678863525390625, 0.07082176208496094, 0.07375717163085938, 0.07669258117675781, 0.07962799072265625, 0.08256340026855469, 0.08549880981445312, 0.08843421936035156, 0.09136962890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 6.0, 9.0, 11.0, 13.0, 29.0, 25.0, 19.0, 23.0, 33.0, 33.0, 43.0, 52.0, 53.0, 39.0, 31.0, 39.0, 40.0, 37.0, 39.0, 49.0, 32.0, 25.0, 45.0, 34.0, 31.0, 39.0, 26.0, 20.0, 19.0, 12.0, 11.0, 17.0, 9.0, 5.0, 5.0, 8.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.042694091796875, -0.0413661003112793, -0.040038108825683594, -0.03871011734008789, -0.03738212585449219, -0.036054134368896484, -0.03472614288330078, -0.03339815139770508, -0.032070159912109375, -0.030742168426513672, -0.02941417694091797, -0.028086185455322266, -0.026758193969726562, -0.02543020248413086, -0.024102210998535156, -0.022774219512939453, -0.02144622802734375, -0.020118236541748047, -0.018790245056152344, -0.01746225357055664, -0.016134262084960938, -0.014806270599365234, -0.013478279113769531, -0.012150287628173828, -0.010822296142578125, -0.009494304656982422, -0.008166313171386719, -0.006838321685791016, -0.0055103302001953125, -0.004182338714599609, -0.0028543472290039062, -0.0015263557434082031, -0.0001983642578125, 0.0011296272277832031, 0.0024576187133789062, 0.0037856101989746094, 0.0051136016845703125, 0.006441593170166016, 0.007769584655761719, 0.009097576141357422, 0.010425567626953125, 0.011753559112548828, 0.013081550598144531, 0.014409542083740234, 0.015737533569335938, 0.01706552505493164, 0.018393516540527344, 0.019721508026123047, 0.02104949951171875, 0.022377490997314453, 0.023705482482910156, 0.02503347396850586, 0.026361465454101562, 0.027689456939697266, 0.02901744842529297, 0.030345439910888672, 0.031673431396484375, 0.03300142288208008, 0.03432941436767578, 0.035657405853271484, 0.03698539733886719, 0.03831338882446289, 0.039641380310058594, 0.0409693717956543, 0.04229736328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 16.0, 13.0, 17.0, 27.0, 30.0, 34.0, 72.0, 129.0, 202.0, 335.0, 705.0, 1375.0, 3220.0, 8580.0, 25976.0, 87339.0, 315335.0, 1045615.0, 1683493.0, 726391.0, 207892.0, 58704.0, 17867.0, 6193.0, 2399.0, 1080.0, 511.0, 301.0, 140.0, 87.0, 68.0, 40.0, 23.0, 21.0, 14.0, 15.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.08723640441894531, -0.08426284790039062, -0.08128929138183594, -0.07831573486328125, -0.07534217834472656, -0.07236862182617188, -0.06939506530761719, -0.0664215087890625, -0.06344795227050781, -0.060474395751953125, -0.05750083923339844, -0.05452728271484375, -0.05155372619628906, -0.048580169677734375, -0.04560661315917969, -0.042633056640625, -0.03965950012207031, -0.036685943603515625, -0.03371238708496094, -0.03073883056640625, -0.027765274047851562, -0.024791717529296875, -0.021818161010742188, -0.0188446044921875, -0.015871047973632812, -0.012897491455078125, -0.009923934936523438, -0.00695037841796875, -0.0039768218994140625, -0.001003265380859375, 0.0019702911376953125, 0.00494384765625, 0.007917404174804688, 0.010890960693359375, 0.013864517211914062, 0.01683807373046875, 0.019811630249023438, 0.022785186767578125, 0.025758743286132812, 0.0287322998046875, 0.03170585632324219, 0.034679412841796875, 0.03765296936035156, 0.04062652587890625, 0.04360008239746094, 0.046573638916015625, 0.04954719543457031, 0.052520751953125, 0.05549430847167969, 0.058467864990234375, 0.06144142150878906, 0.06441497802734375, 0.06738853454589844, 0.07036209106445312, 0.07333564758300781, 0.0763092041015625, 0.07928276062011719, 0.08225631713867188, 0.08522987365722656, 0.08820343017578125, 0.09117698669433594, 0.09415054321289062, 0.09712409973144531, 0.10009765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 13.0, 13.0, 21.0, 26.0, 34.0, 52.0, 72.0, 83.0, 122.0, 183.0, 206.0, 295.0, 329.0, 367.0, 415.0, 384.0, 309.0, 257.0, 213.0, 153.0, 123.0, 98.0, 72.0, 62.0, 43.0, 39.0, 20.0, 21.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07659912109375, -0.07396697998046875, -0.0713348388671875, -0.06870269775390625, -0.066070556640625, -0.06343841552734375, -0.0608062744140625, -0.05817413330078125, -0.0555419921875, -0.05290985107421875, -0.0502777099609375, -0.04764556884765625, -0.045013427734375, -0.04238128662109375, -0.0397491455078125, -0.03711700439453125, -0.03448486328125, -0.03185272216796875, -0.0292205810546875, -0.02658843994140625, -0.023956298828125, -0.02132415771484375, -0.0186920166015625, -0.01605987548828125, -0.013427734375, -0.01079559326171875, -0.0081634521484375, -0.00553131103515625, -0.002899169921875, -0.00026702880859375, 0.0023651123046875, 0.00499725341796875, 0.00762939453125, 0.01026153564453125, 0.0128936767578125, 0.01552581787109375, 0.018157958984375, 0.02079010009765625, 0.0234222412109375, 0.02605438232421875, 0.0286865234375, 0.03131866455078125, 0.0339508056640625, 0.03658294677734375, 0.039215087890625, 0.04184722900390625, 0.0444793701171875, 0.04711151123046875, 0.04974365234375, 0.05237579345703125, 0.0550079345703125, 0.05764007568359375, 0.060272216796875, 0.06290435791015625, 0.0655364990234375, 0.06816864013671875, 0.07080078125, 0.07343292236328125, 0.0760650634765625, 0.07869720458984375, 0.081329345703125, 0.08396148681640625, 0.0865936279296875, 0.08922576904296875, 0.09185791015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 16.0, 23.0, 22.0, 50.0, 82.0, 114.0, 130.0, 151.0, 127.0, 101.0, 64.0, 44.0, 34.0, 19.0, 13.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4025265574455261, -0.38438695669174194, -0.36624738574028015, -0.34810781478881836, -0.3299682140350342, -0.31182861328125, -0.2936890423297882, -0.2755494713783264, -0.25740987062454224, -0.23927028477191925, -0.22113069891929626, -0.20299111306667328, -0.1848515272140503, -0.1667119413614273, -0.14857235550880432, -0.13043276965618134, -0.11229318380355835, -0.09415359795093536, -0.07601401209831238, -0.05787442624568939, -0.039734840393066406, -0.02159525454044342, -0.0034556686878204346, 0.014683917164802551, 0.03282350301742554, 0.05096308887004852, 0.06910267472267151, 0.0872422605752945, 0.10538184642791748, 0.12352143228054047, 0.14166101813316345, 0.15980060398578644, 0.17794013023376465, 0.19607971608638763, 0.21421930193901062, 0.2323588877916336, 0.2504984736442566, 0.26863807439804077, 0.28677764534950256, 0.30491721630096436, 0.32305681705474854, 0.3411964178085327, 0.3593359887599945, 0.3774755597114563, 0.3956151604652405, 0.41375476121902466, 0.43189433217048645, 0.45003390312194824, 0.4681735038757324, 0.4863131046295166, 0.5044527053833008, 0.5225922465324402, 0.5407318472862244, 0.5588714480400085, 0.577010989189148, 0.5951505899429321, 0.6132901906967163, 0.6314297914505005, 0.6495693922042847, 0.6677089333534241, 0.6858485341072083, 0.7039881348609924, 0.7221276760101318, 0.740267276763916, 0.7584068775177002]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 11.0, 9.0, 9.0, 14.0, 16.0, 18.0, 21.0, 29.0, 31.0, 30.0, 28.0, 20.0, 32.0, 46.0, 39.0, 24.0, 39.0, 49.0, 40.0, 34.0, 46.0, 53.0, 30.0, 42.0, 27.0, 32.0, 26.0, 30.0, 23.0, 23.0, 23.0, 18.0, 14.0, 15.0, 15.0, 10.0, 4.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.26721298694610596, -0.25777605175971985, -0.24833911657333374, -0.23890219628810883, -0.22946526110172272, -0.2200283259153366, -0.2105914056301117, -0.20115447044372559, -0.19171753525733948, -0.18228060007095337, -0.17284366488456726, -0.16340674459934235, -0.15396980941295624, -0.14453287422657013, -0.13509595394134521, -0.1256590187549591, -0.116222083568573, -0.10678514838218689, -0.09734822064638138, -0.08791129291057587, -0.07847435772418976, -0.06903742253780365, -0.05960049480199814, -0.05016356706619263, -0.04072663187980652, -0.03128970041871071, -0.0218527689576149, -0.012415837496519089, -0.002978906035423279, 0.006458025425672531, 0.01589495688676834, 0.025331884622573853, 0.03476881980895996, 0.04420575127005577, 0.05364268273115158, 0.06307961046695709, 0.0725165456533432, 0.08195348083972931, 0.09139040857553482, 0.10082733631134033, 0.11026427149772644, 0.11970120668411255, 0.12913814187049866, 0.13857506215572357, 0.14801199734210968, 0.1574489325284958, 0.1668858528137207, 0.1763227880001068, 0.18575972318649292, 0.19519665837287903, 0.20463359355926514, 0.21407051384449005, 0.22350744903087616, 0.23294438421726227, 0.24238130450248718, 0.2518182396888733, 0.2612551748752594, 0.2706921100616455, 0.2801290452480316, 0.2895659804344177, 0.29900288581848145, 0.30843982100486755, 0.31787675619125366, 0.32731369137763977, 0.3367506265640259]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 12.0, 16.0, 24.0, 36.0, 52.0, 65.0, 143.0, 213.0, 335.0, 649.0, 1133.0, 1997.0, 3915.0, 7191.0, 13175.0, 25171.0, 48233.0, 86433.0, 145468.0, 200986.0, 197415.0, 138481.0, 81610.0, 44573.0, 23726.0, 12669.0, 6750.0, 3500.0, 1982.0, 1093.0, 588.0, 352.0, 212.0, 129.0, 77.0, 49.0, 32.0, 26.0, 10.0, 8.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.0799713134765625, -0.077301025390625, -0.0746307373046875, -0.07196044921875, -0.0692901611328125, -0.066619873046875, -0.0639495849609375, -0.061279296875, -0.0586090087890625, -0.055938720703125, -0.0532684326171875, -0.05059814453125, -0.0479278564453125, -0.045257568359375, -0.0425872802734375, -0.0399169921875, -0.0372467041015625, -0.034576416015625, -0.0319061279296875, -0.02923583984375, -0.0265655517578125, -0.023895263671875, -0.0212249755859375, -0.0185546875, -0.0158843994140625, -0.013214111328125, -0.0105438232421875, -0.00787353515625, -0.0052032470703125, -0.002532958984375, 0.0001373291015625, 0.0028076171875, 0.0054779052734375, 0.008148193359375, 0.0108184814453125, 0.01348876953125, 0.0161590576171875, 0.018829345703125, 0.0214996337890625, 0.024169921875, 0.0268402099609375, 0.029510498046875, 0.0321807861328125, 0.03485107421875, 0.0375213623046875, 0.040191650390625, 0.0428619384765625, 0.0455322265625, 0.0482025146484375, 0.050872802734375, 0.0535430908203125, 0.05621337890625, 0.0588836669921875, 0.061553955078125, 0.0642242431640625, 0.06689453125, 0.0695648193359375, 0.072235107421875, 0.0749053955078125, 0.07757568359375, 0.0802459716796875, 0.082916259765625, 0.0855865478515625, 0.0882568359375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 4.0, 5.0, 8.0, 10.0, 9.0, 15.0, 13.0, 17.0, 30.0, 21.0, 26.0, 28.0, 34.0, 46.0, 52.0, 44.0, 50.0, 44.0, 66.0, 48.0, 41.0, 47.0, 41.0, 49.0, 33.0, 27.0, 27.0, 32.0, 17.0, 23.0, 20.0, 21.0, 13.0, 4.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04718017578125, -0.045813560485839844, -0.04444694519042969, -0.04308032989501953, -0.041713714599609375, -0.04034709930419922, -0.03898048400878906, -0.037613868713378906, -0.03624725341796875, -0.034880638122558594, -0.03351402282714844, -0.03214740753173828, -0.030780792236328125, -0.02941417694091797, -0.028047561645507812, -0.026680946350097656, -0.0253143310546875, -0.023947715759277344, -0.022581100463867188, -0.02121448516845703, -0.019847869873046875, -0.01848125457763672, -0.017114639282226562, -0.015748023986816406, -0.01438140869140625, -0.013014793395996094, -0.011648178100585938, -0.010281562805175781, -0.008914947509765625, -0.007548332214355469, -0.0061817169189453125, -0.004815101623535156, -0.003448486328125, -0.0020818710327148438, -0.0007152557373046875, 0.0006513595581054688, 0.002017974853515625, 0.0033845901489257812, 0.0047512054443359375, 0.006117820739746094, 0.00748443603515625, 0.008851051330566406, 0.010217666625976562, 0.011584281921386719, 0.012950897216796875, 0.014317512512207031, 0.015684127807617188, 0.017050743103027344, 0.0184173583984375, 0.019783973693847656, 0.021150588989257812, 0.02251720428466797, 0.023883819580078125, 0.02525043487548828, 0.026617050170898438, 0.027983665466308594, 0.02935028076171875, 0.030716896057128906, 0.03208351135253906, 0.03345012664794922, 0.034816741943359375, 0.03618335723876953, 0.03754997253417969, 0.038916587829589844, 0.040283203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 9.0, 8.0, 7.0, 15.0, 21.0, 24.0, 38.0, 73.0, 96.0, 132.0, 189.0, 271.0, 466.0, 726.0, 1241.0, 2065.0, 3628.0, 6366.0, 12127.0, 21168.0, 38913.0, 69021.0, 117029.0, 177686.0, 203644.0, 159815.0, 101124.0, 58609.0, 32691.0, 18071.0, 9955.0, 5408.0, 3133.0, 1794.0, 1060.0, 622.0, 413.0, 268.0, 165.0, 140.0, 96.0, 67.0, 42.0, 29.0, 20.0, 23.0, 5.0, 14.0, 8.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.08987236022949219, -0.08691024780273438, -0.08394813537597656, -0.08098602294921875, -0.07802391052246094, -0.07506179809570312, -0.07209968566894531, -0.0691375732421875, -0.06617546081542969, -0.06321334838867188, -0.06025123596191406, -0.05728912353515625, -0.05432701110839844, -0.051364898681640625, -0.04840278625488281, -0.045440673828125, -0.04247856140136719, -0.039516448974609375, -0.03655433654785156, -0.03359222412109375, -0.030630111694335938, -0.027667999267578125, -0.024705886840820312, -0.0217437744140625, -0.018781661987304688, -0.015819549560546875, -0.012857437133789062, -0.00989532470703125, -0.0069332122802734375, -0.003971099853515625, -0.0010089874267578125, 0.001953125, 0.0049152374267578125, 0.007877349853515625, 0.010839462280273438, 0.01380157470703125, 0.016763687133789062, 0.019725799560546875, 0.022687911987304688, 0.0256500244140625, 0.028612136840820312, 0.031574249267578125, 0.03453636169433594, 0.03749847412109375, 0.04046058654785156, 0.043422698974609375, 0.04638481140136719, 0.049346923828125, 0.05230903625488281, 0.055271148681640625, 0.05823326110839844, 0.06119537353515625, 0.06415748596191406, 0.06711959838867188, 0.07008171081542969, 0.0730438232421875, 0.07600593566894531, 0.07896804809570312, 0.08193016052246094, 0.08489227294921875, 0.08785438537597656, 0.09081649780273438, 0.09377861022949219, 0.09674072265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 3.0, 7.0, 3.0, 1.0, 8.0, 10.0, 7.0, 12.0, 17.0, 16.0, 30.0, 18.0, 27.0, 39.0, 35.0, 34.0, 29.0, 36.0, 39.0, 54.0, 41.0, 53.0, 62.0, 46.0, 40.0, 38.0, 38.0, 32.0, 46.0, 27.0, 22.0, 26.0, 20.0, 14.0, 12.0, 8.0, 10.0, 13.0, 6.0, 6.0, 6.0, 6.0, 5.0, 0.0, 0.0, 4.0, 3.0, 3.0], "bins": [-0.1375732421875, -0.1339397430419922, -0.13030624389648438, -0.12667274475097656, -0.12303924560546875, -0.11940574645996094, -0.11577224731445312, -0.11213874816894531, -0.1085052490234375, -0.10487174987792969, -0.10123825073242188, -0.09760475158691406, -0.09397125244140625, -0.09033775329589844, -0.08670425415039062, -0.08307075500488281, -0.079437255859375, -0.07580375671386719, -0.07217025756835938, -0.06853675842285156, -0.06490325927734375, -0.06126976013183594, -0.057636260986328125, -0.05400276184082031, -0.0503692626953125, -0.04673576354980469, -0.043102264404296875, -0.03946876525878906, -0.03583526611328125, -0.03220176696777344, -0.028568267822265625, -0.024934768676757812, -0.02130126953125, -0.017667770385742188, -0.014034271240234375, -0.010400772094726562, -0.00676727294921875, -0.0031337738037109375, 0.000499725341796875, 0.0041332244873046875, 0.0077667236328125, 0.011400222778320312, 0.015033721923828125, 0.018667221069335938, 0.02230072021484375, 0.025934219360351562, 0.029567718505859375, 0.03320121765136719, 0.036834716796875, 0.04046821594238281, 0.044101715087890625, 0.04773521423339844, 0.05136871337890625, 0.05500221252441406, 0.058635711669921875, 0.06226921081542969, 0.0659027099609375, 0.06953620910644531, 0.07316970825195312, 0.07680320739746094, 0.08043670654296875, 0.08407020568847656, 0.08770370483398438, 0.09133720397949219, 0.094970703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 5.0, 7.0, 10.0, 8.0, 13.0, 19.0, 24.0, 26.0, 42.0, 51.0, 63.0, 117.0, 130.0, 190.0, 319.0, 460.0, 694.0, 1099.0, 1853.0, 3329.0, 8501.0, 290807.0, 713853.0, 16743.0, 4235.0, 2250.0, 1233.0, 778.0, 535.0, 322.0, 219.0, 172.0, 121.0, 85.0, 52.0, 48.0, 39.0, 19.0, 28.0, 11.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.2476654052734375, -0.239715576171875, -0.2317657470703125, -0.22381591796875, -0.2158660888671875, -0.207916259765625, -0.1999664306640625, -0.1920166015625, -0.1840667724609375, -0.176116943359375, -0.1681671142578125, -0.16021728515625, -0.1522674560546875, -0.144317626953125, -0.1363677978515625, -0.12841796875, -0.1204681396484375, -0.112518310546875, -0.1045684814453125, -0.09661865234375, -0.0886688232421875, -0.080718994140625, -0.0727691650390625, -0.0648193359375, -0.0568695068359375, -0.048919677734375, -0.0409698486328125, -0.03302001953125, -0.0250701904296875, -0.017120361328125, -0.0091705322265625, -0.001220703125, 0.0067291259765625, 0.014678955078125, 0.0226287841796875, 0.03057861328125, 0.0385284423828125, 0.046478271484375, 0.0544281005859375, 0.0623779296875, 0.0703277587890625, 0.078277587890625, 0.0862274169921875, 0.09417724609375, 0.1021270751953125, 0.110076904296875, 0.1180267333984375, 0.1259765625, 0.1339263916015625, 0.141876220703125, 0.1498260498046875, 0.15777587890625, 0.1657257080078125, 0.173675537109375, 0.1816253662109375, 0.1895751953125, 0.1975250244140625, 0.205474853515625, 0.2134246826171875, 0.22137451171875, 0.2293243408203125, 0.237274169921875, 0.2452239990234375, 0.253173828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 9.0, 21.0, 65.0, 146.0, 351.0, 267.0, 83.0, 26.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.820556104183197e-05, -8.551403880119324e-05, -8.28225165605545e-05, -8.013099431991577e-05, -7.743947207927704e-05, -7.47479498386383e-05, -7.205642759799957e-05, -6.936490535736084e-05, -6.667338311672211e-05, -6.398186087608337e-05, -6.129033863544464e-05, -5.859881639480591e-05, -5.5907294154167175e-05, -5.321577191352844e-05, -5.052424967288971e-05, -4.7832727432250977e-05, -4.5141205191612244e-05, -4.244968295097351e-05, -3.975816071033478e-05, -3.7066638469696045e-05, -3.437511622905731e-05, -3.168359398841858e-05, -2.8992071747779846e-05, -2.6300549507141113e-05, -2.360902726650238e-05, -2.0917505025863647e-05, -1.8225982785224915e-05, -1.553446054458618e-05, -1.2842938303947449e-05, -1.0151416063308716e-05, -7.459893822669983e-06, -4.76837158203125e-06, -2.076849341392517e-06, 6.146728992462158e-07, 3.3061951398849487e-06, 5.997717380523682e-06, 8.689239621162415e-06, 1.1380761861801147e-05, 1.407228410243988e-05, 1.6763806343078613e-05, 1.9455328583717346e-05, 2.214685082435608e-05, 2.4838373064994812e-05, 2.7529895305633545e-05, 3.0221417546272278e-05, 3.291293978691101e-05, 3.5604462027549744e-05, 3.8295984268188477e-05, 4.098750650882721e-05, 4.367902874946594e-05, 4.6370550990104675e-05, 4.906207323074341e-05, 5.175359547138214e-05, 5.4445117712020874e-05, 5.713663995265961e-05, 5.982816219329834e-05, 6.251968443393707e-05, 6.52112066745758e-05, 6.790272891521454e-05, 7.059425115585327e-05, 7.3285773396492e-05, 7.597729563713074e-05, 7.866881787776947e-05, 8.13603401184082e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 13.0, 25.0, 21.0, 37.0, 53.0, 93.0, 126.0, 218.0, 335.0, 528.0, 826.0, 1429.0, 2527.0, 4421.0, 8088.0, 15209.0, 28230.0, 52026.0, 88985.0, 136323.0, 173692.0, 176317.0, 141684.0, 94370.0, 55518.0, 30548.0, 16374.0, 9052.0, 4964.0, 2728.0, 1481.0, 856.0, 522.0, 347.0, 173.0, 136.0, 88.0, 60.0, 32.0, 25.0, 22.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0262908935546875, -0.02544426918029785, -0.024597644805908203, -0.023751020431518555, -0.022904396057128906, -0.022057771682739258, -0.02121114730834961, -0.02036452293395996, -0.019517898559570312, -0.018671274185180664, -0.017824649810791016, -0.016978025436401367, -0.01613140106201172, -0.01528477668762207, -0.014438152313232422, -0.013591527938842773, -0.012744903564453125, -0.011898279190063477, -0.011051654815673828, -0.01020503044128418, -0.009358406066894531, -0.008511781692504883, -0.007665157318115234, -0.006818532943725586, -0.0059719085693359375, -0.005125284194946289, -0.004278659820556641, -0.003432035446166992, -0.0025854110717773438, -0.0017387866973876953, -0.0008921623229980469, -4.553794860839844e-05, 0.00080108642578125, 0.0016477108001708984, 0.002494335174560547, 0.0033409595489501953, 0.004187583923339844, 0.005034208297729492, 0.005880832672119141, 0.006727457046508789, 0.0075740814208984375, 0.008420705795288086, 0.009267330169677734, 0.010113954544067383, 0.010960578918457031, 0.01180720329284668, 0.012653827667236328, 0.013500452041625977, 0.014347076416015625, 0.015193700790405273, 0.016040325164794922, 0.01688694953918457, 0.01773357391357422, 0.018580198287963867, 0.019426822662353516, 0.020273447036743164, 0.021120071411132812, 0.02196669578552246, 0.02281332015991211, 0.023659944534301758, 0.024506568908691406, 0.025353193283081055, 0.026199817657470703, 0.02704644203186035, 0.02789306640625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 6.0, 5.0, 10.0, 8.0, 11.0, 16.0, 14.0, 18.0, 24.0, 37.0, 34.0, 36.0, 42.0, 41.0, 43.0, 46.0, 58.0, 42.0, 38.0, 53.0, 51.0, 55.0, 34.0, 39.0, 43.0, 35.0, 30.0, 19.0, 22.0, 15.0, 19.0, 14.0, 9.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02227783203125, -0.02154374122619629, -0.020809650421142578, -0.020075559616088867, -0.019341468811035156, -0.018607378005981445, -0.017873287200927734, -0.017139196395874023, -0.016405105590820312, -0.0156710147857666, -0.01493692398071289, -0.01420283317565918, -0.013468742370605469, -0.012734651565551758, -0.012000560760498047, -0.011266469955444336, -0.010532379150390625, -0.009798288345336914, -0.009064197540283203, -0.008330106735229492, -0.007596015930175781, -0.00686192512512207, -0.006127834320068359, -0.0053937435150146484, -0.0046596527099609375, -0.0039255619049072266, -0.0031914710998535156, -0.0024573802947998047, -0.0017232894897460938, -0.0009891986846923828, -0.0002551078796386719, 0.00047898292541503906, 0.00121307373046875, 0.001947164535522461, 0.002681255340576172, 0.003415346145629883, 0.004149436950683594, 0.004883527755737305, 0.005617618560791016, 0.0063517093658447266, 0.0070858001708984375, 0.007819890975952148, 0.00855398178100586, 0.00928807258605957, 0.010022163391113281, 0.010756254196166992, 0.011490345001220703, 0.012224435806274414, 0.012958526611328125, 0.013692617416381836, 0.014426708221435547, 0.015160799026489258, 0.01589488983154297, 0.01662898063659668, 0.01736307144165039, 0.0180971622467041, 0.018831253051757812, 0.019565343856811523, 0.020299434661865234, 0.021033525466918945, 0.021767616271972656, 0.022501707077026367, 0.023235797882080078, 0.02396988868713379, 0.0247039794921875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 17.0, 26.0, 39.0, 43.0, 71.0, 92.0, 90.0, 129.0, 112.0, 85.0, 69.0, 60.0, 56.0, 27.0, 20.0, 16.0, 12.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5351299047470093, -0.5216425657272339, -0.5081552863121033, -0.4946679472923279, -0.4811806082725525, -0.4676932990550995, -0.4542059898376465, -0.4407186508178711, -0.4272313117980957, -0.4137440025806427, -0.4002566635608673, -0.3867693543434143, -0.3732820153236389, -0.3597947061061859, -0.3463073968887329, -0.3328200578689575, -0.3193327486515045, -0.3058454394340515, -0.2923581004142761, -0.2788707911968231, -0.26538345217704773, -0.2518961429595947, -0.23840881884098053, -0.22492149472236633, -0.21143417060375214, -0.19794684648513794, -0.18445952236652374, -0.17097219824790955, -0.15748488903045654, -0.14399755001068115, -0.13051024079322815, -0.11702291667461395, -0.10353562235832214, -0.09004829823970795, -0.07656097412109375, -0.06307365745306015, -0.04958633333444595, -0.03609900921583176, -0.022611692547798157, -0.00912436842918396, 0.004362955689430237, 0.017850277945399284, 0.03133760020136833, 0.04482492059469223, 0.05831224471330643, 0.07179956883192062, 0.08528688549995422, 0.09877420961856842, 0.11226153373718262, 0.12574885785579681, 0.139236181974411, 0.152723491191864, 0.1662108302116394, 0.1796981394290924, 0.1931854635477066, 0.2066727876663208, 0.220160111784935, 0.2336474359035492, 0.2471347600221634, 0.2606220841407776, 0.2741093933582306, 0.287596732378006, 0.301084041595459, 0.3145713806152344, 0.3280586898326874]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 8.0, 12.0, 17.0, 15.0, 23.0, 18.0, 28.0, 25.0, 47.0, 37.0, 50.0, 36.0, 64.0, 43.0, 55.0, 48.0, 63.0, 38.0, 51.0, 33.0, 33.0, 34.0, 42.0, 22.0, 29.0, 22.0, 29.0, 30.0, 17.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31229859590530396, -0.2995697259902954, -0.28684088587760925, -0.2741120159626007, -0.26138317584991455, -0.248654305934906, -0.23592543601989746, -0.2231965810060501, -0.21046772599220276, -0.1977388709783554, -0.18501001596450806, -0.1722811460494995, -0.15955229103565216, -0.1468234360218048, -0.13409456610679626, -0.12136571109294891, -0.10863685607910156, -0.09590800106525421, -0.08317913860082626, -0.07045027613639832, -0.057721421122550964, -0.04499256610870361, -0.032263703644275665, -0.019534841179847717, -0.006805986166000366, 0.005922872573137283, 0.018651731312274933, 0.03138059005141258, 0.04410944879055023, 0.05683830380439758, 0.06956716626882553, 0.08229602873325348, 0.09502488374710083, 0.10775373876094818, 0.12048260122537613, 0.13321146368980408, 0.14594031870365143, 0.15866917371749878, 0.17139804363250732, 0.18412689864635468, 0.19685575366020203, 0.20958460867404938, 0.22231346368789673, 0.23504233360290527, 0.24777118861675262, 0.2605000436306, 0.2732289135456085, 0.2859577536582947, 0.2986866235733032, 0.31141549348831177, 0.3241443336009979, 0.33687320351600647, 0.3496020436286926, 0.36233091354370117, 0.3750597834587097, 0.38778865337371826, 0.4005174934864044, 0.41324636340141296, 0.4259752035140991, 0.43870407342910767, 0.4514329433441162, 0.46416178345680237, 0.4768906533718109, 0.48961949348449707, 0.5023483633995056]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 8.0, 9.0, 11.0, 14.0, 21.0, 19.0, 33.0, 40.0, 83.0, 128.0, 198.0, 354.0, 775.0, 1852.0, 4653.0, 13988.0, 53285.0, 317838.0, 2115805.0, 1452231.0, 181374.0, 35744.0, 9883.0, 3309.0, 1285.0, 569.0, 273.0, 147.0, 96.0, 58.0, 47.0, 33.0, 30.0, 11.0, 21.0, 10.0, 7.0, 7.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09918212890625, -0.09596824645996094, -0.09275436401367188, -0.08954048156738281, -0.08632659912109375, -0.08311271667480469, -0.07989883422851562, -0.07668495178222656, -0.0734710693359375, -0.07025718688964844, -0.06704330444335938, -0.06382942199707031, -0.06061553955078125, -0.05740165710449219, -0.054187774658203125, -0.05097389221191406, -0.047760009765625, -0.04454612731933594, -0.041332244873046875, -0.03811836242675781, -0.03490447998046875, -0.03169059753417969, -0.028476715087890625, -0.025262832641601562, -0.0220489501953125, -0.018835067749023438, -0.015621185302734375, -0.012407302856445312, -0.00919342041015625, -0.0059795379638671875, -0.002765655517578125, 0.0004482269287109375, 0.003662109375, 0.0068759918212890625, 0.010089874267578125, 0.013303756713867188, 0.01651763916015625, 0.019731521606445312, 0.022945404052734375, 0.026159286499023438, 0.0293731689453125, 0.03258705139160156, 0.035800933837890625, 0.03901481628417969, 0.04222869873046875, 0.04544258117675781, 0.048656463623046875, 0.05187034606933594, 0.055084228515625, 0.05829811096191406, 0.061511993408203125, 0.06472587585449219, 0.06793975830078125, 0.07115364074707031, 0.07436752319335938, 0.07758140563964844, 0.0807952880859375, 0.08400917053222656, 0.08722305297851562, 0.09043693542480469, 0.09365081787109375, 0.09686470031738281, 0.10007858276367188, 0.10329246520996094, 0.10650634765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 18.0, 19.0, 11.0, 13.0, 20.0, 17.0, 20.0, 30.0, 33.0, 49.0, 36.0, 43.0, 44.0, 41.0, 40.0, 35.0, 41.0, 43.0, 56.0, 42.0, 42.0, 44.0, 28.0, 30.0, 23.0, 21.0, 19.0, 21.0, 19.0, 24.0, 8.0, 10.0, 2.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.040069580078125, -0.03867959976196289, -0.03728961944580078, -0.03589963912963867, -0.03450965881347656, -0.03311967849731445, -0.031729698181152344, -0.030339717864990234, -0.028949737548828125, -0.027559757232666016, -0.026169776916503906, -0.024779796600341797, -0.023389816284179688, -0.021999835968017578, -0.02060985565185547, -0.01921987533569336, -0.01782989501953125, -0.01643991470336914, -0.015049934387207031, -0.013659954071044922, -0.012269973754882812, -0.010879993438720703, -0.009490013122558594, -0.008100032806396484, -0.006710052490234375, -0.005320072174072266, -0.003930091857910156, -0.002540111541748047, -0.0011501312255859375, 0.00023984909057617188, 0.0016298294067382812, 0.0030198097229003906, 0.0044097900390625, 0.005799770355224609, 0.007189750671386719, 0.008579730987548828, 0.009969711303710938, 0.011359691619873047, 0.012749671936035156, 0.014139652252197266, 0.015529632568359375, 0.016919612884521484, 0.018309593200683594, 0.019699573516845703, 0.021089553833007812, 0.022479534149169922, 0.02386951446533203, 0.02525949478149414, 0.02664947509765625, 0.02803945541381836, 0.02942943572998047, 0.030819416046142578, 0.03220939636230469, 0.0335993766784668, 0.034989356994628906, 0.036379337310791016, 0.037769317626953125, 0.039159297943115234, 0.040549278259277344, 0.04193925857543945, 0.04332923889160156, 0.04471921920776367, 0.04610919952392578, 0.04749917984008789, 0.04888916015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 6.0, 8.0, 14.0, 9.0, 22.0, 31.0, 66.0, 89.0, 160.0, 268.0, 463.0, 1110.0, 2962.0, 9416.0, 35878.0, 153119.0, 715646.0, 2104488.0, 914082.0, 193769.0, 44828.0, 11577.0, 3624.0, 1299.0, 576.0, 307.0, 178.0, 93.0, 67.0, 45.0, 27.0, 26.0, 9.0, 5.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.12213134765625, -0.11879253387451172, -0.11545372009277344, -0.11211490631103516, -0.10877609252929688, -0.1054372787475586, -0.10209846496582031, -0.09875965118408203, -0.09542083740234375, -0.09208202362060547, -0.08874320983886719, -0.0854043960571289, -0.08206558227539062, -0.07872676849365234, -0.07538795471191406, -0.07204914093017578, -0.0687103271484375, -0.06537151336669922, -0.06203269958496094, -0.058693885803222656, -0.055355072021484375, -0.052016258239746094, -0.04867744445800781, -0.04533863067626953, -0.04199981689453125, -0.03866100311279297, -0.03532218933105469, -0.031983375549316406, -0.028644561767578125, -0.025305747985839844, -0.021966934204101562, -0.01862812042236328, -0.015289306640625, -0.011950492858886719, -0.008611679077148438, -0.005272865295410156, -0.001934051513671875, 0.0014047622680664062, 0.0047435760498046875, 0.008082389831542969, 0.01142120361328125, 0.014760017395019531, 0.018098831176757812, 0.021437644958496094, 0.024776458740234375, 0.028115272521972656, 0.03145408630371094, 0.03479290008544922, 0.0381317138671875, 0.04147052764892578, 0.04480934143066406, 0.048148155212402344, 0.051486968994140625, 0.054825782775878906, 0.05816459655761719, 0.06150341033935547, 0.06484222412109375, 0.06818103790283203, 0.07151985168457031, 0.0748586654663086, 0.07819747924804688, 0.08153629302978516, 0.08487510681152344, 0.08821392059326172, 0.091552734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 11.0, 9.0, 16.0, 18.0, 17.0, 39.0, 67.0, 58.0, 77.0, 114.0, 146.0, 182.0, 249.0, 272.0, 395.0, 446.0, 396.0, 363.0, 270.0, 196.0, 162.0, 127.0, 100.0, 76.0, 59.0, 42.0, 43.0, 40.0, 18.0, 23.0, 11.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.07478141784667969, -0.07235336303710938, -0.06992530822753906, -0.06749725341796875, -0.06506919860839844, -0.06264114379882812, -0.06021308898925781, -0.0577850341796875, -0.05535697937011719, -0.052928924560546875, -0.05050086975097656, -0.04807281494140625, -0.04564476013183594, -0.043216705322265625, -0.04078865051269531, -0.038360595703125, -0.03593254089355469, -0.033504486083984375, -0.031076431274414062, -0.02864837646484375, -0.026220321655273438, -0.023792266845703125, -0.021364212036132812, -0.0189361572265625, -0.016508102416992188, -0.014080047607421875, -0.011651992797851562, -0.00922393798828125, -0.0067958831787109375, -0.004367828369140625, -0.0019397735595703125, 0.00048828125, 0.0029163360595703125, 0.005344390869140625, 0.0077724456787109375, 0.01020050048828125, 0.012628555297851562, 0.015056610107421875, 0.017484664916992188, 0.0199127197265625, 0.022340774536132812, 0.024768829345703125, 0.027196884155273438, 0.02962493896484375, 0.03205299377441406, 0.034481048583984375, 0.03690910339355469, 0.039337158203125, 0.04176521301269531, 0.044193267822265625, 0.04662132263183594, 0.04904937744140625, 0.05147743225097656, 0.053905487060546875, 0.05633354187011719, 0.0587615966796875, 0.06118965148925781, 0.06361770629882812, 0.06604576110839844, 0.06847381591796875, 0.07090187072753906, 0.07332992553710938, 0.07575798034667969, 0.07818603515625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 3.0, 5.0, 6.0, 14.0, 12.0, 17.0, 14.0, 29.0, 22.0, 43.0, 43.0, 50.0, 57.0, 55.0, 49.0, 54.0, 56.0, 57.0, 48.0, 63.0, 54.0, 50.0, 41.0, 33.0, 23.0, 19.0, 21.0, 12.0, 15.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.25628912448883057, -0.24867519736289978, -0.2410612851381302, -0.2334473729133606, -0.2258334457874298, -0.21821951866149902, -0.21060560643672943, -0.20299169421195984, -0.19537776708602905, -0.18776383996009827, -0.18014992773532867, -0.17253601551055908, -0.1649220883846283, -0.1573081612586975, -0.14969424903392792, -0.14208033680915833, -0.13446640968322754, -0.12685248255729675, -0.11923857033252716, -0.11162465065717697, -0.10401073098182678, -0.09639681130647659, -0.0887828916311264, -0.08116897195577621, -0.07355505228042603, -0.06594113260507584, -0.05832721292972565, -0.05071329325437546, -0.04309937357902527, -0.03548545390367508, -0.02787153422832489, -0.0202576145529747, -0.012643679976463318, -0.005029760301113129, 0.0025841593742370605, 0.01019807904958725, 0.01781199872493744, 0.025425918400287628, 0.03303983807563782, 0.04065375775098801, 0.048267677426338196, 0.055881597101688385, 0.06349551677703857, 0.07110943645238876, 0.07872335612773895, 0.08633727580308914, 0.09395119547843933, 0.10156511515378952, 0.10917903482913971, 0.1167929545044899, 0.12440687417984009, 0.13202080130577087, 0.13963471353054047, 0.14724862575531006, 0.15486255288124084, 0.16247648000717163, 0.17009039223194122, 0.17770430445671082, 0.1853182315826416, 0.1929321587085724, 0.20054607093334198, 0.20815998315811157, 0.21577391028404236, 0.22338783740997314, 0.23100174963474274]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 9.0, 8.0, 5.0, 9.0, 12.0, 19.0, 12.0, 21.0, 10.0, 20.0, 25.0, 37.0, 34.0, 23.0, 34.0, 46.0, 34.0, 56.0, 47.0, 38.0, 41.0, 34.0, 35.0, 45.0, 41.0, 27.0, 40.0, 25.0, 35.0, 26.0, 24.0, 16.0, 13.0, 23.0, 9.0, 8.0, 9.0, 6.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-0.27842628955841064, -0.2706246078014374, -0.2628229260444641, -0.25502124428749084, -0.24721956253051758, -0.2394178807735443, -0.23161618411540985, -0.22381450235843658, -0.21601282060146332, -0.20821113884449005, -0.20040945708751678, -0.19260777533054352, -0.18480607867240906, -0.1770043969154358, -0.16920271515846252, -0.16140103340148926, -0.153599351644516, -0.14579766988754272, -0.13799598813056946, -0.1301943063735962, -0.12239261716604233, -0.11459093540906906, -0.1067892462015152, -0.09898756444454193, -0.09118588268756866, -0.0833842009305954, -0.07558251917362213, -0.06778082996606827, -0.059979148209095, -0.052177466452121735, -0.04437578096985817, -0.036574095487594604, -0.028772413730621338, -0.020970730111002922, -0.013169046491384506, -0.00536736287176609, 0.0024343207478523254, 0.010236002504825592, 0.018037687987089157, 0.025839373469352722, 0.03364105522632599, 0.041442736983299255, 0.04924442246556282, 0.057046107947826385, 0.06484778970479965, 0.07264947146177292, 0.08045116066932678, 0.08825284242630005, 0.09605452418327332, 0.10385620594024658, 0.11165788769721985, 0.11945957690477371, 0.12726125121116638, 0.13506293296813965, 0.1428646296262741, 0.15066631138324738, 0.15846799314022064, 0.1662696748971939, 0.17407135665416718, 0.18187303841114044, 0.1896747350692749, 0.19747641682624817, 0.20527809858322144, 0.2130797803401947, 0.22088146209716797]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 20.0, 30.0, 37.0, 77.0, 136.0, 179.0, 351.0, 570.0, 999.0, 1879.0, 3326.0, 6035.0, 11024.0, 20696.0, 38949.0, 73518.0, 131992.0, 198324.0, 212561.0, 154872.0, 89970.0, 47616.0, 25065.0, 13415.0, 7483.0, 4072.0, 2293.0, 1297.0, 696.0, 417.0, 258.0, 140.0, 76.0, 54.0, 39.0, 27.0, 13.0, 11.0, 4.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0865478515625, -0.08358001708984375, -0.0806121826171875, -0.07764434814453125, -0.074676513671875, -0.07170867919921875, -0.0687408447265625, -0.06577301025390625, -0.06280517578125, -0.05983734130859375, -0.0568695068359375, -0.05390167236328125, -0.050933837890625, -0.04796600341796875, -0.0449981689453125, -0.04203033447265625, -0.0390625, -0.03609466552734375, -0.0331268310546875, -0.03015899658203125, -0.027191162109375, -0.02422332763671875, -0.0212554931640625, -0.01828765869140625, -0.01531982421875, -0.01235198974609375, -0.0093841552734375, -0.00641632080078125, -0.003448486328125, -0.00048065185546875, 0.0024871826171875, 0.00545501708984375, 0.0084228515625, 0.01139068603515625, 0.0143585205078125, 0.01732635498046875, 0.020294189453125, 0.02326202392578125, 0.0262298583984375, 0.02919769287109375, 0.03216552734375, 0.03513336181640625, 0.0381011962890625, 0.04106903076171875, 0.044036865234375, 0.04700469970703125, 0.0499725341796875, 0.05294036865234375, 0.055908203125, 0.05887603759765625, 0.0618438720703125, 0.06481170654296875, 0.067779541015625, 0.07074737548828125, 0.0737152099609375, 0.07668304443359375, 0.07965087890625, 0.08261871337890625, 0.0855865478515625, 0.08855438232421875, 0.091522216796875, 0.09449005126953125, 0.0974578857421875, 0.10042572021484375, 0.1033935546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 13.0, 7.0, 8.0, 13.0, 24.0, 20.0, 24.0, 31.0, 30.0, 35.0, 40.0, 40.0, 43.0, 48.0, 48.0, 48.0, 40.0, 61.0, 56.0, 50.0, 46.0, 37.0, 38.0, 26.0, 26.0, 27.0, 17.0, 20.0, 15.0, 13.0, 10.0, 7.0, 2.0, 6.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04876708984375, -0.047338008880615234, -0.04590892791748047, -0.0444798469543457, -0.04305076599121094, -0.04162168502807617, -0.040192604064941406, -0.03876352310180664, -0.037334442138671875, -0.03590536117553711, -0.034476280212402344, -0.03304719924926758, -0.03161811828613281, -0.030189037322998047, -0.02875995635986328, -0.027330875396728516, -0.02590179443359375, -0.024472713470458984, -0.02304363250732422, -0.021614551544189453, -0.020185470581054688, -0.018756389617919922, -0.017327308654785156, -0.01589822769165039, -0.014469146728515625, -0.01304006576538086, -0.011610984802246094, -0.010181903839111328, -0.008752822875976562, -0.007323741912841797, -0.005894660949707031, -0.004465579986572266, -0.0030364990234375, -0.0016074180603027344, -0.00017833709716796875, 0.0012507438659667969, 0.0026798248291015625, 0.004108905792236328, 0.005537986755371094, 0.006967067718505859, 0.008396148681640625, 0.00982522964477539, 0.011254310607910156, 0.012683391571044922, 0.014112472534179688, 0.015541553497314453, 0.01697063446044922, 0.018399715423583984, 0.01982879638671875, 0.021257877349853516, 0.02268695831298828, 0.024116039276123047, 0.025545120239257812, 0.026974201202392578, 0.028403282165527344, 0.02983236312866211, 0.031261444091796875, 0.03269052505493164, 0.034119606018066406, 0.03554868698120117, 0.03697776794433594, 0.0384068489074707, 0.03983592987060547, 0.041265010833740234, 0.042694091796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 6.0, 11.0, 23.0, 23.0, 39.0, 46.0, 63.0, 75.0, 118.0, 131.0, 166.0, 290.0, 442.0, 592.0, 915.0, 1653.0, 2959.0, 5648.0, 10620.0, 20525.0, 40564.0, 75553.0, 128827.0, 187954.0, 203478.0, 157046.0, 97748.0, 53718.0, 27847.0, 14436.0, 7237.0, 3999.0, 2063.0, 1322.0, 775.0, 456.0, 348.0, 228.0, 161.0, 120.0, 82.0, 55.0, 50.0, 37.0, 27.0, 23.0, 15.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0], "bins": [-0.0911865234375, -0.08844184875488281, -0.08569717407226562, -0.08295249938964844, -0.08020782470703125, -0.07746315002441406, -0.07471847534179688, -0.07197380065917969, -0.0692291259765625, -0.06648445129394531, -0.06373977661132812, -0.06099510192871094, -0.05825042724609375, -0.05550575256347656, -0.052761077880859375, -0.05001640319824219, -0.047271728515625, -0.04452705383300781, -0.041782379150390625, -0.03903770446777344, -0.03629302978515625, -0.03354835510253906, -0.030803680419921875, -0.028059005737304688, -0.0253143310546875, -0.022569656372070312, -0.019824981689453125, -0.017080307006835938, -0.01433563232421875, -0.011590957641601562, -0.008846282958984375, -0.0061016082763671875, -0.00335693359375, -0.0006122589111328125, 0.002132415771484375, 0.0048770904541015625, 0.00762176513671875, 0.010366439819335938, 0.013111114501953125, 0.015855789184570312, 0.0186004638671875, 0.021345138549804688, 0.024089813232421875, 0.026834487915039062, 0.02957916259765625, 0.03232383728027344, 0.035068511962890625, 0.03781318664550781, 0.040557861328125, 0.04330253601074219, 0.046047210693359375, 0.04879188537597656, 0.05153656005859375, 0.05428123474121094, 0.057025909423828125, 0.05977058410644531, 0.0625152587890625, 0.06525993347167969, 0.06800460815429688, 0.07074928283691406, 0.07349395751953125, 0.07623863220214844, 0.07898330688476562, 0.08172798156738281, 0.08447265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 2.0, 6.0, 7.0, 4.0, 11.0, 6.0, 14.0, 19.0, 18.0, 22.0, 27.0, 31.0, 30.0, 26.0, 44.0, 36.0, 48.0, 39.0, 47.0, 45.0, 33.0, 40.0, 53.0, 36.0, 34.0, 41.0, 43.0, 31.0, 34.0, 23.0, 22.0, 15.0, 20.0, 17.0, 14.0, 5.0, 12.0, 7.0, 10.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1134033203125, -0.10993003845214844, -0.10645675659179688, -0.10298347473144531, -0.09951019287109375, -0.09603691101074219, -0.09256362915039062, -0.08909034729003906, -0.0856170654296875, -0.08214378356933594, -0.07867050170898438, -0.07519721984863281, -0.07172393798828125, -0.06825065612792969, -0.06477737426757812, -0.06130409240722656, -0.057830810546875, -0.05435752868652344, -0.050884246826171875, -0.04741096496582031, -0.04393768310546875, -0.04046440124511719, -0.036991119384765625, -0.03351783752441406, -0.0300445556640625, -0.026571273803710938, -0.023097991943359375, -0.019624710083007812, -0.01615142822265625, -0.012678146362304688, -0.009204864501953125, -0.0057315826416015625, -0.00225830078125, 0.0012149810791015625, 0.004688262939453125, 0.008161544799804688, 0.01163482666015625, 0.015108108520507812, 0.018581390380859375, 0.022054672241210938, 0.0255279541015625, 0.029001235961914062, 0.032474517822265625, 0.03594779968261719, 0.03942108154296875, 0.04289436340332031, 0.046367645263671875, 0.04984092712402344, 0.053314208984375, 0.05678749084472656, 0.060260772705078125, 0.06373405456542969, 0.06720733642578125, 0.07068061828613281, 0.07415390014648438, 0.07762718200683594, 0.0811004638671875, 0.08457374572753906, 0.08804702758789062, 0.09152030944824219, 0.09499359130859375, 0.09846687316894531, 0.10194015502929688, 0.10541343688964844, 0.10888671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 2.0, 8.0, 16.0, 22.0, 32.0, 62.0, 118.0, 193.0, 320.0, 718.0, 1788.0, 4370.0, 12666.0, 39622.0, 130455.0, 327598.0, 332702.0, 135435.0, 41554.0, 13125.0, 4385.0, 1749.0, 766.0, 369.0, 193.0, 99.0, 63.0, 45.0, 32.0, 10.0, 8.0, 9.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.061920166015625, -0.060410499572753906, -0.05890083312988281, -0.05739116668701172, -0.055881500244140625, -0.05437183380126953, -0.05286216735839844, -0.051352500915527344, -0.04984283447265625, -0.048333168029785156, -0.04682350158691406, -0.04531383514404297, -0.043804168701171875, -0.04229450225830078, -0.04078483581542969, -0.039275169372558594, -0.0377655029296875, -0.036255836486816406, -0.03474617004394531, -0.03323650360107422, -0.031726837158203125, -0.03021717071533203, -0.028707504272460938, -0.027197837829589844, -0.02568817138671875, -0.024178504943847656, -0.022668838500976562, -0.02115917205810547, -0.019649505615234375, -0.01813983917236328, -0.016630172729492188, -0.015120506286621094, -0.01361083984375, -0.012101173400878906, -0.010591506958007812, -0.009081840515136719, -0.007572174072265625, -0.006062507629394531, -0.0045528411865234375, -0.0030431747436523438, -0.00153350830078125, -2.384185791015625e-05, 0.0014858245849609375, 0.0029954910278320312, 0.004505157470703125, 0.006014823913574219, 0.0075244903564453125, 0.009034156799316406, 0.0105438232421875, 0.012053489685058594, 0.013563156127929688, 0.015072822570800781, 0.016582489013671875, 0.01809215545654297, 0.019601821899414062, 0.021111488342285156, 0.02262115478515625, 0.024130821228027344, 0.025640487670898438, 0.02715015411376953, 0.028659820556640625, 0.03016948699951172, 0.03167915344238281, 0.033188819885253906, 0.034698486328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 9.0, 8.0, 12.0, 19.0, 20.0, 30.0, 36.0, 21.0, 44.0, 40.0, 32.0, 47.0, 62.0, 53.0, 45.0, 64.0, 51.0, 51.0, 43.0, 45.0, 32.0, 36.0, 32.0, 34.0, 24.0, 14.0, 14.0, 8.0, 11.0, 12.0, 7.0, 3.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1269934475421906e-05, -1.091696321964264e-05, -1.0563991963863373e-05, -1.0211020708084106e-05, -9.85804945230484e-06, -9.505078196525574e-06, -9.152106940746307e-06, -8.799135684967041e-06, -8.446164429187775e-06, -8.093193173408508e-06, -7.740221917629242e-06, -7.387250661849976e-06, -7.034279406070709e-06, -6.681308150291443e-06, -6.3283368945121765e-06, -5.97536563873291e-06, -5.622394382953644e-06, -5.2694231271743774e-06, -4.916451871395111e-06, -4.563480615615845e-06, -4.210509359836578e-06, -3.857538104057312e-06, -3.5045668482780457e-06, -3.1515955924987793e-06, -2.798624336719513e-06, -2.4456530809402466e-06, -2.0926818251609802e-06, -1.7397105693817139e-06, -1.3867393136024475e-06, -1.0337680578231812e-06, -6.807968020439148e-07, -3.2782554626464844e-07, 2.514570951461792e-08, 3.781169652938843e-07, 7.310882210731506e-07, 1.084059476852417e-06, 1.4370307326316833e-06, 1.7900019884109497e-06, 2.142973244190216e-06, 2.4959444999694824e-06, 2.8489157557487488e-06, 3.201887011528015e-06, 3.5548582673072815e-06, 3.907829523086548e-06, 4.260800778865814e-06, 4.6137720346450806e-06, 4.966743290424347e-06, 5.319714546203613e-06, 5.67268580198288e-06, 6.025657057762146e-06, 6.378628313541412e-06, 6.731599569320679e-06, 7.084570825099945e-06, 7.4375420808792114e-06, 7.790513336658478e-06, 8.143484592437744e-06, 8.49645584821701e-06, 8.849427103996277e-06, 9.202398359775543e-06, 9.55536961555481e-06, 9.908340871334076e-06, 1.0261312127113342e-05, 1.0614283382892609e-05, 1.0967254638671875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 26.0, 35.0, 41.0, 93.0, 123.0, 202.0, 341.0, 608.0, 1232.0, 2687.0, 6580.0, 17298.0, 48088.0, 136494.0, 301161.0, 309109.0, 143326.0, 50473.0, 18069.0, 6946.0, 2800.0, 1238.0, 620.0, 351.0, 218.0, 137.0, 92.0, 53.0, 29.0, 19.0, 14.0, 14.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044342041015625, -0.04303884506225586, -0.04173564910888672, -0.04043245315551758, -0.03912925720214844, -0.0378260612487793, -0.036522865295410156, -0.035219669342041016, -0.033916473388671875, -0.032613277435302734, -0.031310081481933594, -0.030006885528564453, -0.028703689575195312, -0.027400493621826172, -0.02609729766845703, -0.02479410171508789, -0.02349090576171875, -0.02218770980834961, -0.02088451385498047, -0.019581317901611328, -0.018278121948242188, -0.016974925994873047, -0.015671730041503906, -0.014368534088134766, -0.013065338134765625, -0.011762142181396484, -0.010458946228027344, -0.009155750274658203, -0.007852554321289062, -0.006549358367919922, -0.005246162414550781, -0.003942966461181641, -0.0026397705078125, -0.0013365745544433594, -3.337860107421875e-05, 0.0012698173522949219, 0.0025730133056640625, 0.003876209259033203, 0.005179405212402344, 0.006482601165771484, 0.007785797119140625, 0.009088993072509766, 0.010392189025878906, 0.011695384979248047, 0.012998580932617188, 0.014301776885986328, 0.015604972839355469, 0.01690816879272461, 0.01821136474609375, 0.01951456069946289, 0.02081775665283203, 0.022120952606201172, 0.023424148559570312, 0.024727344512939453, 0.026030540466308594, 0.027333736419677734, 0.028636932373046875, 0.029940128326416016, 0.031243324279785156, 0.0325465202331543, 0.03384971618652344, 0.03515291213989258, 0.03645610809326172, 0.03775930404663086, 0.0390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 9.0, 13.0, 16.0, 28.0, 29.0, 20.0, 31.0, 42.0, 39.0, 44.0, 48.0, 67.0, 59.0, 54.0, 54.0, 48.0, 55.0, 60.0, 41.0, 27.0, 35.0, 32.0, 24.0, 12.0, 8.0, 14.0, 12.0, 13.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.026885986328125, -0.026116132736206055, -0.02534627914428711, -0.024576425552368164, -0.02380657196044922, -0.023036718368530273, -0.022266864776611328, -0.021497011184692383, -0.020727157592773438, -0.019957304000854492, -0.019187450408935547, -0.0184175968170166, -0.017647743225097656, -0.01687788963317871, -0.016108036041259766, -0.01533818244934082, -0.014568328857421875, -0.01379847526550293, -0.013028621673583984, -0.012258768081665039, -0.011488914489746094, -0.010719060897827148, -0.009949207305908203, -0.009179353713989258, -0.008409500122070312, -0.007639646530151367, -0.006869792938232422, -0.0060999393463134766, -0.005330085754394531, -0.004560232162475586, -0.0037903785705566406, -0.0030205249786376953, -0.00225067138671875, -0.0014808177947998047, -0.0007109642028808594, 5.888938903808594e-05, 0.0008287429809570312, 0.0015985965728759766, 0.002368450164794922, 0.003138303756713867, 0.0039081573486328125, 0.004678010940551758, 0.005447864532470703, 0.0062177181243896484, 0.006987571716308594, 0.007757425308227539, 0.008527278900146484, 0.00929713249206543, 0.010066986083984375, 0.01083683967590332, 0.011606693267822266, 0.012376546859741211, 0.013146400451660156, 0.013916254043579102, 0.014686107635498047, 0.015455961227416992, 0.016225814819335938, 0.016995668411254883, 0.017765522003173828, 0.018535375595092773, 0.01930522918701172, 0.020075082778930664, 0.02084493637084961, 0.021614789962768555, 0.0223846435546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 9.0, 17.0, 12.0, 21.0, 27.0, 47.0, 70.0, 78.0, 87.0, 121.0, 109.0, 100.0, 79.0, 69.0, 44.0, 32.0, 22.0, 15.0, 12.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4154208302497864, -0.4028823971748352, -0.39034396409988403, -0.37780553102493286, -0.3652670979499817, -0.3527286648750305, -0.34019023180007935, -0.3276517987251282, -0.315113365650177, -0.30257493257522583, -0.29003649950027466, -0.2774980664253235, -0.2649596333503723, -0.25242120027542114, -0.23988276720046997, -0.2273443341255188, -0.21480591595172882, -0.20226748287677765, -0.18972904980182648, -0.1771906167268753, -0.16465218365192413, -0.15211376547813416, -0.13957533240318298, -0.1270368993282318, -0.11449845880270004, -0.10196002572774887, -0.0894215926527977, -0.07688316702842712, -0.06434473395347595, -0.05180630087852478, -0.03926786780357361, -0.026729434728622437, -0.014191001653671265, -0.0016525695100426674, 0.01088586263358593, 0.023424293845891953, 0.035962726920843124, 0.048501156270504, 0.06103958934545517, 0.07357802242040634, 0.08611645549535751, 0.09865488857030869, 0.11119332164525986, 0.12373174726963043, 0.1362701803445816, 0.14880861341953278, 0.16134704649448395, 0.17388547956943512, 0.1864239126443863, 0.19896234571933746, 0.21150077879428864, 0.2240392118692398, 0.23657764494419098, 0.24911606311798096, 0.26165449619293213, 0.2741929292678833, 0.2867313623428345, 0.29926979541778564, 0.3118082284927368, 0.324346661567688, 0.33688509464263916, 0.34942352771759033, 0.3619619607925415, 0.3745003938674927, 0.38703882694244385]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 13.0, 12.0, 16.0, 17.0, 16.0, 25.0, 27.0, 28.0, 32.0, 32.0, 41.0, 37.0, 34.0, 51.0, 59.0, 36.0, 40.0, 52.0, 50.0, 41.0, 42.0, 40.0, 36.0, 34.0, 26.0, 23.0, 24.0, 23.0, 18.0, 12.0, 13.0, 9.0, 9.0, 2.0, 8.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.3773934841156006, -0.36669328808784485, -0.3559931218624115, -0.34529292583465576, -0.3345927596092224, -0.3238925635814667, -0.31319236755371094, -0.3024922013282776, -0.29179200530052185, -0.2810918092727661, -0.27039164304733276, -0.259691447019577, -0.24899126589298248, -0.23829108476638794, -0.2275909036397934, -0.21689072251319885, -0.2061905413866043, -0.19549036026000977, -0.18479017913341522, -0.17408999800682068, -0.16338980197906494, -0.1526896208524704, -0.14198943972587585, -0.13128924369812012, -0.12058907002210617, -0.10988888889551163, -0.09918870031833649, -0.08848851919174194, -0.0777883380651474, -0.06708814948797226, -0.056387968361377716, -0.045687779784202576, -0.03498759865760803, -0.02428741380572319, -0.013587230816483498, -0.002887047827243805, 0.007813137024641037, 0.01851332187652588, 0.029213503003120422, 0.03991369158029556, 0.050613872706890106, 0.06131405755877495, 0.07201424241065979, 0.08271442353725433, 0.09341460466384888, 0.10411479324102402, 0.11481497436761856, 0.1255151629447937, 0.13621534407138824, 0.1469155251979828, 0.15761570632457733, 0.16831588745117188, 0.1790160834789276, 0.18971626460552216, 0.2004164457321167, 0.21111664175987244, 0.2218168079853058, 0.23251698911190033, 0.24321717023849487, 0.2539173662662506, 0.26461753249168396, 0.2753177285194397, 0.28601789474487305, 0.2967180907726288, 0.3074182868003845]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 10.0, 13.0, 19.0, 41.0, 63.0, 100.0, 178.0, 286.0, 605.0, 1250.0, 2869.0, 6743.0, 17512.0, 55237.0, 239483.0, 1479248.0, 1930548.0, 348936.0, 74394.0, 22720.0, 7994.0, 3386.0, 1407.0, 624.0, 283.0, 157.0, 64.0, 56.0, 23.0, 15.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08441543579101562, -0.08161163330078125, -0.07880783081054688, -0.0760040283203125, -0.07320022583007812, -0.07039642333984375, -0.06759262084960938, -0.064788818359375, -0.061985015869140625, -0.05918121337890625, -0.056377410888671875, -0.0535736083984375, -0.050769805908203125, -0.04796600341796875, -0.045162200927734375, -0.0423583984375, -0.039554595947265625, -0.03675079345703125, -0.033946990966796875, -0.0311431884765625, -0.028339385986328125, -0.02553558349609375, -0.022731781005859375, -0.019927978515625, -0.017124176025390625, -0.01432037353515625, -0.011516571044921875, -0.0087127685546875, -0.005908966064453125, -0.00310516357421875, -0.000301361083984375, 0.00250244140625, 0.005306243896484375, 0.00811004638671875, 0.010913848876953125, 0.0137176513671875, 0.016521453857421875, 0.01932525634765625, 0.022129058837890625, 0.024932861328125, 0.027736663818359375, 0.03054046630859375, 0.033344268798828125, 0.0361480712890625, 0.038951873779296875, 0.04175567626953125, 0.044559478759765625, 0.04736328125, 0.050167083740234375, 0.05297088623046875, 0.055774688720703125, 0.0585784912109375, 0.061382293701171875, 0.06418609619140625, 0.06698989868164062, 0.069793701171875, 0.07259750366210938, 0.07540130615234375, 0.07820510864257812, 0.0810089111328125, 0.08381271362304688, 0.08661651611328125, 0.08942031860351562, 0.09222412109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 17.0, 11.0, 25.0, 15.0, 28.0, 32.0, 32.0, 51.0, 55.0, 43.0, 55.0, 62.0, 56.0, 51.0, 52.0, 53.0, 56.0, 41.0, 50.0, 32.0, 33.0, 25.0, 22.0, 24.0, 11.0, 15.0, 16.0, 11.0, 5.0, 4.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06146240234375, -0.059812068939208984, -0.05816173553466797, -0.05651140213012695, -0.05486106872558594, -0.05321073532104492, -0.051560401916503906, -0.04991006851196289, -0.048259735107421875, -0.04660940170288086, -0.044959068298339844, -0.04330873489379883, -0.04165840148925781, -0.0400080680847168, -0.03835773468017578, -0.036707401275634766, -0.03505706787109375, -0.033406734466552734, -0.03175640106201172, -0.030106067657470703, -0.028455734252929688, -0.026805400848388672, -0.025155067443847656, -0.02350473403930664, -0.021854400634765625, -0.02020406723022461, -0.018553733825683594, -0.016903400421142578, -0.015253067016601562, -0.013602733612060547, -0.011952400207519531, -0.010302066802978516, -0.0086517333984375, -0.007001399993896484, -0.005351066589355469, -0.003700733184814453, -0.0020503997802734375, -0.0004000663757324219, 0.0012502670288085938, 0.0029006004333496094, 0.004550933837890625, 0.006201267242431641, 0.007851600646972656, 0.009501934051513672, 0.011152267456054688, 0.012802600860595703, 0.014452934265136719, 0.016103267669677734, 0.01775360107421875, 0.019403934478759766, 0.02105426788330078, 0.022704601287841797, 0.024354934692382812, 0.026005268096923828, 0.027655601501464844, 0.02930593490600586, 0.030956268310546875, 0.03260660171508789, 0.034256935119628906, 0.03590726852416992, 0.03755760192871094, 0.03920793533325195, 0.04085826873779297, 0.042508602142333984, 0.044158935546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 2.0, 5.0, 9.0, 12.0, 15.0, 17.0, 39.0, 41.0, 70.0, 117.0, 209.0, 404.0, 873.0, 2420.0, 8613.0, 36115.0, 181502.0, 1088077.0, 2271951.0, 489348.0, 87709.0, 18978.0, 4910.0, 1543.0, 577.0, 288.0, 139.0, 101.0, 66.0, 44.0, 28.0, 17.0, 12.0, 14.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10552978515625, -0.10192584991455078, -0.09832191467285156, -0.09471797943115234, -0.09111404418945312, -0.0875101089477539, -0.08390617370605469, -0.08030223846435547, -0.07669830322265625, -0.07309436798095703, -0.06949043273925781, -0.0658864974975586, -0.062282562255859375, -0.058678627014160156, -0.05507469177246094, -0.05147075653076172, -0.0478668212890625, -0.04426288604736328, -0.04065895080566406, -0.037055015563964844, -0.033451080322265625, -0.029847145080566406, -0.026243209838867188, -0.02263927459716797, -0.01903533935546875, -0.015431404113769531, -0.011827468872070312, -0.008223533630371094, -0.004619598388671875, -0.0010156631469726562, 0.0025882720947265625, 0.006192207336425781, 0.009796142578125, 0.013400077819824219, 0.017004013061523438, 0.020607948303222656, 0.024211883544921875, 0.027815818786621094, 0.03141975402832031, 0.03502368927001953, 0.03862762451171875, 0.04223155975341797, 0.04583549499511719, 0.049439430236816406, 0.053043365478515625, 0.056647300720214844, 0.06025123596191406, 0.06385517120361328, 0.0674591064453125, 0.07106304168701172, 0.07466697692871094, 0.07827091217041016, 0.08187484741210938, 0.0854787826538086, 0.08908271789550781, 0.09268665313720703, 0.09629058837890625, 0.09989452362060547, 0.10349845886230469, 0.1071023941040039, 0.11070632934570312, 0.11431026458740234, 0.11791419982910156, 0.12151813507080078, 0.1251220703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 6.0, 9.0, 16.0, 23.0, 43.0, 26.0, 48.0, 74.0, 96.0, 144.0, 181.0, 261.0, 381.0, 434.0, 503.0, 471.0, 343.0, 278.0, 210.0, 151.0, 105.0, 60.0, 52.0, 43.0, 29.0, 28.0, 16.0, 5.0, 8.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07326126098632812, -0.07059478759765625, -0.06792831420898438, -0.0652618408203125, -0.06259536743164062, -0.05992889404296875, -0.057262420654296875, -0.054595947265625, -0.051929473876953125, -0.04926300048828125, -0.046596527099609375, -0.0439300537109375, -0.041263580322265625, -0.03859710693359375, -0.035930633544921875, -0.03326416015625, -0.030597686767578125, -0.02793121337890625, -0.025264739990234375, -0.0225982666015625, -0.019931793212890625, -0.01726531982421875, -0.014598846435546875, -0.011932373046875, -0.009265899658203125, -0.00659942626953125, -0.003932952880859375, -0.0012664794921875, 0.001399993896484375, 0.00406646728515625, 0.006732940673828125, 0.0093994140625, 0.012065887451171875, 0.01473236083984375, 0.017398834228515625, 0.0200653076171875, 0.022731781005859375, 0.02539825439453125, 0.028064727783203125, 0.030731201171875, 0.033397674560546875, 0.03606414794921875, 0.038730621337890625, 0.0413970947265625, 0.044063568115234375, 0.04673004150390625, 0.049396514892578125, 0.05206298828125, 0.054729461669921875, 0.05739593505859375, 0.060062408447265625, 0.0627288818359375, 0.06539535522460938, 0.06806182861328125, 0.07072830200195312, 0.073394775390625, 0.07606124877929688, 0.07872772216796875, 0.08139419555664062, 0.0840606689453125, 0.08672714233398438, 0.08939361572265625, 0.09206008911132812, 0.0947265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 25.0, 37.0, 62.0, 80.0, 116.0, 120.0, 127.0, 121.0, 120.0, 77.0, 41.0, 31.0, 16.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.584062933921814, -0.5669274926185608, -0.5497919917106628, -0.5326565504074097, -0.5155210494995117, -0.49838560819625854, -0.48125016689300537, -0.4641146957874298, -0.44697922468185425, -0.4298437535762787, -0.4127082824707031, -0.39557284116744995, -0.3784373700618744, -0.36130189895629883, -0.34416645765304565, -0.3270309865474701, -0.30989551544189453, -0.29276004433631897, -0.2756245732307434, -0.25848913192749023, -0.24135366082191467, -0.2242181897163391, -0.20708273351192474, -0.18994727730751038, -0.17281180620193481, -0.15567633509635925, -0.13854087889194489, -0.12140541523694992, -0.10426995158195496, -0.08713448792695999, -0.06999902427196503, -0.05286356061697006, -0.03572815656661987, -0.01859269291162491, -0.0014572292566299438, 0.01567823439836502, 0.032813698053359985, 0.04994916170835495, 0.06708462536334991, 0.08422008901834488, 0.10135555267333984, 0.11849101632833481, 0.13562647998332977, 0.15276193618774414, 0.1698974072933197, 0.18703287839889526, 0.20416833460330963, 0.221303790807724, 0.23843926191329956, 0.2555747330188751, 0.2727102041244507, 0.28984564542770386, 0.3069811165332794, 0.324116587638855, 0.34125202894210815, 0.3583875000476837, 0.3755229711532593, 0.39265844225883484, 0.4097939133644104, 0.4269293546676636, 0.44406482577323914, 0.4612002968788147, 0.47833573818206787, 0.49547120928764343, 0.512606680393219]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 9.0, 8.0, 9.0, 10.0, 10.0, 12.0, 21.0, 21.0, 19.0, 25.0, 20.0, 32.0, 34.0, 39.0, 42.0, 36.0, 33.0, 40.0, 36.0, 42.0, 45.0, 44.0, 53.0, 44.0, 29.0, 43.0, 31.0, 25.0, 23.0, 35.0, 26.0, 19.0, 13.0, 9.0, 14.0, 8.0, 8.0, 11.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2305338978767395, -0.22263604402542114, -0.21473820507526398, -0.20684035122394562, -0.19894251227378845, -0.1910446584224701, -0.18314680457115173, -0.17524895071983337, -0.1673511117696762, -0.15945325791835785, -0.15155541896820068, -0.14365756511688232, -0.13575971126556396, -0.1278618723154068, -0.11996401846408844, -0.11206617206335068, -0.10416832566261292, -0.09627047926187515, -0.08837263286113739, -0.08047477900981903, -0.07257693260908127, -0.0646790862083435, -0.056781236082315445, -0.048883385956287384, -0.04098553955554962, -0.03308769315481186, -0.025189843028783798, -0.017291994765400887, -0.009394146502017975, -0.0014963001012802124, 0.0064015500247478485, 0.01429940015077591, 0.022197246551513672, 0.030095094814896584, 0.037992943078279495, 0.045890793204307556, 0.05378863960504532, 0.06168648600578308, 0.06958433985710144, 0.0774821862578392, 0.08538003265857697, 0.09327787905931473, 0.10117572546005249, 0.10907357931137085, 0.11697142571210861, 0.12486927211284637, 0.13276712596416473, 0.1406649649143219, 0.14856281876564026, 0.15646067261695862, 0.16435851156711578, 0.17225636541843414, 0.1801542043685913, 0.18805205821990967, 0.19594991207122803, 0.2038477659225464, 0.21174560487270355, 0.2196434587240219, 0.22754129767417908, 0.23543915152549744, 0.2433370053768158, 0.25123482942581177, 0.2591326832771301, 0.2670305371284485, 0.27492839097976685]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 10.0, 19.0, 23.0, 25.0, 48.0, 73.0, 107.0, 195.0, 278.0, 435.0, 739.0, 1317.0, 2227.0, 3865.0, 6886.0, 12555.0, 21779.0, 39184.0, 69503.0, 116587.0, 173243.0, 196266.0, 160259.0, 104165.0, 60610.0, 33971.0, 19034.0, 10692.0, 6071.0, 3496.0, 1960.0, 1125.0, 673.0, 413.0, 255.0, 138.0, 92.0, 70.0, 38.0, 20.0, 27.0, 19.0, 12.0, 12.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.07568359375, -0.0732717514038086, -0.07085990905761719, -0.06844806671142578, -0.06603622436523438, -0.06362438201904297, -0.06121253967285156, -0.058800697326660156, -0.05638885498046875, -0.053977012634277344, -0.05156517028808594, -0.04915332794189453, -0.046741485595703125, -0.04432964324951172, -0.04191780090332031, -0.039505958557128906, -0.0370941162109375, -0.034682273864746094, -0.03227043151855469, -0.02985858917236328, -0.027446746826171875, -0.02503490447998047, -0.022623062133789062, -0.020211219787597656, -0.01779937744140625, -0.015387535095214844, -0.012975692749023438, -0.010563850402832031, -0.008152008056640625, -0.005740165710449219, -0.0033283233642578125, -0.0009164810180664062, 0.001495361328125, 0.003907203674316406, 0.0063190460205078125, 0.008730888366699219, 0.011142730712890625, 0.013554573059082031, 0.015966415405273438, 0.018378257751464844, 0.02079010009765625, 0.023201942443847656, 0.025613784790039062, 0.02802562713623047, 0.030437469482421875, 0.03284931182861328, 0.03526115417480469, 0.037672996520996094, 0.0400848388671875, 0.042496681213378906, 0.04490852355957031, 0.04732036590576172, 0.049732208251953125, 0.05214405059814453, 0.05455589294433594, 0.056967735290527344, 0.05937957763671875, 0.061791419982910156, 0.06420326232910156, 0.06661510467529297, 0.06902694702148438, 0.07143878936767578, 0.07385063171386719, 0.0762624740600586, 0.07867431640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 7.0, 9.0, 7.0, 16.0, 15.0, 22.0, 23.0, 25.0, 37.0, 36.0, 42.0, 35.0, 43.0, 52.0, 44.0, 45.0, 50.0, 49.0, 59.0, 40.0, 39.0, 52.0, 45.0, 39.0, 34.0, 21.0, 18.0, 16.0, 22.0, 14.0, 12.0, 9.0, 8.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.055450439453125, -0.054003238677978516, -0.05255603790283203, -0.05110883712768555, -0.04966163635253906, -0.04821443557739258, -0.046767234802246094, -0.04532003402709961, -0.043872833251953125, -0.04242563247680664, -0.040978431701660156, -0.03953123092651367, -0.03808403015136719, -0.0366368293762207, -0.03518962860107422, -0.033742427825927734, -0.03229522705078125, -0.030848026275634766, -0.02940082550048828, -0.027953624725341797, -0.026506423950195312, -0.025059223175048828, -0.023612022399902344, -0.02216482162475586, -0.020717620849609375, -0.01927042007446289, -0.017823219299316406, -0.016376018524169922, -0.014928817749023438, -0.013481616973876953, -0.012034416198730469, -0.010587215423583984, -0.0091400146484375, -0.007692813873291016, -0.006245613098144531, -0.004798412322998047, -0.0033512115478515625, -0.0019040107727050781, -0.00045680999755859375, 0.0009903907775878906, 0.002437591552734375, 0.0038847923278808594, 0.005331993103027344, 0.006779193878173828, 0.008226394653320312, 0.009673595428466797, 0.011120796203613281, 0.012567996978759766, 0.01401519775390625, 0.015462398529052734, 0.01690959930419922, 0.018356800079345703, 0.019804000854492188, 0.021251201629638672, 0.022698402404785156, 0.02414560317993164, 0.025592803955078125, 0.02704000473022461, 0.028487205505371094, 0.029934406280517578, 0.03138160705566406, 0.03282880783081055, 0.03427600860595703, 0.035723209381103516, 0.03717041015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 13.0, 22.0, 29.0, 43.0, 75.0, 124.0, 239.0, 391.0, 924.0, 2016.0, 4422.0, 10324.0, 23582.0, 50721.0, 103748.0, 186769.0, 246302.0, 200560.0, 113694.0, 56907.0, 26463.0, 11562.0, 5144.0, 2309.0, 1034.0, 500.0, 254.0, 128.0, 81.0, 51.0, 38.0, 11.0, 11.0, 15.0, 6.0, 12.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.122314453125, -0.11905956268310547, -0.11580467224121094, -0.1125497817993164, -0.10929489135742188, -0.10604000091552734, -0.10278511047363281, -0.09953022003173828, -0.09627532958984375, -0.09302043914794922, -0.08976554870605469, -0.08651065826416016, -0.08325576782226562, -0.0800008773803711, -0.07674598693847656, -0.07349109649658203, -0.0702362060546875, -0.06698131561279297, -0.06372642517089844, -0.060471534729003906, -0.057216644287109375, -0.053961753845214844, -0.05070686340332031, -0.04745197296142578, -0.04419708251953125, -0.04094219207763672, -0.03768730163574219, -0.034432411193847656, -0.031177520751953125, -0.027922630310058594, -0.024667739868164062, -0.02141284942626953, -0.018157958984375, -0.014903068542480469, -0.011648178100585938, -0.008393287658691406, -0.005138397216796875, -0.0018835067749023438, 0.0013713836669921875, 0.004626274108886719, 0.00788116455078125, 0.011136054992675781, 0.014390945434570312, 0.017645835876464844, 0.020900726318359375, 0.024155616760253906, 0.027410507202148438, 0.03066539764404297, 0.0339202880859375, 0.03717517852783203, 0.04043006896972656, 0.043684959411621094, 0.046939849853515625, 0.050194740295410156, 0.05344963073730469, 0.05670452117919922, 0.05995941162109375, 0.06321430206298828, 0.06646919250488281, 0.06972408294677734, 0.07297897338867188, 0.0762338638305664, 0.07948875427246094, 0.08274364471435547, 0.08599853515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 7.0, 10.0, 12.0, 13.0, 20.0, 19.0, 11.0, 18.0, 34.0, 38.0, 30.0, 29.0, 26.0, 29.0, 29.0, 46.0, 29.0, 37.0, 41.0, 35.0, 37.0, 45.0, 41.0, 45.0, 33.0, 39.0, 30.0, 19.0, 22.0, 22.0, 28.0, 17.0, 13.0, 12.0, 12.0, 5.0, 4.0, 6.0, 7.0, 5.0, 6.0, 2.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.093017578125, -0.08979034423828125, -0.0865631103515625, -0.08333587646484375, -0.080108642578125, -0.07688140869140625, -0.0736541748046875, -0.07042694091796875, -0.06719970703125, -0.06397247314453125, -0.0607452392578125, -0.05751800537109375, -0.054290771484375, -0.05106353759765625, -0.0478363037109375, -0.04460906982421875, -0.0413818359375, -0.03815460205078125, -0.0349273681640625, -0.03170013427734375, -0.028472900390625, -0.02524566650390625, -0.0220184326171875, -0.01879119873046875, -0.01556396484375, -0.01233673095703125, -0.0091094970703125, -0.00588226318359375, -0.002655029296875, 0.00057220458984375, 0.0037994384765625, 0.00702667236328125, 0.01025390625, 0.01348114013671875, 0.0167083740234375, 0.01993560791015625, 0.023162841796875, 0.02639007568359375, 0.0296173095703125, 0.03284454345703125, 0.03607177734375, 0.03929901123046875, 0.0425262451171875, 0.04575347900390625, 0.048980712890625, 0.05220794677734375, 0.0554351806640625, 0.05866241455078125, 0.0618896484375, 0.06511688232421875, 0.0683441162109375, 0.07157135009765625, 0.074798583984375, 0.07802581787109375, 0.0812530517578125, 0.08448028564453125, 0.08770751953125, 0.09093475341796875, 0.0941619873046875, 0.09738922119140625, 0.100616455078125, 0.10384368896484375, 0.1070709228515625, 0.11029815673828125, 0.113525390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 13.0, 11.0, 12.0, 12.0, 33.0, 48.0, 88.0, 167.0, 364.0, 701.0, 1628.0, 3744.0, 9794.0, 26427.0, 73270.0, 175984.0, 292561.0, 256598.0, 128024.0, 49480.0, 17903.0, 6741.0, 2708.0, 1135.0, 514.0, 287.0, 103.0, 73.0, 47.0, 25.0, 14.0, 15.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0367431640625, -0.03562307357788086, -0.03450298309326172, -0.03338289260864258, -0.03226280212402344, -0.031142711639404297, -0.030022621154785156, -0.028902530670166016, -0.027782440185546875, -0.026662349700927734, -0.025542259216308594, -0.024422168731689453, -0.023302078247070312, -0.022181987762451172, -0.02106189727783203, -0.01994180679321289, -0.01882171630859375, -0.01770162582397461, -0.01658153533935547, -0.015461444854736328, -0.014341354370117188, -0.013221263885498047, -0.012101173400878906, -0.010981082916259766, -0.009860992431640625, -0.008740901947021484, -0.007620811462402344, -0.006500720977783203, -0.0053806304931640625, -0.004260540008544922, -0.0031404495239257812, -0.0020203590393066406, -0.0009002685546875, 0.00021982192993164062, 0.0013399124145507812, 0.002460002899169922, 0.0035800933837890625, 0.004700183868408203, 0.005820274353027344, 0.006940364837646484, 0.008060455322265625, 0.009180545806884766, 0.010300636291503906, 0.011420726776123047, 0.012540817260742188, 0.013660907745361328, 0.014780998229980469, 0.01590108871459961, 0.01702117919921875, 0.01814126968383789, 0.01926136016845703, 0.020381450653076172, 0.021501541137695312, 0.022621631622314453, 0.023741722106933594, 0.024861812591552734, 0.025981903076171875, 0.027101993560791016, 0.028222084045410156, 0.029342174530029297, 0.030462265014648438, 0.03158235549926758, 0.03270244598388672, 0.03382253646850586, 0.034942626953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 13.0, 15.0, 7.0, 21.0, 13.0, 26.0, 24.0, 41.0, 44.0, 41.0, 49.0, 78.0, 70.0, 51.0, 79.0, 63.0, 70.0, 67.0, 41.0, 35.0, 28.0, 20.0, 19.0, 15.0, 13.0, 12.0, 9.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2516044080257416e-05, -1.2038275599479675e-05, -1.1560507118701935e-05, -1.1082738637924194e-05, -1.0604970157146454e-05, -1.0127201676368713e-05, -9.649433195590973e-06, -9.171664714813232e-06, -8.693896234035492e-06, -8.216127753257751e-06, -7.738359272480011e-06, -7.2605907917022705e-06, -6.78282231092453e-06, -6.3050538301467896e-06, -5.827285349369049e-06, -5.349516868591309e-06, -4.871748387813568e-06, -4.393979907035828e-06, -3.916211426258087e-06, -3.4384429454803467e-06, -2.960674464702606e-06, -2.4829059839248657e-06, -2.0051375031471252e-06, -1.5273690223693848e-06, -1.0496005415916443e-06, -5.718320608139038e-07, -9.406358003616333e-08, 3.8370490074157715e-07, 8.614733815193176e-07, 1.339241862297058e-06, 1.8170103430747986e-06, 2.294778823852539e-06, 2.7725473046302795e-06, 3.25031578540802e-06, 3.7280842661857605e-06, 4.205852746963501e-06, 4.6836212277412415e-06, 5.161389708518982e-06, 5.639158189296722e-06, 6.116926670074463e-06, 6.594695150852203e-06, 7.072463631629944e-06, 7.550232112407684e-06, 8.028000593185425e-06, 8.505769073963165e-06, 8.983537554740906e-06, 9.461306035518646e-06, 9.939074516296387e-06, 1.0416842997074127e-05, 1.0894611477851868e-05, 1.1372379958629608e-05, 1.1850148439407349e-05, 1.2327916920185089e-05, 1.280568540096283e-05, 1.328345388174057e-05, 1.376122236251831e-05, 1.4238990843296051e-05, 1.4716759324073792e-05, 1.5194527804851532e-05, 1.5672296285629272e-05, 1.6150064766407013e-05, 1.6627833247184753e-05, 1.7105601727962494e-05, 1.7583370208740234e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 13.0, 9.0, 13.0, 20.0, 30.0, 43.0, 70.0, 114.0, 176.0, 262.0, 406.0, 681.0, 1053.0, 1827.0, 3290.0, 5963.0, 11599.0, 22411.0, 44183.0, 82797.0, 139197.0, 190363.0, 196509.0, 150277.0, 92496.0, 50177.0, 25739.0, 13194.0, 6744.0, 3669.0, 2034.0, 1241.0, 715.0, 430.0, 276.0, 169.0, 129.0, 76.0, 46.0, 31.0, 27.0, 18.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0212860107421875, -0.020601511001586914, -0.019917011260986328, -0.019232511520385742, -0.018548011779785156, -0.01786351203918457, -0.017179012298583984, -0.0164945125579834, -0.015810012817382812, -0.015125513076782227, -0.01444101333618164, -0.013756513595581055, -0.013072013854980469, -0.012387514114379883, -0.011703014373779297, -0.011018514633178711, -0.010334014892578125, -0.009649515151977539, -0.008965015411376953, -0.008280515670776367, -0.007596015930175781, -0.006911516189575195, -0.006227016448974609, -0.0055425167083740234, -0.0048580169677734375, -0.0041735172271728516, -0.0034890174865722656, -0.0028045177459716797, -0.0021200180053710938, -0.0014355182647705078, -0.0007510185241699219, -6.651878356933594e-05, 0.00061798095703125, 0.001302480697631836, 0.001986980438232422, 0.002671480178833008, 0.0033559799194335938, 0.00404047966003418, 0.004724979400634766, 0.0054094791412353516, 0.0060939788818359375, 0.0067784786224365234, 0.007462978363037109, 0.008147478103637695, 0.008831977844238281, 0.009516477584838867, 0.010200977325439453, 0.010885477066040039, 0.011569976806640625, 0.012254476547241211, 0.012938976287841797, 0.013623476028442383, 0.014307975769042969, 0.014992475509643555, 0.01567697525024414, 0.016361474990844727, 0.017045974731445312, 0.0177304744720459, 0.018414974212646484, 0.01909947395324707, 0.019783973693847656, 0.020468473434448242, 0.021152973175048828, 0.021837472915649414, 0.02252197265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 12.0, 10.0, 6.0, 16.0, 15.0, 24.0, 18.0, 34.0, 34.0, 39.0, 41.0, 48.0, 62.0, 49.0, 60.0, 60.0, 53.0, 68.0, 58.0, 52.0, 54.0, 42.0, 19.0, 20.0, 23.0, 19.0, 11.0, 13.0, 6.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.025054931640625, -0.024324893951416016, -0.02359485626220703, -0.022864818572998047, -0.022134780883789062, -0.021404743194580078, -0.020674705505371094, -0.01994466781616211, -0.019214630126953125, -0.01848459243774414, -0.017754554748535156, -0.017024517059326172, -0.016294479370117188, -0.015564441680908203, -0.014834403991699219, -0.014104366302490234, -0.01337432861328125, -0.012644290924072266, -0.011914253234863281, -0.011184215545654297, -0.010454177856445312, -0.009724140167236328, -0.008994102478027344, -0.00826406478881836, -0.007534027099609375, -0.006803989410400391, -0.006073951721191406, -0.005343914031982422, -0.0046138763427734375, -0.003883838653564453, -0.0031538009643554688, -0.0024237632751464844, -0.0016937255859375, -0.0009636878967285156, -0.00023365020751953125, 0.0004963874816894531, 0.0012264251708984375, 0.001956462860107422, 0.0026865005493164062, 0.0034165382385253906, 0.004146575927734375, 0.004876613616943359, 0.005606651306152344, 0.006336688995361328, 0.0070667266845703125, 0.007796764373779297, 0.008526802062988281, 0.009256839752197266, 0.00998687744140625, 0.010716915130615234, 0.011446952819824219, 0.012176990509033203, 0.012907028198242188, 0.013637065887451172, 0.014367103576660156, 0.01509714126586914, 0.015827178955078125, 0.01655721664428711, 0.017287254333496094, 0.018017292022705078, 0.018747329711914062, 0.019477367401123047, 0.02020740509033203, 0.020937442779541016, 0.02166748046875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 1.0, 12.0, 11.0, 17.0, 20.0, 27.0, 35.0, 53.0, 51.0, 62.0, 53.0, 87.0, 69.0, 89.0, 89.0, 70.0, 46.0, 53.0, 44.0, 29.0, 19.0, 16.0, 7.0, 12.0, 5.0, 4.0, 8.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.3592032790184021, -0.34932658076286316, -0.3394498825073242, -0.3295731842517853, -0.31969648599624634, -0.309819757938385, -0.29994305968284607, -0.29006636142730713, -0.2801896631717682, -0.27031296491622925, -0.2604362666606903, -0.25055956840515137, -0.24068285524845123, -0.2308061569929123, -0.22092944383621216, -0.21105274558067322, -0.20117604732513428, -0.19129934906959534, -0.1814226508140564, -0.17154593765735626, -0.16166923940181732, -0.15179254114627838, -0.14191582798957825, -0.1320391297340393, -0.12216243147850037, -0.11228573322296143, -0.10240902751684189, -0.09253232181072235, -0.08265562355518341, -0.07277892529964447, -0.06290221959352493, -0.053025513887405396, -0.043148815631866455, -0.033272113651037216, -0.023395411670207977, -0.013518709689378738, -0.0036420077085494995, 0.006234694272279739, 0.01611139625310898, 0.025988101959228516, 0.035864800214767456, 0.045741502195596695, 0.055618204176425934, 0.06549490988254547, 0.07537160813808441, 0.08524830639362335, 0.09512501209974289, 0.10500171780586243, 0.11487841606140137, 0.12475511431694031, 0.13463181257247925, 0.14450852572917938, 0.15438522398471832, 0.16426192224025726, 0.1741386353969574, 0.18401533365249634, 0.19389203190803528, 0.20376873016357422, 0.21364542841911316, 0.2235221415758133, 0.23339883983135223, 0.24327553808689117, 0.2531522512435913, 0.26302894949913025, 0.2729056477546692]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 5.0, 7.0, 7.0, 15.0, 7.0, 17.0, 18.0, 25.0, 25.0, 34.0, 31.0, 41.0, 49.0, 47.0, 52.0, 58.0, 44.0, 44.0, 47.0, 48.0, 40.0, 37.0, 39.0, 37.0, 33.0, 30.0, 38.0, 31.0, 15.0, 18.0, 15.0, 13.0, 6.0, 7.0, 3.0, 4.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.48973506689071655, -0.4769791066646576, -0.46422314643859863, -0.45146721601486206, -0.4387112557888031, -0.42595529556274414, -0.4131993353366852, -0.4004433751106262, -0.38768741488456726, -0.3749314546585083, -0.36217549443244934, -0.3494195342063904, -0.3366636037826538, -0.32390764355659485, -0.3111516833305359, -0.29839572310447693, -0.28563976287841797, -0.272883802652359, -0.26012784242630005, -0.24737189710140228, -0.23461593687534332, -0.22185999155044556, -0.2091040313243866, -0.19634807109832764, -0.18359214067459106, -0.1708361804485321, -0.15808023512363434, -0.14532427489757538, -0.13256831467151642, -0.11981236189603806, -0.10705640912055969, -0.09430044889450073, -0.08154448866844177, -0.06878853589296341, -0.05603257566690445, -0.043276622891426086, -0.030520666390657425, -0.017764709889888763, -0.0050087571144104, 0.00774720311164856, 0.020503155887126923, 0.033259112387895584, 0.046015068888664246, 0.05877102166414261, 0.07152697443962097, 0.08428293466567993, 0.0970388874411583, 0.10979484766721725, 0.12255080044269562, 0.13530676066875458, 0.14806270599365234, 0.1608186662197113, 0.17357462644577026, 0.18633058667182922, 0.199086531996727, 0.21184249222278595, 0.22459843754768372, 0.23735439777374268, 0.25011035799980164, 0.2628663182258606, 0.27562224864959717, 0.28837820887565613, 0.3011341691017151, 0.31389012932777405, 0.326646089553833]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 6.0, 14.0, 15.0, 31.0, 37.0, 53.0, 83.0, 128.0, 188.0, 276.0, 514.0, 960.0, 1772.0, 3899.0, 9252.0, 24171.0, 78097.0, 380090.0, 2038189.0, 1351715.0, 221064.0, 54606.0, 17504.0, 6471.0, 2632.0, 1278.0, 538.0, 293.0, 169.0, 93.0, 49.0, 34.0, 17.0, 15.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10357284545898438, -0.10076141357421875, -0.09794998168945312, -0.0951385498046875, -0.09232711791992188, -0.08951568603515625, -0.08670425415039062, -0.083892822265625, -0.08108139038085938, -0.07826995849609375, -0.07545852661132812, -0.0726470947265625, -0.06983566284179688, -0.06702423095703125, -0.06421279907226562, -0.0614013671875, -0.058589935302734375, -0.05577850341796875, -0.052967071533203125, -0.0501556396484375, -0.047344207763671875, -0.04453277587890625, -0.041721343994140625, -0.038909912109375, -0.036098480224609375, -0.03328704833984375, -0.030475616455078125, -0.0276641845703125, -0.024852752685546875, -0.02204132080078125, -0.019229888916015625, -0.01641845703125, -0.013607025146484375, -0.01079559326171875, -0.007984161376953125, -0.0051727294921875, -0.002361297607421875, 0.00045013427734375, 0.003261566162109375, 0.006072998046875, 0.008884429931640625, 0.01169586181640625, 0.014507293701171875, 0.0173187255859375, 0.020130157470703125, 0.02294158935546875, 0.025753021240234375, 0.028564453125, 0.031375885009765625, 0.03418731689453125, 0.036998748779296875, 0.0398101806640625, 0.042621612548828125, 0.04543304443359375, 0.048244476318359375, 0.051055908203125, 0.053867340087890625, 0.05667877197265625, 0.059490203857421875, 0.0623016357421875, 0.06511306762695312, 0.06792449951171875, 0.07073593139648438, 0.07354736328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 8.0, 12.0, 16.0, 31.0, 32.0, 34.0, 38.0, 39.0, 58.0, 55.0, 45.0, 59.0, 70.0, 56.0, 53.0, 65.0, 52.0, 51.0, 39.0, 36.0, 33.0, 25.0, 21.0, 10.0, 16.0, 9.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07588720321655273, -0.07401561737060547, -0.0721440315246582, -0.07027244567871094, -0.06840085983276367, -0.0665292739868164, -0.06465768814086914, -0.06278610229492188, -0.06091451644897461, -0.059042930603027344, -0.05717134475708008, -0.05529975891113281, -0.05342817306518555, -0.05155658721923828, -0.049685001373291016, -0.04781341552734375, -0.045941829681396484, -0.04407024383544922, -0.04219865798950195, -0.04032707214355469, -0.03845548629760742, -0.036583900451660156, -0.03471231460571289, -0.032840728759765625, -0.03096914291381836, -0.029097557067871094, -0.027225971221923828, -0.025354385375976562, -0.023482799530029297, -0.02161121368408203, -0.019739627838134766, -0.0178680419921875, -0.015996456146240234, -0.014124870300292969, -0.012253284454345703, -0.010381698608398438, -0.008510112762451172, -0.006638526916503906, -0.004766941070556641, -0.002895355224609375, -0.0010237693786621094, 0.0008478164672851562, 0.002719402313232422, 0.0045909881591796875, 0.006462574005126953, 0.008334159851074219, 0.010205745697021484, 0.01207733154296875, 0.013948917388916016, 0.01582050323486328, 0.017692089080810547, 0.019563674926757812, 0.021435260772705078, 0.023306846618652344, 0.02517843246459961, 0.027050018310546875, 0.02892160415649414, 0.030793190002441406, 0.03266477584838867, 0.03453636169433594, 0.0364079475402832, 0.03827953338623047, 0.040151119232177734, 0.042022705078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 15.0, 36.0, 25.0, 71.0, 119.0, 207.0, 523.0, 1255.0, 3726.0, 12316.0, 49429.0, 221141.0, 1166775.0, 2135224.0, 470811.0, 99180.0, 23409.0, 6441.0, 2092.0, 771.0, 341.0, 158.0, 72.0, 39.0, 24.0, 26.0, 17.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08758544921875, -0.08436965942382812, -0.08115386962890625, -0.07793807983398438, -0.0747222900390625, -0.07150650024414062, -0.06829071044921875, -0.06507492065429688, -0.061859130859375, -0.058643341064453125, -0.05542755126953125, -0.052211761474609375, -0.0489959716796875, -0.045780181884765625, -0.04256439208984375, -0.039348602294921875, -0.0361328125, -0.032917022705078125, -0.02970123291015625, -0.026485443115234375, -0.0232696533203125, -0.020053863525390625, -0.01683807373046875, -0.013622283935546875, -0.010406494140625, -0.007190704345703125, -0.00397491455078125, -0.000759124755859375, 0.0024566650390625, 0.005672454833984375, 0.00888824462890625, 0.012104034423828125, 0.01531982421875, 0.018535614013671875, 0.02175140380859375, 0.024967193603515625, 0.0281829833984375, 0.031398773193359375, 0.03461456298828125, 0.037830352783203125, 0.041046142578125, 0.044261932373046875, 0.04747772216796875, 0.050693511962890625, 0.0539093017578125, 0.057125091552734375, 0.06034088134765625, 0.06355667114257812, 0.0667724609375, 0.06998825073242188, 0.07320404052734375, 0.07641983032226562, 0.0796356201171875, 0.08285140991210938, 0.08606719970703125, 0.08928298950195312, 0.092498779296875, 0.09571456909179688, 0.09893035888671875, 0.10214614868164062, 0.1053619384765625, 0.10857772827148438, 0.11179351806640625, 0.11500930786132812, 0.11822509765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 8.0, 9.0, 10.0, 19.0, 26.0, 27.0, 27.0, 52.0, 55.0, 76.0, 83.0, 129.0, 170.0, 231.0, 285.0, 369.0, 436.0, 465.0, 373.0, 298.0, 230.0, 156.0, 116.0, 105.0, 67.0, 45.0, 54.0, 37.0, 29.0, 25.0, 15.0, 11.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.061878204345703125, -0.05966949462890625, -0.057460784912109375, -0.0552520751953125, -0.053043365478515625, -0.05083465576171875, -0.048625946044921875, -0.046417236328125, -0.044208526611328125, -0.04199981689453125, -0.039791107177734375, -0.0375823974609375, -0.035373687744140625, -0.03316497802734375, -0.030956268310546875, -0.02874755859375, -0.026538848876953125, -0.02433013916015625, -0.022121429443359375, -0.0199127197265625, -0.017704010009765625, -0.01549530029296875, -0.013286590576171875, -0.011077880859375, -0.008869171142578125, -0.00666046142578125, -0.004451751708984375, -0.0022430419921875, -3.4332275390625e-05, 0.00217437744140625, 0.004383087158203125, 0.006591796875, 0.008800506591796875, 0.01100921630859375, 0.013217926025390625, 0.0154266357421875, 0.017635345458984375, 0.01984405517578125, 0.022052764892578125, 0.024261474609375, 0.026470184326171875, 0.02867889404296875, 0.030887603759765625, 0.0330963134765625, 0.035305023193359375, 0.03751373291015625, 0.039722442626953125, 0.04193115234375, 0.044139862060546875, 0.04634857177734375, 0.048557281494140625, 0.0507659912109375, 0.052974700927734375, 0.05518341064453125, 0.057392120361328125, 0.059600830078125, 0.061809539794921875, 0.06401824951171875, 0.06622695922851562, 0.0684356689453125, 0.07064437866210938, 0.07285308837890625, 0.07506179809570312, 0.0772705078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 9.0, 9.0, 18.0, 21.0, 40.0, 47.0, 56.0, 81.0, 91.0, 89.0, 86.0, 80.0, 92.0, 68.0, 64.0, 43.0, 30.0, 22.0, 19.0, 7.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3573712110519409, -0.34598851203918457, -0.3346058130264282, -0.3232231140136719, -0.3118404150009155, -0.3004577159881592, -0.28907501697540283, -0.27769234776496887, -0.2663096487522125, -0.2549269497394562, -0.24354425072669983, -0.23216155171394348, -0.22077886760234833, -0.20939616858959198, -0.19801346957683563, -0.18663078546524048, -0.17524807155132294, -0.1638653725385666, -0.15248267352581024, -0.1410999894142151, -0.12971729040145874, -0.11833459138870239, -0.10695189237594604, -0.0955692008137703, -0.08418650180101395, -0.0728038027882576, -0.06142111122608185, -0.0500384122133255, -0.03865571692585945, -0.027273021638393402, -0.015890322625637054, -0.004507631063461304, 0.006875067949295044, 0.018257763236761093, 0.02964046038687229, 0.04102315753698349, 0.05240585282444954, 0.06378854811191559, 0.07517124712467194, 0.08655393868684769, 0.09793663769960403, 0.10931933671236038, 0.12070202827453613, 0.13208472728729248, 0.14346742630004883, 0.15485012531280518, 0.16623282432556152, 0.17761550843715668, 0.18899820744991302, 0.20038090646266937, 0.21176360547542572, 0.22314628958702087, 0.23452898859977722, 0.24591168761253357, 0.2572943866252899, 0.26867708563804626, 0.2800597846508026, 0.29144248366355896, 0.3028251826763153, 0.31420788168907166, 0.325590580701828, 0.33697324991226196, 0.3483559489250183, 0.35973864793777466, 0.371121346950531]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 9.0, 10.0, 10.0, 15.0, 7.0, 17.0, 27.0, 26.0, 22.0, 42.0, 39.0, 34.0, 30.0, 46.0, 32.0, 47.0, 44.0, 50.0, 44.0, 44.0, 44.0, 48.0, 40.0, 39.0, 36.0, 29.0, 21.0, 18.0, 30.0, 12.0, 6.0, 13.0, 11.0, 8.0, 7.0, 5.0, 9.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23004448413848877, -0.22217756509780884, -0.2143106460571289, -0.20644372701644897, -0.19857682287693024, -0.1907099038362503, -0.18284298479557037, -0.17497606575489044, -0.1671091616153717, -0.15924224257469177, -0.15137532353401184, -0.1435084044933319, -0.13564150035381317, -0.12777458131313324, -0.11990766227245331, -0.11204074323177338, -0.10417382419109344, -0.09630690515041351, -0.08843999356031418, -0.08057307451963425, -0.07270616292953491, -0.06483924388885498, -0.05697232484817505, -0.049105409532785416, -0.04123849421739578, -0.03337157890200615, -0.025504661723971367, -0.017637744545936584, -0.009770829230546951, -0.0019039139151573181, 0.0059630051255226135, 0.013829920440912247, 0.02169683575630188, 0.029563751071691513, 0.037430666387081146, 0.04529758542776108, 0.05316450074315071, 0.061031416058540344, 0.06889833509922028, 0.07676525413990021, 0.08463216572999954, 0.09249908477067947, 0.10036599636077881, 0.10823291540145874, 0.11609983444213867, 0.123966746032238, 0.13183367252349854, 0.13970057666301727, 0.1475674957036972, 0.15543441474437714, 0.16330133378505707, 0.1711682379245758, 0.17903515696525574, 0.18690207600593567, 0.1947689950466156, 0.20263591408729553, 0.21050283312797546, 0.2183697521686554, 0.22623667120933533, 0.23410359025001526, 0.241970494389534, 0.24983741343021393, 0.25770431756973267, 0.2655712366104126, 0.27343815565109253]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 9.0, 16.0, 22.0, 41.0, 53.0, 96.0, 175.0, 315.0, 550.0, 1054.0, 2071.0, 4103.0, 8639.0, 18656.0, 40725.0, 87881.0, 171083.0, 248017.0, 220154.0, 128935.0, 62248.0, 28197.0, 13013.0, 6138.0, 2965.0, 1494.0, 800.0, 438.0, 219.0, 155.0, 89.0, 52.0, 35.0, 32.0, 23.0, 10.0, 13.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16209030151367188, -0.15779876708984375, -0.15350723266601562, -0.1492156982421875, -0.14492416381835938, -0.14063262939453125, -0.13634109497070312, -0.132049560546875, -0.12775802612304688, -0.12346649169921875, -0.11917495727539062, -0.1148834228515625, -0.11059188842773438, -0.10630035400390625, -0.10200881958007812, -0.09771728515625, -0.09342575073242188, -0.08913421630859375, -0.08484268188476562, -0.0805511474609375, -0.07625961303710938, -0.07196807861328125, -0.06767654418945312, -0.063385009765625, -0.059093475341796875, -0.05480194091796875, -0.050510406494140625, -0.0462188720703125, -0.041927337646484375, -0.03763580322265625, -0.033344268798828125, -0.029052734375, -0.024761199951171875, -0.02046966552734375, -0.016178131103515625, -0.0118865966796875, -0.007595062255859375, -0.00330352783203125, 0.000988006591796875, 0.005279541015625, 0.009571075439453125, 0.01386260986328125, 0.018154144287109375, 0.0224456787109375, 0.026737213134765625, 0.03102874755859375, 0.035320281982421875, 0.03961181640625, 0.043903350830078125, 0.04819488525390625, 0.052486419677734375, 0.0567779541015625, 0.061069488525390625, 0.06536102294921875, 0.06965255737304688, 0.073944091796875, 0.07823562622070312, 0.08252716064453125, 0.08681869506835938, 0.0911102294921875, 0.09540176391601562, 0.09969329833984375, 0.10398483276367188, 0.1082763671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 10.0, 14.0, 21.0, 25.0, 26.0, 34.0, 34.0, 41.0, 40.0, 53.0, 47.0, 52.0, 57.0, 60.0, 56.0, 66.0, 55.0, 46.0, 38.0, 43.0, 23.0, 32.0, 23.0, 19.0, 19.0, 14.0, 15.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.069580078125, -0.06796503067016602, -0.06634998321533203, -0.06473493576049805, -0.06311988830566406, -0.06150484085083008, -0.059889793395996094, -0.05827474594116211, -0.056659698486328125, -0.05504465103149414, -0.053429603576660156, -0.05181455612182617, -0.05019950866699219, -0.0485844612121582, -0.04696941375732422, -0.045354366302490234, -0.04373931884765625, -0.042124271392822266, -0.04050922393798828, -0.0388941764831543, -0.03727912902832031, -0.03566408157348633, -0.034049034118652344, -0.03243398666381836, -0.030818939208984375, -0.02920389175415039, -0.027588844299316406, -0.025973796844482422, -0.024358749389648438, -0.022743701934814453, -0.02112865447998047, -0.019513607025146484, -0.0178985595703125, -0.016283512115478516, -0.014668464660644531, -0.013053417205810547, -0.011438369750976562, -0.009823322296142578, -0.008208274841308594, -0.006593227386474609, -0.004978179931640625, -0.0033631324768066406, -0.0017480850219726562, -0.00013303756713867188, 0.0014820098876953125, 0.003097057342529297, 0.004712104797363281, 0.006327152252197266, 0.00794219970703125, 0.009557247161865234, 0.011172294616699219, 0.012787342071533203, 0.014402389526367188, 0.016017436981201172, 0.017632484436035156, 0.01924753189086914, 0.020862579345703125, 0.02247762680053711, 0.024092674255371094, 0.025707721710205078, 0.027322769165039062, 0.028937816619873047, 0.03055286407470703, 0.032167911529541016, 0.033782958984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 10.0, 33.0, 49.0, 75.0, 136.0, 235.0, 437.0, 1027.0, 2274.0, 5717.0, 15147.0, 44007.0, 121438.0, 260107.0, 308848.0, 179642.0, 70146.0, 24301.0, 8633.0, 3353.0, 1462.0, 690.0, 349.0, 172.0, 103.0, 55.0, 30.0, 20.0, 13.0, 11.0, 4.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.1420612335205078, -0.13702774047851562, -0.13199424743652344, -0.12696075439453125, -0.12192726135253906, -0.11689376831054688, -0.11186027526855469, -0.1068267822265625, -0.10179328918457031, -0.09675979614257812, -0.09172630310058594, -0.08669281005859375, -0.08165931701660156, -0.07662582397460938, -0.07159233093261719, -0.066558837890625, -0.06152534484863281, -0.056491851806640625, -0.05145835876464844, -0.04642486572265625, -0.04139137268066406, -0.036357879638671875, -0.03132438659667969, -0.0262908935546875, -0.021257400512695312, -0.016223907470703125, -0.011190414428710938, -0.00615692138671875, -0.0011234283447265625, 0.003910064697265625, 0.008943557739257812, 0.01397705078125, 0.019010543823242188, 0.024044036865234375, 0.029077529907226562, 0.03411102294921875, 0.03914451599121094, 0.044178009033203125, 0.04921150207519531, 0.0542449951171875, 0.05927848815917969, 0.06431198120117188, 0.06934547424316406, 0.07437896728515625, 0.07941246032714844, 0.08444595336914062, 0.08947944641113281, 0.094512939453125, 0.09954643249511719, 0.10457992553710938, 0.10961341857910156, 0.11464691162109375, 0.11968040466308594, 0.12471389770507812, 0.1297473907470703, 0.1347808837890625, 0.1398143768310547, 0.14484786987304688, 0.14988136291503906, 0.15491485595703125, 0.15994834899902344, 0.16498184204101562, 0.1700153350830078, 0.175048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 8.0, 8.0, 9.0, 15.0, 22.0, 22.0, 18.0, 22.0, 27.0, 27.0, 32.0, 36.0, 42.0, 37.0, 65.0, 42.0, 45.0, 52.0, 50.0, 44.0, 42.0, 38.0, 43.0, 30.0, 37.0, 28.0, 25.0, 13.0, 23.0, 16.0, 15.0, 10.0, 10.0, 6.0, 8.0, 5.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1190185546875, -0.11521244049072266, -0.11140632629394531, -0.10760021209716797, -0.10379409790039062, -0.09998798370361328, -0.09618186950683594, -0.0923757553100586, -0.08856964111328125, -0.0847635269165039, -0.08095741271972656, -0.07715129852294922, -0.07334518432617188, -0.06953907012939453, -0.06573295593261719, -0.061926841735839844, -0.0581207275390625, -0.054314613342285156, -0.05050849914550781, -0.04670238494873047, -0.042896270751953125, -0.03909015655517578, -0.03528404235839844, -0.031477928161621094, -0.02767181396484375, -0.023865699768066406, -0.020059585571289062, -0.01625347137451172, -0.012447357177734375, -0.008641242980957031, -0.0048351287841796875, -0.0010290145874023438, 0.002777099609375, 0.006583213806152344, 0.010389328002929688, 0.014195442199707031, 0.018001556396484375, 0.02180767059326172, 0.025613784790039062, 0.029419898986816406, 0.03322601318359375, 0.037032127380371094, 0.04083824157714844, 0.04464435577392578, 0.048450469970703125, 0.05225658416748047, 0.05606269836425781, 0.059868812561035156, 0.0636749267578125, 0.06748104095458984, 0.07128715515136719, 0.07509326934814453, 0.07889938354492188, 0.08270549774169922, 0.08651161193847656, 0.0903177261352539, 0.09412384033203125, 0.0979299545288086, 0.10173606872558594, 0.10554218292236328, 0.10934829711914062, 0.11315441131591797, 0.11696052551269531, 0.12076663970947266, 0.12457275390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 14.0, 19.0, 21.0, 47.0, 80.0, 87.0, 148.0, 195.0, 277.0, 386.0, 625.0, 947.0, 1426.0, 2278.0, 3899.0, 7362.0, 15549.0, 37087.0, 97397.0, 236679.0, 323498.0, 190373.0, 74011.0, 28584.0, 12223.0, 6069.0, 3339.0, 1988.0, 1315.0, 800.0, 574.0, 388.0, 282.0, 179.0, 122.0, 108.0, 55.0, 35.0, 24.0, 11.0, 10.0, 8.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04742431640625, -0.04586219787597656, -0.044300079345703125, -0.04273796081542969, -0.04117584228515625, -0.03961372375488281, -0.038051605224609375, -0.03648948669433594, -0.0349273681640625, -0.03336524963378906, -0.031803131103515625, -0.030241012573242188, -0.02867889404296875, -0.027116775512695312, -0.025554656982421875, -0.023992538452148438, -0.022430419921875, -0.020868301391601562, -0.019306182861328125, -0.017744064331054688, -0.01618194580078125, -0.014619827270507812, -0.013057708740234375, -0.011495590209960938, -0.0099334716796875, -0.008371353149414062, -0.006809234619140625, -0.0052471160888671875, -0.00368499755859375, -0.0021228790283203125, -0.000560760498046875, 0.0010013580322265625, 0.0025634765625, 0.0041255950927734375, 0.005687713623046875, 0.0072498321533203125, 0.00881195068359375, 0.010374069213867188, 0.011936187744140625, 0.013498306274414062, 0.0150604248046875, 0.016622543334960938, 0.018184661865234375, 0.019746780395507812, 0.02130889892578125, 0.022871017456054688, 0.024433135986328125, 0.025995254516601562, 0.027557373046875, 0.029119491577148438, 0.030681610107421875, 0.03224372863769531, 0.03380584716796875, 0.03536796569824219, 0.036930084228515625, 0.03849220275878906, 0.0400543212890625, 0.04161643981933594, 0.043178558349609375, 0.04474067687988281, 0.04630279541015625, 0.04786491394042969, 0.049427032470703125, 0.05098915100097656, 0.05255126953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 15.0, 10.0, 11.0, 15.0, 11.0, 20.0, 21.0, 24.0, 40.0, 29.0, 44.0, 54.0, 47.0, 62.0, 62.0, 81.0, 54.0, 55.0, 48.0, 38.0, 36.0, 42.0, 29.0, 30.0, 25.0, 15.0, 17.0, 12.0, 9.0, 14.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8606893718242645e-05, -1.80806964635849e-05, -1.7554499208927155e-05, -1.702830195426941e-05, -1.6502104699611664e-05, -1.597590744495392e-05, -1.5449710190296173e-05, -1.4923512935638428e-05, -1.4397315680980682e-05, -1.3871118426322937e-05, -1.3344921171665192e-05, -1.2818723917007446e-05, -1.2292526662349701e-05, -1.1766329407691956e-05, -1.124013215303421e-05, -1.0713934898376465e-05, -1.018773764371872e-05, -9.661540389060974e-06, -9.135343134403229e-06, -8.609145879745483e-06, -8.082948625087738e-06, -7.556751370429993e-06, -7.030554115772247e-06, -6.504356861114502e-06, -5.978159606456757e-06, -5.451962351799011e-06, -4.925765097141266e-06, -4.3995678424835205e-06, -3.873370587825775e-06, -3.3471733331680298e-06, -2.8209760785102844e-06, -2.294778823852539e-06, -1.7685815691947937e-06, -1.2423843145370483e-06, -7.16187059879303e-07, -1.8998980522155762e-07, 3.3620744943618774e-07, 8.624047040939331e-07, 1.3886019587516785e-06, 1.914799213409424e-06, 2.440996468067169e-06, 2.9671937227249146e-06, 3.49339097738266e-06, 4.019588232040405e-06, 4.545785486698151e-06, 5.071982741355896e-06, 5.598179996013641e-06, 6.124377250671387e-06, 6.650574505329132e-06, 7.1767717599868774e-06, 7.702969014644623e-06, 8.229166269302368e-06, 8.755363523960114e-06, 9.281560778617859e-06, 9.807758033275604e-06, 1.033395528793335e-05, 1.0860152542591095e-05, 1.138634979724884e-05, 1.1912547051906586e-05, 1.2438744306564331e-05, 1.2964941561222076e-05, 1.3491138815879822e-05, 1.4017336070537567e-05, 1.4543533325195312e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 18.0, 20.0, 38.0, 63.0, 86.0, 154.0, 180.0, 285.0, 445.0, 740.0, 1227.0, 2115.0, 4096.0, 8913.0, 24292.0, 87740.0, 308439.0, 404254.0, 142665.0, 38204.0, 12645.0, 5263.0, 2638.0, 1516.0, 927.0, 543.0, 363.0, 254.0, 130.0, 104.0, 65.0, 38.0, 26.0, 17.0, 9.0, 9.0, 3.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 4.0], "bins": [-0.07171630859375, -0.06978750228881836, -0.06785869598388672, -0.06592988967895508, -0.06400108337402344, -0.0620722770690918, -0.060143470764160156, -0.058214664459228516, -0.056285858154296875, -0.054357051849365234, -0.052428245544433594, -0.05049943923950195, -0.04857063293457031, -0.04664182662963867, -0.04471302032470703, -0.04278421401977539, -0.04085540771484375, -0.03892660140991211, -0.03699779510498047, -0.03506898880004883, -0.03314018249511719, -0.031211376190185547, -0.029282569885253906, -0.027353763580322266, -0.025424957275390625, -0.023496150970458984, -0.021567344665527344, -0.019638538360595703, -0.017709732055664062, -0.015780925750732422, -0.013852119445800781, -0.01192331314086914, -0.0099945068359375, -0.00806570053100586, -0.006136894226074219, -0.004208087921142578, -0.0022792816162109375, -0.0003504753112792969, 0.0015783309936523438, 0.0035071372985839844, 0.005435943603515625, 0.007364749908447266, 0.009293556213378906, 0.011222362518310547, 0.013151168823242188, 0.015079975128173828, 0.01700878143310547, 0.01893758773803711, 0.02086639404296875, 0.02279520034790039, 0.02472400665283203, 0.026652812957763672, 0.028581619262695312, 0.030510425567626953, 0.032439231872558594, 0.034368038177490234, 0.036296844482421875, 0.038225650787353516, 0.040154457092285156, 0.0420832633972168, 0.04401206970214844, 0.04594087600708008, 0.04786968231201172, 0.04979848861694336, 0.051727294921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 8.0, 15.0, 30.0, 23.0, 50.0, 59.0, 77.0, 70.0, 91.0, 112.0, 87.0, 79.0, 71.0, 58.0, 41.0, 30.0, 18.0, 22.0, 9.0, 11.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0552978515625, -0.05389213562011719, -0.052486419677734375, -0.05108070373535156, -0.04967498779296875, -0.04826927185058594, -0.046863555908203125, -0.04545783996582031, -0.0440521240234375, -0.04264640808105469, -0.041240692138671875, -0.03983497619628906, -0.03842926025390625, -0.03702354431152344, -0.035617828369140625, -0.03421211242675781, -0.032806396484375, -0.03140068054199219, -0.029994964599609375, -0.028589248657226562, -0.02718353271484375, -0.025777816772460938, -0.024372100830078125, -0.022966384887695312, -0.0215606689453125, -0.020154953002929688, -0.018749237060546875, -0.017343521118164062, -0.01593780517578125, -0.014532089233398438, -0.013126373291015625, -0.011720657348632812, -0.01031494140625, -0.008909225463867188, -0.007503509521484375, -0.0060977935791015625, -0.00469207763671875, -0.0032863616943359375, -0.001880645751953125, -0.0004749298095703125, 0.0009307861328125, 0.0023365020751953125, 0.003742218017578125, 0.0051479339599609375, 0.00655364990234375, 0.007959365844726562, 0.009365081787109375, 0.010770797729492188, 0.012176513671875, 0.013582229614257812, 0.014987945556640625, 0.016393661499023438, 0.01779937744140625, 0.019205093383789062, 0.020610809326171875, 0.022016525268554688, 0.0234222412109375, 0.024827957153320312, 0.026233673095703125, 0.027639389038085938, 0.02904510498046875, 0.030450820922851562, 0.031856536865234375, 0.03326225280761719, 0.03466796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 11.0, 8.0, 14.0, 16.0, 27.0, 36.0, 55.0, 30.0, 56.0, 72.0, 83.0, 68.0, 73.0, 76.0, 73.0, 62.0, 52.0, 44.0, 25.0, 31.0, 24.0, 16.0, 14.0, 11.0, 3.0, 6.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41785478591918945, -0.4052482843399048, -0.3926417827606201, -0.38003528118133545, -0.3674287497997284, -0.3548222482204437, -0.34221574664115906, -0.3296092450618744, -0.3170027434825897, -0.30439624190330505, -0.2917897403240204, -0.27918320894241333, -0.26657670736312866, -0.253970205783844, -0.24136370420455933, -0.22875720262527466, -0.2161506861448288, -0.20354418456554413, -0.19093766808509827, -0.1783311665058136, -0.16572466492652893, -0.15311816334724426, -0.1405116468667984, -0.12790514528751373, -0.11529863625764847, -0.1026921272277832, -0.09008562564849854, -0.07747911661863327, -0.064872607588768, -0.05226610600948334, -0.03965959697961807, -0.027053095400333405, -0.01444658637046814, -0.0018400801345705986, 0.010766426101326942, 0.023372933268547058, 0.035979438573122025, 0.04858594387769699, 0.061192452907562256, 0.07379895448684692, 0.08640546351671219, 0.09901197254657745, 0.11161847412586212, 0.12422498315572739, 0.13683149218559265, 0.14943799376487732, 0.162044495344162, 0.17465099692344666, 0.18725751340389252, 0.19986401498317719, 0.21247053146362305, 0.22507703304290771, 0.23768353462219238, 0.25029003620147705, 0.2628965377807617, 0.2755030393600464, 0.28810957074165344, 0.3007160723209381, 0.3133225739002228, 0.32592910528182983, 0.3385356068611145, 0.35114210844039917, 0.36374861001968384, 0.3763551115989685, 0.3889616131782532]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 5.0, 4.0, 7.0, 8.0, 12.0, 8.0, 10.0, 14.0, 11.0, 16.0, 13.0, 17.0, 21.0, 25.0, 30.0, 23.0, 25.0, 27.0, 49.0, 40.0, 31.0, 51.0, 39.0, 39.0, 51.0, 41.0, 47.0, 29.0, 32.0, 29.0, 28.0, 42.0, 31.0, 22.0, 19.0, 17.0, 17.0, 12.0, 12.0, 8.0, 7.0, 14.0, 5.0, 4.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3790660500526428, -0.3679039776325226, -0.35674190521240234, -0.3455798029899597, -0.3344177305698395, -0.32325565814971924, -0.312093585729599, -0.30093151330947876, -0.28976941108703613, -0.2786073386669159, -0.26744526624679565, -0.256283164024353, -0.2451210916042328, -0.23395901918411255, -0.2227969467639923, -0.21163485944271088, -0.20047278702259064, -0.1893107146024704, -0.17814862728118896, -0.16698655486106873, -0.1558244675397873, -0.14466239511966705, -0.13350030779838562, -0.12233823537826538, -0.11117615550756454, -0.10001407563686371, -0.08885199576616287, -0.07768991589546204, -0.0665278434753418, -0.05536575987935066, -0.044203683733940125, -0.03304160386323929, -0.021879523992538452, -0.01071744505316019, 0.000444633886218071, 0.011606711894273758, 0.022768791764974594, 0.03393087163567543, 0.04509294778108597, 0.056255027651786804, 0.06741710752248764, 0.07857918739318848, 0.08974126726388931, 0.10090334713459015, 0.11206541955471039, 0.12322750687599182, 0.13438957929611206, 0.1455516517162323, 0.15671373903751373, 0.16787581145763397, 0.1790378987789154, 0.19019997119903564, 0.20136205852031708, 0.21252413094043732, 0.22368621826171875, 0.234848290681839, 0.24601036310195923, 0.25717243552207947, 0.2683345079421997, 0.27949661016464233, 0.2906586825847626, 0.3018207550048828, 0.31298282742500305, 0.3241448998451233, 0.3353070020675659]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 6.0, 8.0, 15.0, 15.0, 13.0, 25.0, 37.0, 48.0, 63.0, 126.0, 159.0, 231.0, 303.0, 474.0, 852.0, 1302.0, 2088.0, 3461.0, 6202.0, 11798.0, 22969.0, 51405.0, 135326.0, 494704.0, 1487201.0, 1326685.0, 427009.0, 127878.0, 48522.0, 21877.0, 10637.0, 5672.0, 3006.0, 1702.0, 954.0, 585.0, 359.0, 201.0, 133.0, 85.0, 43.0, 48.0, 26.0, 13.0, 13.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0758056640625, -0.0738077163696289, -0.07180976867675781, -0.06981182098388672, -0.06781387329101562, -0.06581592559814453, -0.06381797790527344, -0.061820030212402344, -0.05982208251953125, -0.057824134826660156, -0.05582618713378906, -0.05382823944091797, -0.051830291748046875, -0.04983234405517578, -0.04783439636230469, -0.045836448669433594, -0.0438385009765625, -0.041840553283691406, -0.03984260559082031, -0.03784465789794922, -0.035846710205078125, -0.03384876251220703, -0.03185081481933594, -0.029852867126464844, -0.02785491943359375, -0.025856971740722656, -0.023859024047851562, -0.02186107635498047, -0.019863128662109375, -0.01786518096923828, -0.015867233276367188, -0.013869285583496094, -0.011871337890625, -0.009873390197753906, -0.007875442504882812, -0.005877494812011719, -0.003879547119140625, -0.0018815994262695312, 0.0001163482666015625, 0.0021142959594726562, 0.00411224365234375, 0.006110191345214844, 0.008108139038085938, 0.010106086730957031, 0.012104034423828125, 0.014101982116699219, 0.016099929809570312, 0.018097877502441406, 0.0200958251953125, 0.022093772888183594, 0.024091720581054688, 0.02608966827392578, 0.028087615966796875, 0.03008556365966797, 0.03208351135253906, 0.034081459045410156, 0.03607940673828125, 0.038077354431152344, 0.04007530212402344, 0.04207324981689453, 0.044071197509765625, 0.04606914520263672, 0.04806709289550781, 0.050065040588378906, 0.05206298828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 14.0, 17.0, 12.0, 15.0, 17.0, 21.0, 25.0, 25.0, 26.0, 35.0, 32.0, 29.0, 31.0, 40.0, 40.0, 54.0, 45.0, 54.0, 52.0, 37.0, 40.0, 23.0, 32.0, 42.0, 23.0, 38.0, 23.0, 21.0, 20.0, 19.0, 12.0, 15.0, 12.0, 8.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.058074951171875, -0.05652141571044922, -0.05496788024902344, -0.053414344787597656, -0.051860809326171875, -0.050307273864746094, -0.04875373840332031, -0.04720020294189453, -0.04564666748046875, -0.04409313201904297, -0.04253959655761719, -0.040986061096191406, -0.039432525634765625, -0.037878990173339844, -0.03632545471191406, -0.03477191925048828, -0.0332183837890625, -0.03166484832763672, -0.030111312866210938, -0.028557777404785156, -0.027004241943359375, -0.025450706481933594, -0.023897171020507812, -0.02234363555908203, -0.02079010009765625, -0.01923656463623047, -0.017683029174804688, -0.016129493713378906, -0.014575958251953125, -0.013022422790527344, -0.011468887329101562, -0.009915351867675781, -0.00836181640625, -0.006808280944824219, -0.0052547454833984375, -0.0037012100219726562, -0.002147674560546875, -0.0005941390991210938, 0.0009593963623046875, 0.0025129318237304688, 0.00406646728515625, 0.005620002746582031, 0.0071735382080078125, 0.008727073669433594, 0.010280609130859375, 0.011834144592285156, 0.013387680053710938, 0.014941215515136719, 0.0164947509765625, 0.01804828643798828, 0.019601821899414062, 0.021155357360839844, 0.022708892822265625, 0.024262428283691406, 0.025815963745117188, 0.02736949920654297, 0.02892303466796875, 0.03047657012939453, 0.03203010559082031, 0.033583641052246094, 0.035137176513671875, 0.036690711975097656, 0.03824424743652344, 0.03979778289794922, 0.041351318359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 4.0, 7.0, 8.0, 22.0, 25.0, 17.0, 47.0, 55.0, 72.0, 97.0, 184.0, 313.0, 621.0, 1299.0, 2971.0, 7562.0, 20263.0, 63590.0, 230728.0, 1033791.0, 2087927.0, 547336.0, 134859.0, 39303.0, 13637.0, 5124.0, 2240.0, 989.0, 468.0, 219.0, 155.0, 95.0, 56.0, 54.0, 45.0, 18.0, 23.0, 12.0, 12.0, 11.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0953369140625, -0.09229087829589844, -0.08924484252929688, -0.08619880676269531, -0.08315277099609375, -0.08010673522949219, -0.07706069946289062, -0.07401466369628906, -0.0709686279296875, -0.06792259216308594, -0.06487655639648438, -0.06183052062988281, -0.05878448486328125, -0.05573844909667969, -0.052692413330078125, -0.04964637756347656, -0.046600341796875, -0.04355430603027344, -0.040508270263671875, -0.03746223449707031, -0.03441619873046875, -0.03137016296386719, -0.028324127197265625, -0.025278091430664062, -0.0222320556640625, -0.019186019897460938, -0.016139984130859375, -0.013093948364257812, -0.01004791259765625, -0.0070018768310546875, -0.003955841064453125, -0.0009098052978515625, 0.00213623046875, 0.0051822662353515625, 0.008228302001953125, 0.011274337768554688, 0.01432037353515625, 0.017366409301757812, 0.020412445068359375, 0.023458480834960938, 0.0265045166015625, 0.029550552368164062, 0.032596588134765625, 0.03564262390136719, 0.03868865966796875, 0.04173469543457031, 0.044780731201171875, 0.04782676696777344, 0.050872802734375, 0.05391883850097656, 0.056964874267578125, 0.06001091003417969, 0.06305694580078125, 0.06610298156738281, 0.06914901733398438, 0.07219505310058594, 0.0752410888671875, 0.07828712463378906, 0.08133316040039062, 0.08437919616699219, 0.08742523193359375, 0.09047126770019531, 0.09351730346679688, 0.09656333923339844, 0.099609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 14.0, 17.0, 16.0, 26.0, 36.0, 57.0, 63.0, 75.0, 104.0, 110.0, 215.0, 264.0, 403.0, 514.0, 559.0, 417.0, 294.0, 208.0, 162.0, 124.0, 85.0, 73.0, 51.0, 38.0, 16.0, 28.0, 21.0, 19.0, 12.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.06166648864746094, -0.059001922607421875, -0.05633735656738281, -0.05367279052734375, -0.05100822448730469, -0.048343658447265625, -0.04567909240722656, -0.0430145263671875, -0.04034996032714844, -0.037685394287109375, -0.03502082824707031, -0.03235626220703125, -0.029691696166992188, -0.027027130126953125, -0.024362564086914062, -0.021697998046875, -0.019033432006835938, -0.016368865966796875, -0.013704299926757812, -0.01103973388671875, -0.008375167846679688, -0.005710601806640625, -0.0030460357666015625, -0.0003814697265625, 0.0022830963134765625, 0.004947662353515625, 0.0076122283935546875, 0.01027679443359375, 0.012941360473632812, 0.015605926513671875, 0.018270492553710938, 0.02093505859375, 0.023599624633789062, 0.026264190673828125, 0.028928756713867188, 0.03159332275390625, 0.03425788879394531, 0.036922454833984375, 0.03958702087402344, 0.0422515869140625, 0.04491615295410156, 0.047580718994140625, 0.05024528503417969, 0.05290985107421875, 0.05557441711425781, 0.058238983154296875, 0.06090354919433594, 0.063568115234375, 0.06623268127441406, 0.06889724731445312, 0.07156181335449219, 0.07422637939453125, 0.07689094543457031, 0.07955551147460938, 0.08222007751464844, 0.0848846435546875, 0.08754920959472656, 0.09021377563476562, 0.09287834167480469, 0.09554290771484375, 0.09820747375488281, 0.10087203979492188, 0.10353660583496094, 0.106201171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 16.0, 8.0, 12.0, 17.0, 26.0, 46.0, 36.0, 50.0, 60.0, 70.0, 71.0, 73.0, 75.0, 76.0, 63.0, 60.0, 46.0, 48.0, 40.0, 29.0, 28.0, 10.0, 16.0, 11.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31792187690734863, -0.3059340715408325, -0.2939462661743164, -0.2819584608078003, -0.2699706554412842, -0.25798285007476807, -0.24599504470825195, -0.23400723934173584, -0.22201943397521973, -0.2100316286087036, -0.1980438232421875, -0.1860560178756714, -0.17406821250915527, -0.16208040714263916, -0.15009260177612305, -0.13810479640960693, -0.12611700594425201, -0.1141292005777359, -0.10214139521121979, -0.09015358984470367, -0.07816578447818756, -0.06617797911167145, -0.05419018119573593, -0.04220237582921982, -0.030214570462703705, -0.01822676509618759, -0.0062389615923166275, 0.0057488419115543365, 0.01773664727807045, 0.029724452644586563, 0.04171225428581238, 0.05370005965232849, 0.0656878650188446, 0.07767567038536072, 0.08966347575187683, 0.10165128111839294, 0.11363908648490906, 0.12562689185142517, 0.13761469721794128, 0.1496025025844574, 0.1615903079509735, 0.17357811331748962, 0.18556591868400574, 0.19755372405052185, 0.20954152941703796, 0.22152933478355408, 0.2335171401500702, 0.2455049455165863, 0.25749272108078003, 0.26948052644729614, 0.28146833181381226, 0.29345613718032837, 0.3054439425468445, 0.3174317479133606, 0.3294195532798767, 0.3414073586463928, 0.35339516401290894, 0.36538296937942505, 0.37737077474594116, 0.3893585801124573, 0.4013463854789734, 0.4133341908454895, 0.4253219962120056, 0.43730980157852173, 0.44929760694503784]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 6.0, 13.0, 8.0, 18.0, 10.0, 17.0, 20.0, 29.0, 32.0, 38.0, 35.0, 31.0, 23.0, 34.0, 39.0, 40.0, 37.0, 53.0, 41.0, 35.0, 32.0, 29.0, 34.0, 45.0, 26.0, 29.0, 29.0, 28.0, 24.0, 19.0, 29.0, 15.0, 12.0, 14.0, 14.0, 8.0, 6.0, 5.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.23656213283538818, -0.2287934273481369, -0.22102473676204681, -0.21325603127479553, -0.20548734068870544, -0.19771863520145416, -0.18994992971420288, -0.1821812391281128, -0.1744125485420227, -0.16664384305477142, -0.15887515246868134, -0.15110644698143005, -0.14333775639533997, -0.13556905090808868, -0.1278003454208374, -0.12003165483474731, -0.11226294934749603, -0.10449425131082535, -0.09672555327415466, -0.08895684778690338, -0.0811881572008133, -0.07341945171356201, -0.06565075367689133, -0.05788205564022064, -0.05011335760354996, -0.04234465956687927, -0.03457596153020859, -0.026807259768247604, -0.01903856173157692, -0.011269863694906235, -0.0035011619329452515, 0.004267536103725433, 0.012036234140396118, 0.019804932177066803, 0.027573632076382637, 0.03534233197569847, 0.043111030012369156, 0.05087972804903984, 0.058648429811000824, 0.06641712784767151, 0.0741858258843422, 0.08195452392101288, 0.08972322195768356, 0.09749191999435425, 0.10526062548160553, 0.11302931606769562, 0.1207980215549469, 0.128566712141037, 0.13633541762828827, 0.14410412311553955, 0.15187281370162964, 0.15964151918888092, 0.167410209774971, 0.1751789152622223, 0.18294760584831238, 0.19071631133556366, 0.19848501682281494, 0.20625372231006622, 0.2140224128961563, 0.2217911183834076, 0.22955980896949768, 0.23732851445674896, 0.24509721994400024, 0.25286591053009033, 0.2606346011161804]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 8.0, 17.0, 14.0, 29.0, 36.0, 66.0, 102.0, 127.0, 190.0, 310.0, 497.0, 877.0, 1482.0, 2396.0, 4501.0, 7863.0, 14411.0, 25401.0, 45285.0, 80444.0, 137456.0, 205656.0, 204089.0, 135800.0, 78937.0, 45040.0, 25364.0, 13889.0, 7731.0, 4442.0, 2485.0, 1374.0, 844.0, 521.0, 321.0, 194.0, 116.0, 90.0, 43.0, 29.0, 31.0, 23.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09039306640625, -0.08727455139160156, -0.08415603637695312, -0.08103752136230469, -0.07791900634765625, -0.07480049133300781, -0.07168197631835938, -0.06856346130371094, -0.0654449462890625, -0.06232643127441406, -0.059207916259765625, -0.05608940124511719, -0.05297088623046875, -0.04985237121582031, -0.046733856201171875, -0.04361534118652344, -0.040496826171875, -0.03737831115722656, -0.034259796142578125, -0.031141281127929688, -0.02802276611328125, -0.024904251098632812, -0.021785736083984375, -0.018667221069335938, -0.0155487060546875, -0.012430191040039062, -0.009311676025390625, -0.0061931610107421875, -0.00307464599609375, 4.38690185546875e-05, 0.003162384033203125, 0.0062808990478515625, 0.0093994140625, 0.012517929077148438, 0.015636444091796875, 0.018754959106445312, 0.02187347412109375, 0.024991989135742188, 0.028110504150390625, 0.031229019165039062, 0.0343475341796875, 0.03746604919433594, 0.040584564208984375, 0.04370307922363281, 0.04682159423828125, 0.04994010925292969, 0.053058624267578125, 0.05617713928222656, 0.059295654296875, 0.06241416931152344, 0.06553268432617188, 0.06865119934082031, 0.07176971435546875, 0.07488822937011719, 0.07800674438476562, 0.08112525939941406, 0.0842437744140625, 0.08736228942871094, 0.09048080444335938, 0.09359931945800781, 0.09671783447265625, 0.09983634948730469, 0.10295486450195312, 0.10607337951660156, 0.10919189453125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 5.0, 4.0, 10.0, 11.0, 13.0, 18.0, 14.0, 27.0, 23.0, 25.0, 23.0, 34.0, 34.0, 46.0, 44.0, 52.0, 41.0, 43.0, 49.0, 49.0, 50.0, 40.0, 45.0, 42.0, 37.0, 33.0, 34.0, 29.0, 19.0, 25.0, 16.0, 17.0, 12.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05889892578125, -0.057271480560302734, -0.05564403533935547, -0.0540165901184082, -0.05238914489746094, -0.05076169967651367, -0.049134254455566406, -0.04750680923461914, -0.045879364013671875, -0.04425191879272461, -0.042624473571777344, -0.04099702835083008, -0.03936958312988281, -0.03774213790893555, -0.03611469268798828, -0.034487247467041016, -0.03285980224609375, -0.031232357025146484, -0.02960491180419922, -0.027977466583251953, -0.026350021362304688, -0.024722576141357422, -0.023095130920410156, -0.02146768569946289, -0.019840240478515625, -0.01821279525756836, -0.016585350036621094, -0.014957904815673828, -0.013330459594726562, -0.011703014373779297, -0.010075569152832031, -0.008448123931884766, -0.0068206787109375, -0.005193233489990234, -0.0035657882690429688, -0.0019383430480957031, -0.0003108978271484375, 0.0013165473937988281, 0.0029439926147460938, 0.004571437835693359, 0.006198883056640625, 0.00782632827758789, 0.009453773498535156, 0.011081218719482422, 0.012708663940429688, 0.014336109161376953, 0.01596355438232422, 0.017590999603271484, 0.01921844482421875, 0.020845890045166016, 0.02247333526611328, 0.024100780487060547, 0.025728225708007812, 0.027355670928955078, 0.028983116149902344, 0.03061056137084961, 0.032238006591796875, 0.03386545181274414, 0.035492897033691406, 0.03712034225463867, 0.03874778747558594, 0.0403752326965332, 0.04200267791748047, 0.043630123138427734, 0.045257568359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 5.0, 3.0, 12.0, 11.0, 14.0, 27.0, 28.0, 41.0, 48.0, 74.0, 99.0, 157.0, 275.0, 474.0, 920.0, 1991.0, 4695.0, 11278.0, 26574.0, 62095.0, 133537.0, 243818.0, 266252.0, 160711.0, 76922.0, 33476.0, 14090.0, 5833.0, 2536.0, 1173.0, 529.0, 316.0, 166.0, 107.0, 66.0, 63.0, 52.0, 27.0, 18.0, 15.0, 11.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11956787109375, -0.11595916748046875, -0.1123504638671875, -0.10874176025390625, -0.105133056640625, -0.10152435302734375, -0.0979156494140625, -0.09430694580078125, -0.0906982421875, -0.08708953857421875, -0.0834808349609375, -0.07987213134765625, -0.076263427734375, -0.07265472412109375, -0.0690460205078125, -0.06543731689453125, -0.06182861328125, -0.05821990966796875, -0.0546112060546875, -0.05100250244140625, -0.047393798828125, -0.04378509521484375, -0.0401763916015625, -0.03656768798828125, -0.032958984375, -0.02935028076171875, -0.0257415771484375, -0.02213287353515625, -0.018524169921875, -0.01491546630859375, -0.0113067626953125, -0.00769805908203125, -0.00408935546875, -0.00048065185546875, 0.0031280517578125, 0.00673675537109375, 0.010345458984375, 0.01395416259765625, 0.0175628662109375, 0.02117156982421875, 0.0247802734375, 0.02838897705078125, 0.0319976806640625, 0.03560638427734375, 0.039215087890625, 0.04282379150390625, 0.0464324951171875, 0.05004119873046875, 0.05364990234375, 0.05725860595703125, 0.0608673095703125, 0.06447601318359375, 0.068084716796875, 0.07169342041015625, 0.0753021240234375, 0.07891082763671875, 0.08251953125, 0.08612823486328125, 0.0897369384765625, 0.09334564208984375, 0.096954345703125, 0.10056304931640625, 0.1041717529296875, 0.10778045654296875, 0.11138916015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 7.0, 11.0, 8.0, 5.0, 11.0, 8.0, 6.0, 20.0, 22.0, 17.0, 20.0, 22.0, 34.0, 25.0, 27.0, 34.0, 35.0, 44.0, 34.0, 38.0, 46.0, 44.0, 41.0, 36.0, 35.0, 28.0, 31.0, 33.0, 42.0, 40.0, 28.0, 16.0, 23.0, 18.0, 14.0, 20.0, 9.0, 6.0, 9.0, 12.0, 7.0, 9.0, 6.0, 3.0, 1.0, 7.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.134765625, -0.1309185028076172, -0.12707138061523438, -0.12322425842285156, -0.11937713623046875, -0.11553001403808594, -0.11168289184570312, -0.10783576965332031, -0.1039886474609375, -0.10014152526855469, -0.09629440307617188, -0.09244728088378906, -0.08860015869140625, -0.08475303649902344, -0.08090591430664062, -0.07705879211425781, -0.073211669921875, -0.06936454772949219, -0.06551742553710938, -0.06167030334472656, -0.05782318115234375, -0.05397605895996094, -0.050128936767578125, -0.04628181457519531, -0.0424346923828125, -0.03858757019042969, -0.034740447998046875, -0.030893325805664062, -0.02704620361328125, -0.023199081420898438, -0.019351959228515625, -0.015504837036132812, -0.01165771484375, -0.0078105926513671875, -0.003963470458984375, -0.0001163482666015625, 0.00373077392578125, 0.0075778961181640625, 0.011425018310546875, 0.015272140502929688, 0.0191192626953125, 0.022966384887695312, 0.026813507080078125, 0.030660629272460938, 0.03450775146484375, 0.03835487365722656, 0.042201995849609375, 0.04604911804199219, 0.049896240234375, 0.05374336242675781, 0.057590484619140625, 0.06143760681152344, 0.06528472900390625, 0.06913185119628906, 0.07297897338867188, 0.07682609558105469, 0.0806732177734375, 0.08452033996582031, 0.08836746215820312, 0.09221458435058594, 0.09606170654296875, 0.09990882873535156, 0.10375595092773438, 0.10760307312011719, 0.1114501953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 7.0, 12.0, 9.0, 33.0, 49.0, 85.0, 133.0, 346.0, 637.0, 1482.0, 3555.0, 8926.0, 24269.0, 67032.0, 229479.0, 445356.0, 179022.0, 55208.0, 19981.0, 7568.0, 3038.0, 1206.0, 518.0, 265.0, 128.0, 70.0, 36.0, 21.0, 20.0, 12.0, 9.0, 4.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0628662109375, -0.06079864501953125, -0.0587310791015625, -0.05666351318359375, -0.054595947265625, -0.05252838134765625, -0.0504608154296875, -0.04839324951171875, -0.04632568359375, -0.04425811767578125, -0.0421905517578125, -0.04012298583984375, -0.038055419921875, -0.03598785400390625, -0.0339202880859375, -0.03185272216796875, -0.02978515625, -0.02771759033203125, -0.0256500244140625, -0.02358245849609375, -0.021514892578125, -0.01944732666015625, -0.0173797607421875, -0.01531219482421875, -0.01324462890625, -0.01117706298828125, -0.0091094970703125, -0.00704193115234375, -0.004974365234375, -0.00290679931640625, -0.0008392333984375, 0.00122833251953125, 0.0032958984375, 0.00536346435546875, 0.0074310302734375, 0.00949859619140625, 0.011566162109375, 0.01363372802734375, 0.0157012939453125, 0.01776885986328125, 0.01983642578125, 0.02190399169921875, 0.0239715576171875, 0.02603912353515625, 0.028106689453125, 0.03017425537109375, 0.0322418212890625, 0.03430938720703125, 0.036376953125, 0.03844451904296875, 0.0405120849609375, 0.04257965087890625, 0.044647216796875, 0.04671478271484375, 0.0487823486328125, 0.05084991455078125, 0.05291748046875, 0.05498504638671875, 0.0570526123046875, 0.05912017822265625, 0.061187744140625, 0.06325531005859375, 0.0653228759765625, 0.06739044189453125, 0.0694580078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 14.0, 6.0, 13.0, 16.0, 28.0, 25.0, 39.0, 51.0, 67.0, 70.0, 76.0, 64.0, 81.0, 77.0, 77.0, 57.0, 39.0, 43.0, 28.0, 28.0, 25.0, 16.0, 13.0, 9.0, 3.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1869316697120667e-05, -2.1267682313919067e-05, -2.0666047930717468e-05, -2.006441354751587e-05, -1.946277916431427e-05, -1.886114478111267e-05, -1.8259510397911072e-05, -1.7657876014709473e-05, -1.7056241631507874e-05, -1.6454607248306274e-05, -1.5852972865104675e-05, -1.5251338481903076e-05, -1.4649704098701477e-05, -1.4048069715499878e-05, -1.3446435332298279e-05, -1.284480094909668e-05, -1.224316656589508e-05, -1.1641532182693481e-05, -1.1039897799491882e-05, -1.0438263416290283e-05, -9.836629033088684e-06, -9.234994649887085e-06, -8.633360266685486e-06, -8.031725883483887e-06, -7.430091500282288e-06, -6.8284571170806885e-06, -6.226822733879089e-06, -5.62518835067749e-06, -5.023553967475891e-06, -4.421919584274292e-06, -3.820285201072693e-06, -3.2186508178710938e-06, -2.6170164346694946e-06, -2.0153820514678955e-06, -1.4137476682662964e-06, -8.121132850646973e-07, -2.1047890186309814e-07, 3.91155481338501e-07, 9.927898645401e-07, 1.5944242477416992e-06, 2.1960586309432983e-06, 2.7976930141448975e-06, 3.3993273973464966e-06, 4.000961780548096e-06, 4.602596163749695e-06, 5.204230546951294e-06, 5.805864930152893e-06, 6.407499313354492e-06, 7.009133696556091e-06, 7.6107680797576904e-06, 8.21240246295929e-06, 8.814036846160889e-06, 9.415671229362488e-06, 1.0017305612564087e-05, 1.0618939995765686e-05, 1.1220574378967285e-05, 1.1822208762168884e-05, 1.2423843145370483e-05, 1.3025477528572083e-05, 1.3627111911773682e-05, 1.422874629497528e-05, 1.483038067817688e-05, 1.543201506137848e-05, 1.6033649444580078e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 14.0, 16.0, 20.0, 24.0, 39.0, 52.0, 82.0, 109.0, 168.0, 232.0, 400.0, 646.0, 1184.0, 2166.0, 4278.0, 9061.0, 18322.0, 37955.0, 87686.0, 257209.0, 368201.0, 151546.0, 56362.0, 26243.0, 13131.0, 6319.0, 3053.0, 1641.0, 881.0, 527.0, 322.0, 190.0, 152.0, 103.0, 66.0, 49.0, 28.0, 27.0, 10.0, 5.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044403076171875, -0.04288530349731445, -0.041367530822753906, -0.03984975814819336, -0.03833198547363281, -0.036814212799072266, -0.03529644012451172, -0.03377866744995117, -0.032260894775390625, -0.030743122100830078, -0.02922534942626953, -0.027707576751708984, -0.026189804077148438, -0.02467203140258789, -0.023154258728027344, -0.021636486053466797, -0.02011871337890625, -0.018600940704345703, -0.017083168029785156, -0.01556539535522461, -0.014047622680664062, -0.012529850006103516, -0.011012077331542969, -0.009494304656982422, -0.007976531982421875, -0.006458759307861328, -0.004940986633300781, -0.0034232139587402344, -0.0019054412841796875, -0.0003876686096191406, 0.0011301040649414062, 0.002647876739501953, 0.0041656494140625, 0.005683422088623047, 0.007201194763183594, 0.00871896743774414, 0.010236740112304688, 0.011754512786865234, 0.013272285461425781, 0.014790058135986328, 0.016307830810546875, 0.017825603485107422, 0.01934337615966797, 0.020861148834228516, 0.022378921508789062, 0.02389669418334961, 0.025414466857910156, 0.026932239532470703, 0.02845001220703125, 0.029967784881591797, 0.031485557556152344, 0.03300333023071289, 0.03452110290527344, 0.036038875579833984, 0.03755664825439453, 0.03907442092895508, 0.040592193603515625, 0.04210996627807617, 0.04362773895263672, 0.045145511627197266, 0.04666328430175781, 0.04818105697631836, 0.049698829650878906, 0.05121660232543945, 0.052734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 4.0, 10.0, 8.0, 5.0, 12.0, 26.0, 21.0, 56.0, 61.0, 87.0, 130.0, 129.0, 128.0, 91.0, 66.0, 58.0, 32.0, 25.0, 11.0, 4.0, 8.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07220458984375, -0.07017993927001953, -0.06815528869628906, -0.0661306381225586, -0.06410598754882812, -0.062081336975097656, -0.06005668640136719, -0.05803203582763672, -0.05600738525390625, -0.05398273468017578, -0.05195808410644531, -0.049933433532714844, -0.047908782958984375, -0.045884132385253906, -0.04385948181152344, -0.04183483123779297, -0.0398101806640625, -0.03778553009033203, -0.03576087951660156, -0.033736228942871094, -0.031711578369140625, -0.029686927795410156, -0.027662277221679688, -0.02563762664794922, -0.02361297607421875, -0.02158832550048828, -0.019563674926757812, -0.017539024353027344, -0.015514373779296875, -0.013489723205566406, -0.011465072631835938, -0.009440422058105469, -0.007415771484375, -0.005391120910644531, -0.0033664703369140625, -0.0013418197631835938, 0.000682830810546875, 0.0027074813842773438, 0.0047321319580078125, 0.006756782531738281, 0.00878143310546875, 0.010806083679199219, 0.012830734252929688, 0.014855384826660156, 0.016880035400390625, 0.018904685974121094, 0.020929336547851562, 0.02295398712158203, 0.0249786376953125, 0.02700328826904297, 0.029027938842773438, 0.031052589416503906, 0.033077239990234375, 0.035101890563964844, 0.03712654113769531, 0.03915119171142578, 0.04117584228515625, 0.04320049285888672, 0.04522514343261719, 0.047249794006347656, 0.049274444580078125, 0.051299095153808594, 0.05332374572753906, 0.05534839630126953, 0.057373046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 6.0, 3.0, 11.0, 19.0, 14.0, 21.0, 29.0, 36.0, 60.0, 68.0, 70.0, 75.0, 73.0, 72.0, 70.0, 73.0, 64.0, 50.0, 40.0, 27.0, 23.0, 15.0, 20.0, 16.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2400253862142563, -0.22900430858135223, -0.21798323094844818, -0.20696213841438293, -0.19594106078147888, -0.18491998314857483, -0.17389890551567078, -0.16287782788276672, -0.15185675024986267, -0.14083567261695862, -0.12981459498405457, -0.11879350990056992, -0.10777243226766586, -0.09675135463476181, -0.08573026955127716, -0.07470919191837311, -0.06368811428546906, -0.052667036652565, -0.04164595529437065, -0.0306248739361763, -0.019603796303272247, -0.008582718670368195, 0.002438366413116455, 0.013459444046020508, 0.02448052167892456, 0.03550159931182861, 0.046522680670022964, 0.057543762028217316, 0.06856483966112137, 0.07958591729402542, 0.09060700237751007, 0.10162808001041412, 0.11264914274215698, 0.12367022037506104, 0.1346912980079651, 0.14571237564086914, 0.1567334532737732, 0.16775453090667725, 0.1787756234407425, 0.18979670107364655, 0.2008177787065506, 0.21183885633945465, 0.2228599339723587, 0.23388102650642395, 0.244902104139328, 0.25592318177223206, 0.2669442594051361, 0.27796533703804016, 0.2889864146709442, 0.30000749230384827, 0.3110285699367523, 0.32204964756965637, 0.3330707252025604, 0.3440918028354645, 0.3551129102706909, 0.36613398790359497, 0.377155065536499, 0.3881761431694031, 0.39919722080230713, 0.4102182984352112, 0.42123937606811523, 0.4322604537010193, 0.44328153133392334, 0.4543026089668274, 0.46532368659973145]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 8.0, 15.0, 11.0, 17.0, 15.0, 16.0, 19.0, 19.0, 37.0, 24.0, 29.0, 28.0, 33.0, 44.0, 41.0, 48.0, 30.0, 41.0, 41.0, 39.0, 37.0, 28.0, 41.0, 27.0, 30.0, 34.0, 31.0, 29.0, 23.0, 26.0, 16.0, 19.0, 19.0, 13.0, 10.0, 11.0, 8.0, 6.0, 5.0, 5.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.35033005475997925, -0.33945605158805847, -0.3285820186138153, -0.31770801544189453, -0.30683398246765137, -0.2959599792957306, -0.2850859761238098, -0.27421194314956665, -0.2633379399776459, -0.2524639368057251, -0.24158990383148193, -0.23071590065956116, -0.2198418825864792, -0.20896786451339722, -0.19809386134147644, -0.18721984326839447, -0.1763458251953125, -0.16547180712223053, -0.15459778904914856, -0.14372378587722778, -0.1328497678041458, -0.12197574973106384, -0.11110173910856247, -0.1002277284860611, -0.08935371041297913, -0.07847969233989716, -0.06760568171739578, -0.05673166736960411, -0.04585765302181244, -0.03498363867402077, -0.024109624326229095, -0.013235613703727722, -0.002361595630645752, 0.00851241871714592, 0.01938643306493759, 0.030260447412729263, 0.041134461760520935, 0.05200847610831261, 0.06288249045610428, 0.07375650107860565, 0.08463051915168762, 0.09550453722476959, 0.10637854784727097, 0.11725255846977234, 0.1281265765428543, 0.13900059461593628, 0.14987459778785706, 0.16074861586093903, 0.171622633934021, 0.18249665200710297, 0.19337067008018494, 0.2042446732521057, 0.21511869132518768, 0.22599270939826965, 0.23686671257019043, 0.2477407306432724, 0.25861474871635437, 0.26948875188827515, 0.2803627848625183, 0.2912367880344391, 0.30211079120635986, 0.312984824180603, 0.3238588273525238, 0.3347328305244446, 0.34560686349868774]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 15.0, 14.0, 24.0, 30.0, 61.0, 55.0, 94.0, 124.0, 169.0, 312.0, 472.0, 745.0, 1381.0, 2470.0, 4488.0, 9342.0, 19663.0, 46490.0, 124411.0, 453889.0, 1586749.0, 1376279.0, 374889.0, 113832.0, 43189.0, 18206.0, 8318.0, 4000.0, 1996.0, 1062.0, 599.0, 344.0, 203.0, 126.0, 85.0, 57.0, 22.0, 26.0, 16.0, 11.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07854747772216797, -0.07616233825683594, -0.0737771987915039, -0.07139205932617188, -0.06900691986083984, -0.06662178039550781, -0.06423664093017578, -0.06185150146484375, -0.05946636199951172, -0.05708122253417969, -0.054696083068847656, -0.052310943603515625, -0.049925804138183594, -0.04754066467285156, -0.04515552520751953, -0.0427703857421875, -0.04038524627685547, -0.03800010681152344, -0.035614967346191406, -0.033229827880859375, -0.030844688415527344, -0.028459548950195312, -0.02607440948486328, -0.02368927001953125, -0.02130413055419922, -0.018918991088867188, -0.016533851623535156, -0.014148712158203125, -0.011763572692871094, -0.009378433227539062, -0.006993293762207031, -0.004608154296875, -0.0022230148315429688, 0.0001621246337890625, 0.0025472640991210938, 0.004932403564453125, 0.007317543029785156, 0.009702682495117188, 0.012087821960449219, 0.01447296142578125, 0.01685810089111328, 0.019243240356445312, 0.021628379821777344, 0.024013519287109375, 0.026398658752441406, 0.028783798217773438, 0.03116893768310547, 0.0335540771484375, 0.03593921661376953, 0.03832435607910156, 0.040709495544433594, 0.043094635009765625, 0.045479774475097656, 0.04786491394042969, 0.05025005340576172, 0.05263519287109375, 0.05502033233642578, 0.05740547180175781, 0.059790611267089844, 0.062175750732421875, 0.0645608901977539, 0.06694602966308594, 0.06933116912841797, 0.07171630859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 6.0, 2.0, 2.0, 11.0, 9.0, 16.0, 11.0, 13.0, 29.0, 19.0, 29.0, 26.0, 30.0, 39.0, 33.0, 45.0, 43.0, 41.0, 34.0, 34.0, 50.0, 36.0, 47.0, 51.0, 38.0, 38.0, 45.0, 33.0, 26.0, 27.0, 21.0, 18.0, 16.0, 19.0, 17.0, 8.0, 10.0, 11.0, 3.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06060791015625, -0.05891847610473633, -0.057229042053222656, -0.055539608001708984, -0.05385017395019531, -0.05216073989868164, -0.05047130584716797, -0.0487818717956543, -0.047092437744140625, -0.04540300369262695, -0.04371356964111328, -0.04202413558959961, -0.04033470153808594, -0.038645267486572266, -0.036955833435058594, -0.03526639938354492, -0.03357696533203125, -0.03188753128051758, -0.030198097229003906, -0.028508663177490234, -0.026819229125976562, -0.02512979507446289, -0.02344036102294922, -0.021750926971435547, -0.020061492919921875, -0.018372058868408203, -0.01668262481689453, -0.01499319076538086, -0.013303756713867188, -0.011614322662353516, -0.009924888610839844, -0.008235454559326172, -0.0065460205078125, -0.004856586456298828, -0.0031671524047851562, -0.0014777183532714844, 0.0002117156982421875, 0.0019011497497558594, 0.0035905838012695312, 0.005280017852783203, 0.006969451904296875, 0.008658885955810547, 0.010348320007324219, 0.01203775405883789, 0.013727188110351562, 0.015416622161865234, 0.017106056213378906, 0.018795490264892578, 0.02048492431640625, 0.022174358367919922, 0.023863792419433594, 0.025553226470947266, 0.027242660522460938, 0.02893209457397461, 0.03062152862548828, 0.03231096267700195, 0.034000396728515625, 0.0356898307800293, 0.03737926483154297, 0.03906869888305664, 0.04075813293457031, 0.042447566986083984, 0.044137001037597656, 0.04582643508911133, 0.047515869140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 4.0, 11.0, 14.0, 17.0, 18.0, 31.0, 34.0, 57.0, 71.0, 113.0, 170.0, 240.0, 437.0, 750.0, 1542.0, 3271.0, 7954.0, 21838.0, 68619.0, 248612.0, 1061051.0, 2026238.0, 548615.0, 139387.0, 40902.0, 13830.0, 5458.0, 2315.0, 1101.0, 590.0, 362.0, 194.0, 117.0, 91.0, 52.0, 36.0, 28.0, 33.0, 15.0, 13.0, 13.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.10528564453125, -0.10202407836914062, -0.09876251220703125, -0.09550094604492188, -0.0922393798828125, -0.08897781372070312, -0.08571624755859375, -0.08245468139648438, -0.079193115234375, -0.07593154907226562, -0.07266998291015625, -0.06940841674804688, -0.0661468505859375, -0.06288528442382812, -0.05962371826171875, -0.056362152099609375, -0.0531005859375, -0.049839019775390625, -0.04657745361328125, -0.043315887451171875, -0.0400543212890625, -0.036792755126953125, -0.03353118896484375, -0.030269622802734375, -0.027008056640625, -0.023746490478515625, -0.02048492431640625, -0.017223358154296875, -0.0139617919921875, -0.010700225830078125, -0.00743865966796875, -0.004177093505859375, -0.00091552734375, 0.002346038818359375, 0.00560760498046875, 0.008869171142578125, 0.0121307373046875, 0.015392303466796875, 0.01865386962890625, 0.021915435791015625, 0.025177001953125, 0.028438568115234375, 0.03170013427734375, 0.034961700439453125, 0.0382232666015625, 0.041484832763671875, 0.04474639892578125, 0.048007965087890625, 0.05126953125, 0.054531097412109375, 0.05779266357421875, 0.061054229736328125, 0.0643157958984375, 0.06757736206054688, 0.07083892822265625, 0.07410049438476562, 0.077362060546875, 0.08062362670898438, 0.08388519287109375, 0.08714675903320312, 0.0904083251953125, 0.09366989135742188, 0.09693145751953125, 0.10019302368164062, 0.10345458984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 16.0, 15.0, 29.0, 35.0, 50.0, 64.0, 88.0, 155.0, 160.0, 220.0, 332.0, 437.0, 568.0, 554.0, 332.0, 281.0, 189.0, 142.0, 101.0, 61.0, 48.0, 45.0, 28.0, 22.0, 16.0, 13.0, 15.0, 9.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0709228515625, -0.067779541015625, -0.06463623046875, -0.061492919921875, -0.058349609375, -0.055206298828125, -0.05206298828125, -0.048919677734375, -0.0457763671875, -0.042633056640625, -0.03948974609375, -0.036346435546875, -0.033203125, -0.030059814453125, -0.02691650390625, -0.023773193359375, -0.0206298828125, -0.017486572265625, -0.01434326171875, -0.011199951171875, -0.008056640625, -0.004913330078125, -0.00177001953125, 0.001373291015625, 0.0045166015625, 0.007659912109375, 0.01080322265625, 0.013946533203125, 0.01708984375, 0.020233154296875, 0.02337646484375, 0.026519775390625, 0.0296630859375, 0.032806396484375, 0.03594970703125, 0.039093017578125, 0.042236328125, 0.045379638671875, 0.04852294921875, 0.051666259765625, 0.0548095703125, 0.057952880859375, 0.06109619140625, 0.064239501953125, 0.0673828125, 0.070526123046875, 0.07366943359375, 0.076812744140625, 0.0799560546875, 0.083099365234375, 0.08624267578125, 0.089385986328125, 0.092529296875, 0.095672607421875, 0.09881591796875, 0.101959228515625, 0.1051025390625, 0.108245849609375, 0.11138916015625, 0.114532470703125, 0.11767578125, 0.120819091796875, 0.12396240234375, 0.127105712890625, 0.1302490234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 17.0, 27.0, 56.0, 77.0, 104.0, 138.0, 162.0, 135.0, 104.0, 67.0, 50.0, 30.0, 16.0, 12.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.018960952758789, -0.9949027895927429, -0.9708446860313416, -0.9467865228652954, -0.922728419303894, -0.8986702561378479, -0.8746121525764465, -0.8505539894104004, -0.826495885848999, -0.8024377226829529, -0.7783796191215515, -0.7543214559555054, -0.730263352394104, -0.7062051892280579, -0.6821470856666565, -0.6580889225006104, -0.634030818939209, -0.6099726557731628, -0.5859145522117615, -0.5618563890457153, -0.537798285484314, -0.5137401223182678, -0.48968201875686646, -0.4656238555908203, -0.44156569242477417, -0.4175075590610504, -0.39344942569732666, -0.3693912923336029, -0.34533315896987915, -0.3212750256061554, -0.29721689224243164, -0.2731587290763855, -0.24910062551498413, -0.22504249215126038, -0.20098435878753662, -0.17692622542381287, -0.1528680920600891, -0.12880995869636536, -0.10475181043148041, -0.08069367706775665, -0.0566355437040329, -0.03257741034030914, -0.00851927325129509, 0.015538863837718964, 0.03959699720144272, 0.06365513056516647, 0.08771327137947083, 0.11177140474319458, 0.13582953810691833, 0.1598876714706421, 0.18394580483436584, 0.2080039381980896, 0.23206207156181335, 0.2561202049255371, 0.28017836809158325, 0.3042364716529846, 0.32829463481903076, 0.3523527681827545, 0.37641090154647827, 0.400469034910202, 0.4245271682739258, 0.44858530163764954, 0.4726434350013733, 0.49670159816741943, 0.5207597017288208]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 12.0, 4.0, 9.0, 12.0, 14.0, 12.0, 18.0, 14.0, 18.0, 19.0, 26.0, 25.0, 25.0, 29.0, 21.0, 27.0, 28.0, 32.0, 29.0, 43.0, 30.0, 39.0, 39.0, 36.0, 24.0, 39.0, 29.0, 36.0, 26.0, 27.0, 25.0, 23.0, 21.0, 27.0, 28.0, 21.0, 17.0, 22.0, 11.0, 9.0, 7.0, 8.0, 5.0, 4.0, 2.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.24354857206344604, -0.23560334742069244, -0.22765812277793884, -0.21971288323402405, -0.21176765859127045, -0.20382243394851685, -0.19587720930576324, -0.18793198466300964, -0.17998674511909485, -0.17204152047634125, -0.16409629583358765, -0.15615105628967285, -0.14820583164691925, -0.14026060700416565, -0.13231538236141205, -0.12437015771865845, -0.11642493307590485, -0.10847970843315125, -0.10053447633981705, -0.09258925169706345, -0.08464401960372925, -0.07669879496097565, -0.06875357031822205, -0.060808341950178146, -0.05286311358213425, -0.04491788521409035, -0.03697265684604645, -0.029027432203292847, -0.021082203835248947, -0.013136975467205048, -0.0051917508244514465, 0.002753477543592453, 0.010698705911636353, 0.018643934279680252, 0.026589160785079002, 0.03453438729047775, 0.04247961565852165, 0.05042484402656555, 0.05837006866931915, 0.06631529331207275, 0.07426052540540695, 0.08220575004816055, 0.09015098214149475, 0.09809620678424835, 0.10604143142700195, 0.11398666352033615, 0.12193188816308975, 0.12987712025642395, 0.13782234489917755, 0.14576756954193115, 0.15371279418468475, 0.16165801882743835, 0.16960325837135315, 0.17754848301410675, 0.18549370765686035, 0.19343893229961395, 0.20138415694236755, 0.20932938158512115, 0.21727460622787476, 0.22521984577178955, 0.23316507041454315, 0.24111029505729675, 0.24905551970005035, 0.25700074434280396, 0.26494598388671875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 25.0, 35.0, 45.0, 80.0, 96.0, 200.0, 292.0, 441.0, 764.0, 1298.0, 2225.0, 3692.0, 6178.0, 10518.0, 17883.0, 29974.0, 48990.0, 77085.0, 118585.0, 167431.0, 180769.0, 138794.0, 92851.0, 58625.0, 37005.0, 22315.0, 13037.0, 7940.0, 4644.0, 2626.0, 1607.0, 937.0, 520.0, 354.0, 240.0, 127.0, 89.0, 60.0, 57.0, 25.0, 20.0, 11.0, 10.0, 9.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.099609375, -0.09651660919189453, -0.09342384338378906, -0.0903310775756836, -0.08723831176757812, -0.08414554595947266, -0.08105278015136719, -0.07796001434326172, -0.07486724853515625, -0.07177448272705078, -0.06868171691894531, -0.06558895111083984, -0.062496185302734375, -0.059403419494628906, -0.05631065368652344, -0.05321788787841797, -0.0501251220703125, -0.04703235626220703, -0.04393959045410156, -0.040846824645996094, -0.037754058837890625, -0.034661293029785156, -0.03156852722167969, -0.02847576141357422, -0.02538299560546875, -0.02229022979736328, -0.019197463989257812, -0.016104698181152344, -0.013011932373046875, -0.009919166564941406, -0.0068264007568359375, -0.0037336349487304688, -0.000640869140625, 0.0024518966674804688, 0.0055446624755859375, 0.008637428283691406, 0.011730194091796875, 0.014822959899902344, 0.017915725708007812, 0.02100849151611328, 0.02410125732421875, 0.02719402313232422, 0.030286788940429688, 0.033379554748535156, 0.036472320556640625, 0.039565086364746094, 0.04265785217285156, 0.04575061798095703, 0.0488433837890625, 0.05193614959716797, 0.05502891540527344, 0.058121681213378906, 0.061214447021484375, 0.06430721282958984, 0.06739997863769531, 0.07049274444580078, 0.07358551025390625, 0.07667827606201172, 0.07977104187011719, 0.08286380767822266, 0.08595657348632812, 0.0890493392944336, 0.09214210510253906, 0.09523487091064453, 0.09832763671875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 1.0, 7.0, 10.0, 5.0, 19.0, 14.0, 10.0, 25.0, 25.0, 25.0, 32.0, 34.0, 29.0, 42.0, 36.0, 50.0, 48.0, 54.0, 39.0, 43.0, 49.0, 45.0, 44.0, 43.0, 41.0, 29.0, 30.0, 36.0, 25.0, 18.0, 21.0, 15.0, 13.0, 11.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.062103271484375, -0.06035423278808594, -0.058605194091796875, -0.05685615539550781, -0.05510711669921875, -0.05335807800292969, -0.051609039306640625, -0.04986000061035156, -0.0481109619140625, -0.04636192321777344, -0.044612884521484375, -0.04286384582519531, -0.04111480712890625, -0.03936576843261719, -0.037616729736328125, -0.03586769104003906, -0.03411865234375, -0.03236961364746094, -0.030620574951171875, -0.028871536254882812, -0.02712249755859375, -0.025373458862304688, -0.023624420166015625, -0.021875381469726562, -0.0201263427734375, -0.018377304077148438, -0.016628265380859375, -0.014879226684570312, -0.01313018798828125, -0.011381149291992188, -0.009632110595703125, -0.007883071899414062, -0.006134033203125, -0.0043849945068359375, -0.002635955810546875, -0.0008869171142578125, 0.00086212158203125, 0.0026111602783203125, 0.004360198974609375, 0.0061092376708984375, 0.0078582763671875, 0.009607315063476562, 0.011356353759765625, 0.013105392456054688, 0.01485443115234375, 0.016603469848632812, 0.018352508544921875, 0.020101547241210938, 0.0218505859375, 0.023599624633789062, 0.025348663330078125, 0.027097702026367188, 0.02884674072265625, 0.030595779418945312, 0.032344818115234375, 0.03409385681152344, 0.0358428955078125, 0.03759193420410156, 0.039340972900390625, 0.04109001159667969, 0.04283905029296875, 0.04458808898925781, 0.046337127685546875, 0.04808616638183594, 0.049835205078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 3.0, 10.0, 11.0, 26.0, 34.0, 54.0, 107.0, 163.0, 290.0, 566.0, 1112.0, 2485.0, 5774.0, 13485.0, 34994.0, 92378.0, 236164.0, 352359.0, 189090.0, 72684.0, 27389.0, 10878.0, 4556.0, 2022.0, 945.0, 443.0, 232.0, 113.0, 72.0, 38.0, 28.0, 17.0, 16.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17200088500976562, -0.16614532470703125, -0.16028976440429688, -0.1544342041015625, -0.14857864379882812, -0.14272308349609375, -0.13686752319335938, -0.131011962890625, -0.12515640258789062, -0.11930084228515625, -0.11344528198242188, -0.1075897216796875, -0.10173416137695312, -0.09587860107421875, -0.09002304077148438, -0.08416748046875, -0.07831192016601562, -0.07245635986328125, -0.06660079956054688, -0.0607452392578125, -0.054889678955078125, -0.04903411865234375, -0.043178558349609375, -0.037322998046875, -0.031467437744140625, -0.02561187744140625, -0.019756317138671875, -0.0139007568359375, -0.008045196533203125, -0.00218963623046875, 0.003665924072265625, 0.009521484375, 0.015377044677734375, 0.02123260498046875, 0.027088165283203125, 0.0329437255859375, 0.038799285888671875, 0.04465484619140625, 0.050510406494140625, 0.056365966796875, 0.062221527099609375, 0.06807708740234375, 0.07393264770507812, 0.0797882080078125, 0.08564376831054688, 0.09149932861328125, 0.09735488891601562, 0.10321044921875, 0.10906600952148438, 0.11492156982421875, 0.12077713012695312, 0.1266326904296875, 0.13248825073242188, 0.13834381103515625, 0.14419937133789062, 0.150054931640625, 0.15591049194335938, 0.16176605224609375, 0.16762161254882812, 0.1734771728515625, 0.17933273315429688, 0.18518829345703125, 0.19104385375976562, 0.1968994140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 9.0, 8.0, 16.0, 10.0, 15.0, 29.0, 14.0, 28.0, 25.0, 26.0, 32.0, 40.0, 40.0, 55.0, 28.0, 49.0, 35.0, 48.0, 52.0, 34.0, 46.0, 50.0, 29.0, 47.0, 38.0, 19.0, 18.0, 20.0, 18.0, 22.0, 14.0, 11.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 4.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16070175170898438, -0.15550994873046875, -0.15031814575195312, -0.1451263427734375, -0.13993453979492188, -0.13474273681640625, -0.12955093383789062, -0.124359130859375, -0.11916732788085938, -0.11397552490234375, -0.10878372192382812, -0.1035919189453125, -0.09840011596679688, -0.09320831298828125, -0.08801651000976562, -0.08282470703125, -0.07763290405273438, -0.07244110107421875, -0.06724929809570312, -0.0620574951171875, -0.056865692138671875, -0.05167388916015625, -0.046482086181640625, -0.041290283203125, -0.036098480224609375, -0.03090667724609375, -0.025714874267578125, -0.0205230712890625, -0.015331268310546875, -0.01013946533203125, -0.004947662353515625, 0.000244140625, 0.005435943603515625, 0.01062774658203125, 0.015819549560546875, 0.0210113525390625, 0.026203155517578125, 0.03139495849609375, 0.036586761474609375, 0.041778564453125, 0.046970367431640625, 0.05216217041015625, 0.057353973388671875, 0.0625457763671875, 0.06773757934570312, 0.07292938232421875, 0.07812118530273438, 0.08331298828125, 0.08850479125976562, 0.09369659423828125, 0.09888839721679688, 0.1040802001953125, 0.10927200317382812, 0.11446380615234375, 0.11965560913085938, 0.124847412109375, 0.13003921508789062, 0.13523101806640625, 0.14042282104492188, 0.1456146240234375, 0.15080642700195312, 0.15599822998046875, 0.16119003295898438, 0.1663818359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 9.0, 15.0, 24.0, 22.0, 49.0, 58.0, 87.0, 118.0, 202.0, 321.0, 513.0, 764.0, 1343.0, 2331.0, 4313.0, 7877.0, 15397.0, 29569.0, 58477.0, 110916.0, 189070.0, 233217.0, 178904.0, 102912.0, 53442.0, 27670.0, 14223.0, 7258.0, 3979.0, 2145.0, 1270.0, 693.0, 464.0, 279.0, 196.0, 112.0, 95.0, 66.0, 43.0, 36.0, 29.0, 11.0, 10.0, 10.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.044677734375, -0.043341636657714844, -0.04200553894042969, -0.04066944122314453, -0.039333343505859375, -0.03799724578857422, -0.03666114807128906, -0.035325050354003906, -0.03398895263671875, -0.032652854919433594, -0.03131675720214844, -0.02998065948486328, -0.028644561767578125, -0.02730846405029297, -0.025972366333007812, -0.024636268615722656, -0.0233001708984375, -0.021964073181152344, -0.020627975463867188, -0.01929187774658203, -0.017955780029296875, -0.01661968231201172, -0.015283584594726562, -0.013947486877441406, -0.01261138916015625, -0.011275291442871094, -0.009939193725585938, -0.008603096008300781, -0.007266998291015625, -0.005930900573730469, -0.0045948028564453125, -0.0032587051391601562, -0.001922607421875, -0.0005865097045898438, 0.0007495880126953125, 0.0020856857299804688, 0.003421783447265625, 0.004757881164550781, 0.0060939788818359375, 0.007430076599121094, 0.00876617431640625, 0.010102272033691406, 0.011438369750976562, 0.012774467468261719, 0.014110565185546875, 0.015446662902832031, 0.016782760620117188, 0.018118858337402344, 0.0194549560546875, 0.020791053771972656, 0.022127151489257812, 0.02346324920654297, 0.024799346923828125, 0.02613544464111328, 0.027471542358398438, 0.028807640075683594, 0.03014373779296875, 0.031479835510253906, 0.03281593322753906, 0.03415203094482422, 0.035488128662109375, 0.03682422637939453, 0.03816032409667969, 0.039496421813964844, 0.04083251953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 10.0, 8.0, 14.0, 9.0, 27.0, 35.0, 51.0, 75.0, 84.0, 101.0, 104.0, 106.0, 72.0, 73.0, 65.0, 41.0, 42.0, 21.0, 7.0, 16.0, 10.0, 10.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.155732363462448e-05, -2.0643696188926697e-05, -1.9730068743228912e-05, -1.8816441297531128e-05, -1.7902813851833344e-05, -1.698918640613556e-05, -1.6075558960437775e-05, -1.516193151473999e-05, -1.4248304069042206e-05, -1.3334676623344421e-05, -1.2421049177646637e-05, -1.1507421731948853e-05, -1.0593794286251068e-05, -9.680166840553284e-06, -8.7665393948555e-06, -7.852911949157715e-06, -6.93928450345993e-06, -6.025657057762146e-06, -5.1120296120643616e-06, -4.198402166366577e-06, -3.2847747206687927e-06, -2.3711472749710083e-06, -1.4575198292732239e-06, -5.438923835754395e-07, 3.6973506212234497e-07, 1.2833625078201294e-06, 2.196989953517914e-06, 3.1106173992156982e-06, 4.024244844913483e-06, 4.937872290611267e-06, 5.8514997363090515e-06, 6.765127182006836e-06, 7.67875462770462e-06, 8.592382073402405e-06, 9.50600951910019e-06, 1.0419636964797974e-05, 1.1333264410495758e-05, 1.2246891856193542e-05, 1.3160519301891327e-05, 1.4074146747589111e-05, 1.4987774193286896e-05, 1.590140163898468e-05, 1.6815029084682465e-05, 1.772865653038025e-05, 1.8642283976078033e-05, 1.9555911421775818e-05, 2.0469538867473602e-05, 2.1383166313171387e-05, 2.229679375886917e-05, 2.3210421204566956e-05, 2.412404865026474e-05, 2.5037676095962524e-05, 2.595130354166031e-05, 2.6864930987358093e-05, 2.7778558433055878e-05, 2.8692185878753662e-05, 2.9605813324451447e-05, 3.051944077014923e-05, 3.1433068215847015e-05, 3.23466956615448e-05, 3.3260323107242584e-05, 3.417395055294037e-05, 3.508757799863815e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 9.0, 8.0, 20.0, 21.0, 41.0, 66.0, 99.0, 174.0, 213.0, 396.0, 567.0, 922.0, 1485.0, 2421.0, 3894.0, 6673.0, 10944.0, 18088.0, 29337.0, 47723.0, 76385.0, 118477.0, 162430.0, 174269.0, 140875.0, 95720.0, 60519.0, 37808.0, 22992.0, 14001.0, 8482.0, 5243.0, 3136.0, 1896.0, 1137.0, 742.0, 487.0, 281.0, 190.0, 143.0, 83.0, 40.0, 30.0, 24.0, 16.0, 12.0, 14.0, 9.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.029937744140625, -0.029009342193603516, -0.02808094024658203, -0.027152538299560547, -0.026224136352539062, -0.025295734405517578, -0.024367332458496094, -0.02343893051147461, -0.022510528564453125, -0.02158212661743164, -0.020653724670410156, -0.019725322723388672, -0.018796920776367188, -0.017868518829345703, -0.01694011688232422, -0.016011714935302734, -0.01508331298828125, -0.014154911041259766, -0.013226509094238281, -0.012298107147216797, -0.011369705200195312, -0.010441303253173828, -0.009512901306152344, -0.00858449935913086, -0.007656097412109375, -0.006727695465087891, -0.005799293518066406, -0.004870891571044922, -0.0039424896240234375, -0.003014087677001953, -0.0020856857299804688, -0.0011572837829589844, -0.0002288818359375, 0.0006995201110839844, 0.0016279220581054688, 0.002556324005126953, 0.0034847259521484375, 0.004413127899169922, 0.005341529846191406, 0.006269931793212891, 0.007198333740234375, 0.00812673568725586, 0.009055137634277344, 0.009983539581298828, 0.010911941528320312, 0.011840343475341797, 0.012768745422363281, 0.013697147369384766, 0.01462554931640625, 0.015553951263427734, 0.01648235321044922, 0.017410755157470703, 0.018339157104492188, 0.019267559051513672, 0.020195960998535156, 0.02112436294555664, 0.022052764892578125, 0.02298116683959961, 0.023909568786621094, 0.024837970733642578, 0.025766372680664062, 0.026694774627685547, 0.02762317657470703, 0.028551578521728516, 0.02947998046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 7.0, 10.0, 12.0, 13.0, 12.0, 24.0, 16.0, 32.0, 28.0, 32.0, 40.0, 42.0, 50.0, 50.0, 56.0, 70.0, 64.0, 59.0, 50.0, 41.0, 40.0, 36.0, 31.0, 36.0, 30.0, 25.0, 13.0, 19.0, 12.0, 11.0, 5.0, 10.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.043426513671875, -0.042124271392822266, -0.04082202911376953, -0.0395197868347168, -0.03821754455566406, -0.03691530227661133, -0.035613059997558594, -0.03431081771850586, -0.033008575439453125, -0.03170633316040039, -0.030404090881347656, -0.029101848602294922, -0.027799606323242188, -0.026497364044189453, -0.02519512176513672, -0.023892879486083984, -0.02259063720703125, -0.021288394927978516, -0.01998615264892578, -0.018683910369873047, -0.017381668090820312, -0.016079425811767578, -0.014777183532714844, -0.01347494125366211, -0.012172698974609375, -0.01087045669555664, -0.009568214416503906, -0.008265972137451172, -0.0069637298583984375, -0.005661487579345703, -0.004359245300292969, -0.0030570030212402344, -0.0017547607421875, -0.0004525184631347656, 0.0008497238159179688, 0.002151966094970703, 0.0034542083740234375, 0.004756450653076172, 0.006058692932128906, 0.007360935211181641, 0.008663177490234375, 0.00996541976928711, 0.011267662048339844, 0.012569904327392578, 0.013872146606445312, 0.015174388885498047, 0.01647663116455078, 0.017778873443603516, 0.01908111572265625, 0.020383358001708984, 0.02168560028076172, 0.022987842559814453, 0.024290084838867188, 0.025592327117919922, 0.026894569396972656, 0.02819681167602539, 0.029499053955078125, 0.03080129623413086, 0.032103538513183594, 0.03340578079223633, 0.03470802307128906, 0.0360102653503418, 0.03731250762939453, 0.038614749908447266, 0.0399169921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 8.0, 17.0, 21.0, 25.0, 57.0, 67.0, 71.0, 73.0, 78.0, 77.0, 85.0, 89.0, 61.0, 60.0, 55.0, 40.0, 29.0, 17.0, 16.0, 15.0, 6.0, 11.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5560685396194458, -0.5400553345680237, -0.5240421295166016, -0.5080288648605347, -0.49201565980911255, -0.47600245475769043, -0.4599892199039459, -0.4439759850502014, -0.4279627799987793, -0.4119495749473572, -0.39593634009361267, -0.37992310523986816, -0.36390990018844604, -0.3478966951370239, -0.3318834602832794, -0.3158702254295349, -0.2998570203781128, -0.2838438153266907, -0.26783058047294617, -0.25181734561920166, -0.23580414056777954, -0.21979092061519623, -0.20377770066261292, -0.1877644807100296, -0.1717512607574463, -0.15573804080486298, -0.13972482085227966, -0.12371160089969635, -0.10769838094711304, -0.09168516099452972, -0.07567194104194641, -0.0596587210893631, -0.04364544153213501, -0.027632221579551697, -0.011619001626968384, 0.004394218325614929, 0.020407438278198242, 0.036420658230781555, 0.05243387818336487, 0.06844709813594818, 0.0844603180885315, 0.10047353804111481, 0.11648675799369812, 0.13249997794628143, 0.14851319789886475, 0.16452641785144806, 0.18053963780403137, 0.19655285775661469, 0.212566077709198, 0.2285792976617813, 0.24459251761436462, 0.26060575246810913, 0.27661895751953125, 0.29263216257095337, 0.3086453974246979, 0.3246586322784424, 0.3406718373298645, 0.3566850423812866, 0.37269827723503113, 0.38871151208877563, 0.40472471714019775, 0.4207379221916199, 0.4367511570453644, 0.4527643918991089, 0.468777596950531]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 14.0, 7.0, 11.0, 16.0, 22.0, 18.0, 23.0, 29.0, 32.0, 36.0, 28.0, 43.0, 34.0, 45.0, 46.0, 39.0, 62.0, 30.0, 32.0, 39.0, 50.0, 30.0, 43.0, 30.0, 26.0, 23.0, 28.0, 27.0, 17.0, 18.0, 17.0, 16.0, 12.0, 12.0, 6.0, 5.0, 5.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41391491889953613, -0.40031224489212036, -0.3867095410823822, -0.37310683727264404, -0.35950416326522827, -0.3459014892578125, -0.33229878544807434, -0.3186960816383362, -0.3050934076309204, -0.29149073362350464, -0.2778880298137665, -0.2642853260040283, -0.25068265199661255, -0.23707996308803558, -0.22347727417945862, -0.20987458527088165, -0.1962718963623047, -0.18266920745372772, -0.16906651854515076, -0.1554638296365738, -0.14186114072799683, -0.12825845181941986, -0.1146557629108429, -0.10105307400226593, -0.08745038509368896, -0.073847696185112, -0.060245007276535034, -0.04664231836795807, -0.033039629459381104, -0.019436940550804138, -0.005834251642227173, 0.0077684372663497925, 0.021371126174926758, 0.03497381508350372, 0.04857650399208069, 0.062179192900657654, 0.07578188180923462, 0.08938457071781158, 0.10298725962638855, 0.11658994853496552, 0.13019263744354248, 0.14379532635211945, 0.1573980152606964, 0.17100070416927338, 0.18460339307785034, 0.1982060819864273, 0.21180877089500427, 0.22541145980358124, 0.2390141487121582, 0.252616822719574, 0.26621952652931213, 0.2798222303390503, 0.29342490434646606, 0.30702757835388184, 0.32063028216362, 0.33423298597335815, 0.3478356599807739, 0.3614383339881897, 0.37504103779792786, 0.388643741607666, 0.4022464156150818, 0.41584908962249756, 0.4294517934322357, 0.4430544972419739, 0.45665717124938965]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 4.0, 8.0, 12.0, 12.0, 16.0, 25.0, 38.0, 33.0, 55.0, 71.0, 79.0, 110.0, 175.0, 262.0, 352.0, 541.0, 838.0, 1274.0, 2099.0, 3681.0, 6607.0, 12781.0, 26041.0, 61320.0, 171813.0, 697792.0, 2072446.0, 806684.0, 200459.0, 68663.0, 29188.0, 14110.0, 7033.0, 3845.0, 2143.0, 1272.0, 742.0, 497.0, 342.0, 222.0, 164.0, 107.0, 96.0, 59.0, 46.0, 36.0, 18.0, 15.0, 12.0, 11.0, 13.0, 6.0, 2.0, 4.0, 3.0], "bins": [-0.0931396484375, -0.09051990509033203, -0.08790016174316406, -0.0852804183959961, -0.08266067504882812, -0.08004093170166016, -0.07742118835449219, -0.07480144500732422, -0.07218170166015625, -0.06956195831298828, -0.06694221496582031, -0.06432247161865234, -0.061702728271484375, -0.059082984924316406, -0.05646324157714844, -0.05384349822998047, -0.0512237548828125, -0.04860401153564453, -0.04598426818847656, -0.043364524841308594, -0.040744781494140625, -0.038125038146972656, -0.03550529479980469, -0.03288555145263672, -0.03026580810546875, -0.02764606475830078, -0.025026321411132812, -0.022406578063964844, -0.019786834716796875, -0.017167091369628906, -0.014547348022460938, -0.011927604675292969, -0.009307861328125, -0.006688117980957031, -0.0040683746337890625, -0.0014486312866210938, 0.001171112060546875, 0.0037908554077148438, 0.0064105987548828125, 0.009030342102050781, 0.01165008544921875, 0.014269828796386719, 0.016889572143554688, 0.019509315490722656, 0.022129058837890625, 0.024748802185058594, 0.027368545532226562, 0.02998828887939453, 0.0326080322265625, 0.03522777557373047, 0.03784751892089844, 0.040467262268066406, 0.043087005615234375, 0.045706748962402344, 0.04832649230957031, 0.05094623565673828, 0.05356597900390625, 0.05618572235107422, 0.05880546569824219, 0.061425209045410156, 0.06404495239257812, 0.0666646957397461, 0.06928443908691406, 0.07190418243408203, 0.07452392578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 4.0, 6.0, 9.0, 17.0, 25.0, 15.0, 22.0, 26.0, 43.0, 30.0, 33.0, 32.0, 41.0, 41.0, 44.0, 41.0, 51.0, 28.0, 46.0, 41.0, 38.0, 41.0, 40.0, 47.0, 31.0, 32.0, 26.0, 18.0, 23.0, 21.0, 14.0, 12.0, 13.0, 3.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06591796875, -0.06402730941772461, -0.06213665008544922, -0.06024599075317383, -0.05835533142089844, -0.05646467208862305, -0.054574012756347656, -0.052683353424072266, -0.050792694091796875, -0.048902034759521484, -0.047011375427246094, -0.0451207160949707, -0.04323005676269531, -0.04133939743041992, -0.03944873809814453, -0.03755807876586914, -0.03566741943359375, -0.03377676010131836, -0.03188610076904297, -0.029995441436767578, -0.028104782104492188, -0.026214122772216797, -0.024323463439941406, -0.022432804107666016, -0.020542144775390625, -0.018651485443115234, -0.016760826110839844, -0.014870166778564453, -0.012979507446289062, -0.011088848114013672, -0.009198188781738281, -0.007307529449462891, -0.0054168701171875, -0.0035262107849121094, -0.0016355514526367188, 0.0002551078796386719, 0.0021457672119140625, 0.004036426544189453, 0.005927085876464844, 0.007817745208740234, 0.009708404541015625, 0.011599063873291016, 0.013489723205566406, 0.015380382537841797, 0.017271041870117188, 0.019161701202392578, 0.02105236053466797, 0.02294301986694336, 0.02483367919921875, 0.02672433853149414, 0.02861499786376953, 0.030505657196044922, 0.03239631652832031, 0.0342869758605957, 0.036177635192871094, 0.038068294525146484, 0.039958953857421875, 0.041849613189697266, 0.043740272521972656, 0.04563093185424805, 0.04752159118652344, 0.04941225051879883, 0.05130290985107422, 0.05319356918334961, 0.055084228515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 10.0, 4.0, 6.0, 14.0, 16.0, 34.0, 34.0, 33.0, 90.0, 99.0, 142.0, 265.0, 445.0, 925.0, 2184.0, 5884.0, 18933.0, 78702.0, 477668.0, 2763906.0, 704184.0, 104468.0, 24026.0, 7158.0, 2560.0, 1112.0, 531.0, 270.0, 168.0, 112.0, 70.0, 40.0, 39.0, 35.0, 25.0, 21.0, 13.0, 9.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1746826171875, -0.16897201538085938, -0.16326141357421875, -0.15755081176757812, -0.1518402099609375, -0.14612960815429688, -0.14041900634765625, -0.13470840454101562, -0.128997802734375, -0.12328720092773438, -0.11757659912109375, -0.11186599731445312, -0.1061553955078125, -0.10044479370117188, -0.09473419189453125, -0.08902359008789062, -0.08331298828125, -0.07760238647460938, -0.07189178466796875, -0.06618118286132812, -0.0604705810546875, -0.054759979248046875, -0.04904937744140625, -0.043338775634765625, -0.037628173828125, -0.031917572021484375, -0.02620697021484375, -0.020496368408203125, -0.0147857666015625, -0.009075164794921875, -0.00336456298828125, 0.002346038818359375, 0.008056640625, 0.013767242431640625, 0.01947784423828125, 0.025188446044921875, 0.0308990478515625, 0.036609649658203125, 0.04232025146484375, 0.048030853271484375, 0.053741455078125, 0.059452056884765625, 0.06516265869140625, 0.07087326049804688, 0.0765838623046875, 0.08229446411132812, 0.08800506591796875, 0.09371566772460938, 0.09942626953125, 0.10513687133789062, 0.11084747314453125, 0.11655807495117188, 0.1222686767578125, 0.12797927856445312, 0.13368988037109375, 0.13940048217773438, 0.145111083984375, 0.15082168579101562, 0.15653228759765625, 0.16224288940429688, 0.1679534912109375, 0.17366409301757812, 0.17937469482421875, 0.18508529663085938, 0.1907958984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 11.0, 13.0, 23.0, 45.0, 37.0, 56.0, 90.0, 137.0, 202.0, 379.0, 636.0, 908.0, 619.0, 339.0, 217.0, 136.0, 69.0, 46.0, 31.0, 25.0, 18.0, 13.0, 9.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.161865234375, -0.157012939453125, -0.15216064453125, -0.147308349609375, -0.1424560546875, -0.137603759765625, -0.13275146484375, -0.127899169921875, -0.123046875, -0.118194580078125, -0.11334228515625, -0.108489990234375, -0.1036376953125, -0.098785400390625, -0.09393310546875, -0.089080810546875, -0.084228515625, -0.079376220703125, -0.07452392578125, -0.069671630859375, -0.0648193359375, -0.059967041015625, -0.05511474609375, -0.050262451171875, -0.04541015625, -0.040557861328125, -0.03570556640625, -0.030853271484375, -0.0260009765625, -0.021148681640625, -0.01629638671875, -0.011444091796875, -0.006591796875, -0.001739501953125, 0.00311279296875, 0.007965087890625, 0.0128173828125, 0.017669677734375, 0.02252197265625, 0.027374267578125, 0.0322265625, 0.037078857421875, 0.04193115234375, 0.046783447265625, 0.0516357421875, 0.056488037109375, 0.06134033203125, 0.066192626953125, 0.071044921875, 0.075897216796875, 0.08074951171875, 0.085601806640625, 0.0904541015625, 0.095306396484375, 0.10015869140625, 0.105010986328125, 0.10986328125, 0.114715576171875, 0.11956787109375, 0.124420166015625, 0.1292724609375, 0.134124755859375, 0.13897705078125, 0.143829345703125, 0.148681640625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 12.0, 16.0, 14.0, 25.0, 40.0, 58.0, 75.0, 85.0, 92.0, 95.0, 114.0, 86.0, 92.0, 57.0, 56.0, 27.0, 21.0, 14.0, 11.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8929711580276489, -0.8741648197174072, -0.8553584814071655, -0.8365521430969238, -0.8177458047866821, -0.7989394664764404, -0.7801331281661987, -0.761326789855957, -0.7425204515457153, -0.7237141132354736, -0.7049077749252319, -0.6861014366149902, -0.6672950983047485, -0.6484887599945068, -0.6296824216842651, -0.6108760833740234, -0.5920697450637817, -0.57326340675354, -0.5544570684432983, -0.5356507301330566, -0.5168443918228149, -0.49803805351257324, -0.47923171520233154, -0.46042537689208984, -0.44161903858184814, -0.42281270027160645, -0.40400636196136475, -0.38520002365112305, -0.36639368534088135, -0.34758734703063965, -0.32878100872039795, -0.30997467041015625, -0.2911683917045593, -0.2723620533943176, -0.2535557150840759, -0.23474937677383423, -0.21594303846359253, -0.19713670015335083, -0.17833036184310913, -0.15952402353286743, -0.14071768522262573, -0.12191134691238403, -0.10310500860214233, -0.08429867029190063, -0.06549233198165894, -0.046685993671417236, -0.027879655361175537, -0.009073317050933838, 0.009733021259307861, 0.02853935956954956, 0.04734569787979126, 0.06615203619003296, 0.08495837450027466, 0.10376471281051636, 0.12257105112075806, 0.14137738943099976, 0.16018372774124146, 0.17899006605148315, 0.19779640436172485, 0.21660274267196655, 0.23540908098220825, 0.25421541929244995, 0.27302175760269165, 0.29182809591293335, 0.31063443422317505]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 11.0, 6.0, 13.0, 16.0, 9.0, 10.0, 14.0, 15.0, 23.0, 18.0, 25.0, 29.0, 33.0, 35.0, 35.0, 33.0, 47.0, 42.0, 34.0, 45.0, 49.0, 40.0, 41.0, 37.0, 33.0, 27.0, 35.0, 39.0, 33.0, 17.0, 23.0, 20.0, 19.0, 16.0, 10.0, 7.0, 9.0, 9.0, 13.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3246570825576782, -0.3147295117378235, -0.30480194091796875, -0.294874370098114, -0.2849467694759369, -0.27501919865608215, -0.2650916278362274, -0.2551640570163727, -0.24523648619651794, -0.2353089153766632, -0.22538132965564728, -0.21545375883579254, -0.2055261880159378, -0.19559860229492188, -0.18567103147506714, -0.1757434606552124, -0.16581587493419647, -0.15588830411434174, -0.1459607183933258, -0.13603314757347107, -0.12610557675361633, -0.116177998483181, -0.10625042021274567, -0.09632284939289093, -0.0863952711224556, -0.07646769285202026, -0.06654012203216553, -0.056612543761730194, -0.04668496921658516, -0.036757394671440125, -0.02682981640100479, -0.016902245581150055, -0.006974667310714722, 0.0029529081657528877, 0.012880483642220497, 0.02280806005001068, 0.032735634595155716, 0.04266320914030075, 0.052590787410736084, 0.06251835823059082, 0.07244593650102615, 0.08237351477146149, 0.09230108559131622, 0.10222866386175156, 0.11215624213218689, 0.12208381295204163, 0.13201138377189636, 0.1419389545917511, 0.15186654031276703, 0.16179411113262177, 0.1717216968536377, 0.18164926767349243, 0.19157683849334717, 0.2015044093132019, 0.21143199503421783, 0.22135956585407257, 0.2312871515750885, 0.24121472239494324, 0.251142293214798, 0.2610698938369751, 0.27099746465682983, 0.28092503547668457, 0.2908526062965393, 0.30078017711639404, 0.3107077479362488]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 11.0, 7.0, 18.0, 24.0, 27.0, 49.0, 81.0, 118.0, 191.0, 326.0, 538.0, 874.0, 1389.0, 2467.0, 4100.0, 7127.0, 12563.0, 22489.0, 41937.0, 78968.0, 145346.0, 225934.0, 215381.0, 132120.0, 70866.0, 37471.0, 20828.0, 11375.0, 6624.0, 3775.0, 2138.0, 1341.0, 781.0, 479.0, 316.0, 167.0, 122.0, 63.0, 44.0, 22.0, 19.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10843276977539062, -0.10468292236328125, -0.10093307495117188, -0.0971832275390625, -0.09343338012695312, -0.08968353271484375, -0.08593368530273438, -0.082183837890625, -0.07843399047851562, -0.07468414306640625, -0.07093429565429688, -0.0671844482421875, -0.06343460083007812, -0.05968475341796875, -0.055934906005859375, -0.05218505859375, -0.048435211181640625, -0.04468536376953125, -0.040935516357421875, -0.0371856689453125, -0.033435821533203125, -0.02968597412109375, -0.025936126708984375, -0.022186279296875, -0.018436431884765625, -0.01468658447265625, -0.010936737060546875, -0.0071868896484375, -0.003437042236328125, 0.00031280517578125, 0.004062652587890625, 0.0078125, 0.011562347412109375, 0.01531219482421875, 0.019062042236328125, 0.0228118896484375, 0.026561737060546875, 0.03031158447265625, 0.034061431884765625, 0.037811279296875, 0.041561126708984375, 0.04531097412109375, 0.049060821533203125, 0.0528106689453125, 0.056560516357421875, 0.06031036376953125, 0.06406021118164062, 0.06781005859375, 0.07155990600585938, 0.07530975341796875, 0.07905960083007812, 0.0828094482421875, 0.08655929565429688, 0.09030914306640625, 0.09405899047851562, 0.097808837890625, 0.10155868530273438, 0.10530853271484375, 0.10905838012695312, 0.1128082275390625, 0.11655807495117188, 0.12030792236328125, 0.12405776977539062, 0.1278076171875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 10.0, 13.0, 11.0, 15.0, 15.0, 27.0, 32.0, 26.0, 29.0, 34.0, 41.0, 42.0, 46.0, 40.0, 47.0, 38.0, 47.0, 47.0, 61.0, 40.0, 41.0, 25.0, 33.0, 28.0, 29.0, 32.0, 21.0, 25.0, 13.0, 17.0, 9.0, 10.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0675048828125, -0.06557130813598633, -0.06363773345947266, -0.061704158782958984, -0.05977058410644531, -0.05783700942993164, -0.05590343475341797, -0.0539698600769043, -0.052036285400390625, -0.05010271072387695, -0.04816913604736328, -0.04623556137084961, -0.04430198669433594, -0.042368412017822266, -0.040434837341308594, -0.03850126266479492, -0.03656768798828125, -0.03463411331176758, -0.032700538635253906, -0.030766963958740234, -0.028833389282226562, -0.02689981460571289, -0.02496623992919922, -0.023032665252685547, -0.021099090576171875, -0.019165515899658203, -0.01723194122314453, -0.01529836654663086, -0.013364791870117188, -0.011431217193603516, -0.009497642517089844, -0.007564067840576172, -0.0056304931640625, -0.003696918487548828, -0.0017633438110351562, 0.00017023086547851562, 0.0021038055419921875, 0.004037380218505859, 0.005970954895019531, 0.007904529571533203, 0.009838104248046875, 0.011771678924560547, 0.013705253601074219, 0.01563882827758789, 0.017572402954101562, 0.019505977630615234, 0.021439552307128906, 0.023373126983642578, 0.02530670166015625, 0.027240276336669922, 0.029173851013183594, 0.031107425689697266, 0.03304100036621094, 0.03497457504272461, 0.03690814971923828, 0.03884172439575195, 0.040775299072265625, 0.0427088737487793, 0.04464244842529297, 0.04657602310180664, 0.04850959777832031, 0.050443172454833984, 0.052376747131347656, 0.05431032180786133, 0.056243896484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 3.0, 8.0, 14.0, 17.0, 33.0, 41.0, 60.0, 144.0, 265.0, 479.0, 1040.0, 2422.0, 5584.0, 14456.0, 43243.0, 144135.0, 405109.0, 297402.0, 89295.0, 27810.0, 9793.0, 3971.0, 1676.0, 707.0, 360.0, 200.0, 102.0, 54.0, 43.0, 23.0, 15.0, 12.0, 8.0, 8.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2088623046875, -0.20229530334472656, -0.19572830200195312, -0.1891613006591797, -0.18259429931640625, -0.1760272979736328, -0.16946029663085938, -0.16289329528808594, -0.1563262939453125, -0.14975929260253906, -0.14319229125976562, -0.1366252899169922, -0.13005828857421875, -0.12349128723144531, -0.11692428588867188, -0.11035728454589844, -0.103790283203125, -0.09722328186035156, -0.09065628051757812, -0.08408927917480469, -0.07752227783203125, -0.07095527648925781, -0.06438827514648438, -0.05782127380371094, -0.0512542724609375, -0.04468727111816406, -0.038120269775390625, -0.03155326843261719, -0.02498626708984375, -0.018419265747070312, -0.011852264404296875, -0.0052852630615234375, 0.00128173828125, 0.007848739624023438, 0.014415740966796875, 0.020982742309570312, 0.02754974365234375, 0.03411674499511719, 0.040683746337890625, 0.04725074768066406, 0.0538177490234375, 0.06038475036621094, 0.06695175170898438, 0.07351875305175781, 0.08008575439453125, 0.08665275573730469, 0.09321975708007812, 0.09978675842285156, 0.106353759765625, 0.11292076110839844, 0.11948776245117188, 0.1260547637939453, 0.13262176513671875, 0.1391887664794922, 0.14575576782226562, 0.15232276916503906, 0.1588897705078125, 0.16545677185058594, 0.17202377319335938, 0.1785907745361328, 0.18515777587890625, 0.1917247772216797, 0.19829177856445312, 0.20485877990722656, 0.21142578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 8.0, 16.0, 10.0, 21.0, 19.0, 28.0, 28.0, 36.0, 36.0, 40.0, 56.0, 47.0, 41.0, 54.0, 68.0, 55.0, 51.0, 39.0, 43.0, 39.0, 38.0, 34.0, 27.0, 28.0, 20.0, 19.0, 17.0, 17.0, 10.0, 7.0, 12.0, 4.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1585693359375, -0.15215492248535156, -0.14574050903320312, -0.1393260955810547, -0.13291168212890625, -0.1264972686767578, -0.12008285522460938, -0.11366844177246094, -0.1072540283203125, -0.10083961486816406, -0.09442520141601562, -0.08801078796386719, -0.08159637451171875, -0.07518196105957031, -0.06876754760742188, -0.06235313415527344, -0.055938720703125, -0.04952430725097656, -0.043109893798828125, -0.03669548034667969, -0.03028106689453125, -0.023866653442382812, -0.017452239990234375, -0.011037826538085938, -0.0046234130859375, 0.0017910003662109375, 0.008205413818359375, 0.014619827270507812, 0.02103424072265625, 0.027448654174804688, 0.033863067626953125, 0.04027748107910156, 0.04669189453125, 0.05310630798339844, 0.059520721435546875, 0.06593513488769531, 0.07234954833984375, 0.07876396179199219, 0.08517837524414062, 0.09159278869628906, 0.0980072021484375, 0.10442161560058594, 0.11083602905273438, 0.11725044250488281, 0.12366485595703125, 0.1300792694091797, 0.13649368286132812, 0.14290809631347656, 0.149322509765625, 0.15573692321777344, 0.16215133666992188, 0.1685657501220703, 0.17498016357421875, 0.1813945770263672, 0.18780899047851562, 0.19422340393066406, 0.2006378173828125, 0.20705223083496094, 0.21346664428710938, 0.2198810577392578, 0.22629547119140625, 0.2327098846435547, 0.23912429809570312, 0.24553871154785156, 0.251953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 15.0, 6.0, 19.0, 17.0, 32.0, 50.0, 90.0, 108.0, 171.0, 267.0, 445.0, 735.0, 1293.0, 2287.0, 4278.0, 8039.0, 15662.0, 31686.0, 71757.0, 186721.0, 354171.0, 215728.0, 82216.0, 35638.0, 17307.0, 9014.0, 4726.0, 2525.0, 1417.0, 823.0, 501.0, 286.0, 183.0, 108.0, 80.0, 61.0, 32.0, 15.0, 16.0, 12.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0], "bins": [-0.073486328125, -0.07158136367797852, -0.06967639923095703, -0.06777143478393555, -0.06586647033691406, -0.06396150588989258, -0.062056541442871094, -0.06015157699584961, -0.058246612548828125, -0.05634164810180664, -0.054436683654785156, -0.05253171920776367, -0.05062675476074219, -0.0487217903137207, -0.04681682586669922, -0.044911861419677734, -0.04300689697265625, -0.041101932525634766, -0.03919696807861328, -0.0372920036315918, -0.03538703918457031, -0.03348207473754883, -0.031577110290527344, -0.02967214584350586, -0.027767181396484375, -0.02586221694946289, -0.023957252502441406, -0.022052288055419922, -0.020147323608398438, -0.018242359161376953, -0.01633739471435547, -0.014432430267333984, -0.0125274658203125, -0.010622501373291016, -0.008717536926269531, -0.006812572479248047, -0.0049076080322265625, -0.003002643585205078, -0.0010976791381835938, 0.0008072853088378906, 0.002712249755859375, 0.004617214202880859, 0.006522178649902344, 0.008427143096923828, 0.010332107543945312, 0.012237071990966797, 0.014142036437988281, 0.016047000885009766, 0.01795196533203125, 0.019856929779052734, 0.02176189422607422, 0.023666858673095703, 0.025571823120117188, 0.027476787567138672, 0.029381752014160156, 0.03128671646118164, 0.033191680908203125, 0.03509664535522461, 0.037001609802246094, 0.03890657424926758, 0.04081153869628906, 0.04271650314331055, 0.04462146759033203, 0.046526432037353516, 0.048431396484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 1.0, 6.0, 5.0, 2.0, 5.0, 10.0, 14.0, 14.0, 23.0, 33.0, 33.0, 50.0, 59.0, 82.0, 90.0, 95.0, 109.0, 92.0, 55.0, 50.0, 30.0, 32.0, 28.0, 15.0, 15.0, 13.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.4616718292236328e-05, -2.3908913135528564e-05, -2.32011079788208e-05, -2.2493302822113037e-05, -2.1785497665405273e-05, -2.107769250869751e-05, -2.0369887351989746e-05, -1.9662082195281982e-05, -1.895427703857422e-05, -1.8246471881866455e-05, -1.753866672515869e-05, -1.6830861568450928e-05, -1.6123056411743164e-05, -1.54152512550354e-05, -1.4707446098327637e-05, -1.3999640941619873e-05, -1.329183578491211e-05, -1.2584030628204346e-05, -1.1876225471496582e-05, -1.1168420314788818e-05, -1.0460615158081055e-05, -9.752810001373291e-06, -9.045004844665527e-06, -8.337199687957764e-06, -7.62939453125e-06, -6.921589374542236e-06, -6.213784217834473e-06, -5.505979061126709e-06, -4.798173904418945e-06, -4.090368747711182e-06, -3.382563591003418e-06, -2.6747584342956543e-06, -1.9669532775878906e-06, -1.259148120880127e-06, -5.513429641723633e-07, 1.564621925354004e-07, 8.642673492431641e-07, 1.5720725059509277e-06, 2.2798776626586914e-06, 2.987682819366455e-06, 3.6954879760742188e-06, 4.403293132781982e-06, 5.111098289489746e-06, 5.81890344619751e-06, 6.5267086029052734e-06, 7.234513759613037e-06, 7.9423189163208e-06, 8.650124073028564e-06, 9.357929229736328e-06, 1.0065734386444092e-05, 1.0773539543151855e-05, 1.1481344699859619e-05, 1.2189149856567383e-05, 1.2896955013275146e-05, 1.360476016998291e-05, 1.4312565326690674e-05, 1.5020370483398438e-05, 1.57281756401062e-05, 1.6435980796813965e-05, 1.714378595352173e-05, 1.7851591110229492e-05, 1.8559396266937256e-05, 1.926720142364502e-05, 1.9975006580352783e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 12.0, 4.0, 15.0, 15.0, 19.0, 32.0, 44.0, 79.0, 77.0, 125.0, 156.0, 216.0, 286.0, 426.0, 636.0, 1063.0, 1774.0, 3533.0, 7282.0, 17326.0, 45969.0, 147916.0, 424563.0, 269374.0, 78121.0, 26938.0, 11220.0, 4988.0, 2387.0, 1312.0, 845.0, 541.0, 331.0, 244.0, 170.0, 143.0, 68.0, 83.0, 52.0, 41.0, 27.0, 25.0, 19.0, 7.0, 8.0, 16.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.07427978515625, -0.07186317443847656, -0.06944656372070312, -0.06702995300292969, -0.06461334228515625, -0.06219673156738281, -0.059780120849609375, -0.05736351013183594, -0.0549468994140625, -0.05253028869628906, -0.050113677978515625, -0.04769706726074219, -0.04528045654296875, -0.04286384582519531, -0.040447235107421875, -0.03803062438964844, -0.035614013671875, -0.03319740295410156, -0.030780792236328125, -0.028364181518554688, -0.02594757080078125, -0.023530960083007812, -0.021114349365234375, -0.018697738647460938, -0.0162811279296875, -0.013864517211914062, -0.011447906494140625, -0.009031295776367188, -0.00661468505859375, -0.0041980743408203125, -0.001781463623046875, 0.0006351470947265625, 0.0030517578125, 0.0054683685302734375, 0.007884979248046875, 0.010301589965820312, 0.01271820068359375, 0.015134811401367188, 0.017551422119140625, 0.019968032836914062, 0.0223846435546875, 0.024801254272460938, 0.027217864990234375, 0.029634475708007812, 0.03205108642578125, 0.03446769714355469, 0.036884307861328125, 0.03930091857910156, 0.041717529296875, 0.04413414001464844, 0.046550750732421875, 0.04896736145019531, 0.05138397216796875, 0.05380058288574219, 0.056217193603515625, 0.05863380432128906, 0.0610504150390625, 0.06346702575683594, 0.06588363647460938, 0.06830024719238281, 0.07071685791015625, 0.07313346862792969, 0.07555007934570312, 0.07796669006347656, 0.08038330078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 4.0, 5.0, 7.0, 7.0, 8.0, 17.0, 21.0, 18.0, 31.0, 39.0, 59.0, 87.0, 95.0, 115.0, 107.0, 85.0, 67.0, 58.0, 47.0, 23.0, 18.0, 18.0, 19.0, 5.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08086967468261719, -0.07860946655273438, -0.07634925842285156, -0.07408905029296875, -0.07182884216308594, -0.06956863403320312, -0.06730842590332031, -0.0650482177734375, -0.06278800964355469, -0.060527801513671875, -0.05826759338378906, -0.05600738525390625, -0.05374717712402344, -0.051486968994140625, -0.04922676086425781, -0.046966552734375, -0.04470634460449219, -0.042446136474609375, -0.04018592834472656, -0.03792572021484375, -0.03566551208496094, -0.033405303955078125, -0.031145095825195312, -0.0288848876953125, -0.026624679565429688, -0.024364471435546875, -0.022104263305664062, -0.01984405517578125, -0.017583847045898438, -0.015323638916015625, -0.013063430786132812, -0.01080322265625, -0.008543014526367188, -0.006282806396484375, -0.0040225982666015625, -0.00176239013671875, 0.0004978179931640625, 0.002758026123046875, 0.0050182342529296875, 0.0072784423828125, 0.009538650512695312, 0.011798858642578125, 0.014059066772460938, 0.01631927490234375, 0.018579483032226562, 0.020839691162109375, 0.023099899291992188, 0.025360107421875, 0.027620315551757812, 0.029880523681640625, 0.03214073181152344, 0.03440093994140625, 0.03666114807128906, 0.038921356201171875, 0.04118156433105469, 0.0434417724609375, 0.04570198059082031, 0.047962188720703125, 0.05022239685058594, 0.05248260498046875, 0.05474281311035156, 0.057003021240234375, 0.05926322937011719, 0.0615234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 28.0, 67.0, 119.0, 191.0, 230.0, 168.0, 100.0, 58.0, 26.0, 8.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9436389207839966, -0.8993273973464966, -0.8550158143043518, -0.8107042908668518, -0.766392707824707, -0.722081184387207, -0.677769660949707, -0.633458137512207, -0.5891465544700623, -0.5448350310325623, -0.5005234479904175, -0.4562119245529175, -0.4119003713130951, -0.3675888180732727, -0.3232772946357727, -0.2789657413959503, -0.23465418815612793, -0.19034263491630554, -0.14603109657764435, -0.10171955823898315, -0.05740800499916077, -0.013096451759338379, 0.03121507167816162, 0.07552662491798401, 0.1198381781578064, 0.16414973139762878, 0.20846126973628998, 0.25277280807495117, 0.29708436131477356, 0.34139591455459595, 0.38570743799209595, 0.43001899123191833, 0.4743306636810303, 0.5186421871185303, 0.562953770160675, 0.607265293598175, 0.6515768766403198, 0.6958884000778198, 0.7401999235153198, 0.7845114469528198, 0.8288230299949646, 0.8731345534324646, 0.9174461364746094, 0.9617576599121094, 1.0060691833496094, 1.0503807067871094, 1.0946922302246094, 1.139003872871399, 1.183315396308899, 1.227626919746399, 1.271938443183899, 1.3162500858306885, 1.3605616092681885, 1.4048731327056885, 1.4491846561431885, 1.4934961795806885, 1.5378077030181885, 1.5821192264556885, 1.6264307498931885, 1.6707422733306885, 1.715053915977478, 1.759365439414978, 1.803676962852478, 1.847988486289978, 1.8923001289367676]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 7.0, 5.0, 4.0, 10.0, 11.0, 11.0, 11.0, 19.0, 23.0, 15.0, 29.0, 30.0, 35.0, 34.0, 47.0, 47.0, 48.0, 44.0, 41.0, 43.0, 58.0, 47.0, 39.0, 40.0, 29.0, 31.0, 35.0, 23.0, 27.0, 29.0, 28.0, 16.0, 19.0, 18.0, 9.0, 8.0, 9.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.4846387505531311, -0.46975982189178467, -0.4548809230327606, -0.4400019943714142, -0.42512306571006775, -0.4102441668510437, -0.39536523818969727, -0.38048630952835083, -0.3656074106693268, -0.35072848200798035, -0.3358495831489563, -0.32097065448760986, -0.3060917258262634, -0.2912128269672394, -0.27633389830589294, -0.2614549994468689, -0.24657605588436127, -0.23169714212417603, -0.2168182134628296, -0.20193929970264435, -0.1870603859424591, -0.17218145728111267, -0.15730254352092743, -0.1424236297607422, -0.12754470109939575, -0.11266577988862991, -0.09778686612844467, -0.08290794491767883, -0.06802903115749359, -0.05315010994672775, -0.038271188735961914, -0.023392274975776672, -0.00851336121559143, 0.006365557201206684, 0.0212444756180048, 0.03612339496612549, 0.05100231245160103, 0.06588122993707657, 0.08076015114784241, 0.09563906490802765, 0.11051798611879349, 0.12539690732955933, 0.14027582108974457, 0.1551547348499298, 0.17003366351127625, 0.1849125772714615, 0.19979149103164673, 0.21467041969299316, 0.2295493334531784, 0.24442824721336365, 0.2593071758747101, 0.27418607473373413, 0.28906500339508057, 0.303943932056427, 0.31882286071777344, 0.3337017595767975, 0.3485806882381439, 0.36345961689949036, 0.3783385157585144, 0.39321744441986084, 0.4080963730812073, 0.4229752719402313, 0.43785420060157776, 0.4527330994606018, 0.46761202812194824]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 12.0, 13.0, 23.0, 16.0, 32.0, 43.0, 45.0, 81.0, 109.0, 182.0, 345.0, 619.0, 1237.0, 2571.0, 5886.0, 15417.0, 49781.0, 240321.0, 2509210.0, 1179450.0, 136501.0, 32971.0, 10865.0, 4427.0, 1926.0, 916.0, 505.0, 247.0, 163.0, 102.0, 65.0, 49.0, 29.0, 23.0, 19.0, 17.0, 12.0, 7.0, 7.0, 5.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.1591796875, -0.15418052673339844, -0.14918136596679688, -0.1441822052001953, -0.13918304443359375, -0.1341838836669922, -0.12918472290039062, -0.12418556213378906, -0.1191864013671875, -0.11418724060058594, -0.10918807983398438, -0.10418891906738281, -0.09918975830078125, -0.09419059753417969, -0.08919143676757812, -0.08419227600097656, -0.079193115234375, -0.07419395446777344, -0.06919479370117188, -0.06419563293457031, -0.05919647216796875, -0.05419731140136719, -0.049198150634765625, -0.04419898986816406, -0.0391998291015625, -0.03420066833496094, -0.029201507568359375, -0.024202346801757812, -0.01920318603515625, -0.014204025268554688, -0.009204864501953125, -0.0042057037353515625, 0.00079345703125, 0.0057926177978515625, 0.010791778564453125, 0.015790939331054688, 0.02079010009765625, 0.025789260864257812, 0.030788421630859375, 0.03578758239746094, 0.0407867431640625, 0.04578590393066406, 0.050785064697265625, 0.05578422546386719, 0.06078338623046875, 0.06578254699707031, 0.07078170776367188, 0.07578086853027344, 0.080780029296875, 0.08577919006347656, 0.09077835083007812, 0.09577751159667969, 0.10077667236328125, 0.10577583312988281, 0.11077499389648438, 0.11577415466308594, 0.1207733154296875, 0.12577247619628906, 0.13077163696289062, 0.1357707977294922, 0.14076995849609375, 0.1457691192626953, 0.15076828002929688, 0.15576744079589844, 0.1607666015625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 1.0, 2.0, 11.0, 5.0, 10.0, 11.0, 17.0, 18.0, 13.0, 15.0, 21.0, 25.0, 33.0, 29.0, 32.0, 22.0, 38.0, 30.0, 51.0, 43.0, 43.0, 40.0, 44.0, 41.0, 40.0, 33.0, 32.0, 36.0, 38.0, 27.0, 16.0, 24.0, 15.0, 25.0, 17.0, 13.0, 21.0, 12.0, 9.0, 8.0, 8.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.06927490234375, -0.06733226776123047, -0.06538963317871094, -0.0634469985961914, -0.061504364013671875, -0.059561729431152344, -0.05761909484863281, -0.05567646026611328, -0.05373382568359375, -0.05179119110107422, -0.04984855651855469, -0.047905921936035156, -0.045963287353515625, -0.044020652770996094, -0.04207801818847656, -0.04013538360595703, -0.0381927490234375, -0.03625011444091797, -0.03430747985839844, -0.032364845275878906, -0.030422210693359375, -0.028479576110839844, -0.026536941528320312, -0.02459430694580078, -0.02265167236328125, -0.02070903778076172, -0.018766403198242188, -0.016823768615722656, -0.014881134033203125, -0.012938499450683594, -0.010995864868164062, -0.009053230285644531, -0.007110595703125, -0.005167961120605469, -0.0032253265380859375, -0.0012826919555664062, 0.000659942626953125, 0.0026025772094726562, 0.0045452117919921875, 0.006487846374511719, 0.00843048095703125, 0.010373115539550781, 0.012315750122070312, 0.014258384704589844, 0.016201019287109375, 0.018143653869628906, 0.020086288452148438, 0.02202892303466797, 0.0239715576171875, 0.02591419219970703, 0.027856826782226562, 0.029799461364746094, 0.031742095947265625, 0.033684730529785156, 0.03562736511230469, 0.03756999969482422, 0.03951263427734375, 0.04145526885986328, 0.04339790344238281, 0.045340538024902344, 0.047283172607421875, 0.049225807189941406, 0.05116844177246094, 0.05311107635498047, 0.0550537109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 7.0, 10.0, 11.0, 19.0, 21.0, 27.0, 34.0, 56.0, 56.0, 93.0, 133.0, 210.0, 366.0, 663.0, 1366.0, 3066.0, 7439.0, 21985.0, 85429.0, 505364.0, 2810624.0, 619521.0, 98672.0, 24391.0, 8074.0, 3321.0, 1435.0, 719.0, 395.0, 224.0, 158.0, 101.0, 84.0, 42.0, 40.0, 29.0, 24.0, 11.0, 13.0, 7.0, 14.0, 5.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22900390625, -0.2219676971435547, -0.21493148803710938, -0.20789527893066406, -0.20085906982421875, -0.19382286071777344, -0.18678665161132812, -0.1797504425048828, -0.1727142333984375, -0.1656780242919922, -0.15864181518554688, -0.15160560607910156, -0.14456939697265625, -0.13753318786621094, -0.13049697875976562, -0.12346076965332031, -0.116424560546875, -0.10938835144042969, -0.10235214233398438, -0.09531593322753906, -0.08827972412109375, -0.08124351501464844, -0.07420730590820312, -0.06717109680175781, -0.0601348876953125, -0.05309867858886719, -0.046062469482421875, -0.03902626037597656, -0.03199005126953125, -0.024953842163085938, -0.017917633056640625, -0.010881423950195312, -0.00384521484375, 0.0031909942626953125, 0.010227203369140625, 0.017263412475585938, 0.02429962158203125, 0.03133583068847656, 0.038372039794921875, 0.04540824890136719, 0.0524444580078125, 0.05948066711425781, 0.06651687622070312, 0.07355308532714844, 0.08058929443359375, 0.08762550354003906, 0.09466171264648438, 0.10169792175292969, 0.108734130859375, 0.11577033996582031, 0.12280654907226562, 0.12984275817871094, 0.13687896728515625, 0.14391517639160156, 0.15095138549804688, 0.1579875946044922, 0.1650238037109375, 0.1720600128173828, 0.17909622192382812, 0.18613243103027344, 0.19316864013671875, 0.20020484924316406, 0.20724105834960938, 0.2142772674560547, 0.2213134765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 16.0, 19.0, 22.0, 36.0, 98.0, 193.0, 343.0, 861.0, 1306.0, 633.0, 261.0, 128.0, 65.0, 44.0, 23.0, 3.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1888427734375, -0.1803302764892578, -0.17181777954101562, -0.16330528259277344, -0.15479278564453125, -0.14628028869628906, -0.13776779174804688, -0.1292552947998047, -0.1207427978515625, -0.11223030090332031, -0.10371780395507812, -0.09520530700683594, -0.08669281005859375, -0.07818031311035156, -0.06966781616210938, -0.06115531921386719, -0.052642822265625, -0.04413032531738281, -0.035617828369140625, -0.027105331420898438, -0.01859283447265625, -0.010080337524414062, -0.001567840576171875, 0.0069446563720703125, 0.0154571533203125, 0.023969650268554688, 0.032482147216796875, 0.04099464416503906, 0.04950714111328125, 0.05801963806152344, 0.06653213500976562, 0.07504463195800781, 0.08355712890625, 0.09206962585449219, 0.10058212280273438, 0.10909461975097656, 0.11760711669921875, 0.12611961364746094, 0.13463211059570312, 0.1431446075439453, 0.1516571044921875, 0.1601696014404297, 0.16868209838867188, 0.17719459533691406, 0.18570709228515625, 0.19421958923339844, 0.20273208618164062, 0.2112445831298828, 0.219757080078125, 0.2282695770263672, 0.23678207397460938, 0.24529457092285156, 0.25380706787109375, 0.26231956481933594, 0.2708320617675781, 0.2793445587158203, 0.2878570556640625, 0.2963695526123047, 0.3048820495605469, 0.31339454650878906, 0.32190704345703125, 0.33041954040527344, 0.3389320373535156, 0.3474445343017578, 0.35595703125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 9.0, 32.0, 78.0, 103.0, 180.0, 204.0, 167.0, 122.0, 54.0, 24.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.012836217880249, -1.9730336666107178, -1.9332311153411865, -1.8934285640716553, -1.853626012802124, -1.8138234615325928, -1.7740209102630615, -1.7342183589935303, -1.694415807723999, -1.6546132564544678, -1.6148107051849365, -1.5750081539154053, -1.535205602645874, -1.4954030513763428, -1.4556005001068115, -1.4157979488372803, -1.375995397567749, -1.3361928462982178, -1.2963902950286865, -1.2565877437591553, -1.216785192489624, -1.1769826412200928, -1.1371800899505615, -1.0973775386810303, -1.0575751066207886, -1.0177725553512573, -0.9779700040817261, -0.9381674528121948, -0.8983649015426636, -0.8585623502731323, -0.8187597990036011, -0.7789572477340698, -0.7391547560691833, -0.6993522047996521, -0.6595496535301208, -0.6197471022605896, -0.5799445509910583, -0.5401419997215271, -0.5003395080566406, -0.460536926984787, -0.42073437571525574, -0.3809318244457245, -0.34112927317619324, -0.3013267517089844, -0.2615242004394531, -0.22172163426876068, -0.18191909790039062, -0.14211654663085938, -0.10231399536132812, -0.06251144409179688, -0.022708900272846222, 0.01709364354610443, 0.05689619481563568, 0.09669874608516693, 0.136501282453537, 0.17630383372306824, 0.2161063849925995, 0.25590893626213074, 0.295711487531662, 0.33551400899887085, 0.3753165602684021, 0.41511911153793335, 0.4549216628074646, 0.49472421407699585, 0.5345267653465271]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 17.0, 22.0, 23.0, 23.0, 25.0, 37.0, 32.0, 30.0, 42.0, 33.0, 49.0, 57.0, 58.0, 44.0, 56.0, 49.0, 43.0, 46.0, 32.0, 31.0, 44.0, 25.0, 25.0, 22.0, 21.0, 18.0, 10.0, 11.0, 11.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43947523832321167, -0.42583146691322327, -0.41218769550323486, -0.39854392409324646, -0.38490015268325806, -0.37125638127326965, -0.35761260986328125, -0.34396880865097046, -0.33032506704330444, -0.31668129563331604, -0.30303752422332764, -0.28939375281333923, -0.27574998140335083, -0.2621062099933624, -0.24846242368221283, -0.23481865227222443, -0.22117486596107483, -0.20753109455108643, -0.19388732314109802, -0.18024355173110962, -0.16659978032112122, -0.1529560089111328, -0.13931222259998322, -0.1256684511899948, -0.11202467978000641, -0.098380908370018, -0.0847371369600296, -0.0710933580994606, -0.0574495866894722, -0.043805815279483795, -0.030162036418914795, -0.01651826500892639, -0.0028744935989379883, 0.010769279673695564, 0.024413052946329117, 0.03805682808160782, 0.05170059949159622, 0.06534437090158463, 0.07898814976215363, 0.09263192117214203, 0.10627569258213043, 0.11991946399211884, 0.13356323540210724, 0.14720702171325684, 0.16085079312324524, 0.17449456453323364, 0.18813833594322205, 0.20178210735321045, 0.21542587876319885, 0.22906965017318726, 0.24271342158317566, 0.25635719299316406, 0.27000096440315247, 0.28364473581314087, 0.29728853702545166, 0.3109322786331177, 0.32457607984542847, 0.33821985125541687, 0.3518636226654053, 0.3655073940753937, 0.3791511654853821, 0.3927949368953705, 0.4064387083053589, 0.4200825095176697, 0.4337262511253357]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 18.0, 17.0, 27.0, 34.0, 50.0, 119.0, 168.0, 320.0, 529.0, 935.0, 1518.0, 2564.0, 4371.0, 6926.0, 11395.0, 18997.0, 32566.0, 59179.0, 120823.0, 243142.0, 258746.0, 134388.0, 65177.0, 34902.0, 20471.0, 12373.0, 7424.0, 4599.0, 2720.0, 1645.0, 974.0, 574.0, 382.0, 193.0, 108.0, 72.0, 48.0, 32.0, 11.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10052490234375, -0.09694385528564453, -0.09336280822753906, -0.0897817611694336, -0.08620071411132812, -0.08261966705322266, -0.07903861999511719, -0.07545757293701172, -0.07187652587890625, -0.06829547882080078, -0.06471443176269531, -0.061133384704589844, -0.057552337646484375, -0.053971290588378906, -0.05039024353027344, -0.04680919647216797, -0.0432281494140625, -0.03964710235595703, -0.03606605529785156, -0.032485008239746094, -0.028903961181640625, -0.025322914123535156, -0.021741867065429688, -0.01816082000732422, -0.01457977294921875, -0.010998725891113281, -0.0074176788330078125, -0.0038366317749023438, -0.000255584716796875, 0.0033254623413085938, 0.0069065093994140625, 0.010487556457519531, 0.014068603515625, 0.01764965057373047, 0.021230697631835938, 0.024811744689941406, 0.028392791748046875, 0.031973838806152344, 0.03555488586425781, 0.03913593292236328, 0.04271697998046875, 0.04629802703857422, 0.04987907409667969, 0.053460121154785156, 0.057041168212890625, 0.060622215270996094, 0.06420326232910156, 0.06778430938720703, 0.0713653564453125, 0.07494640350341797, 0.07852745056152344, 0.0821084976196289, 0.08568954467773438, 0.08927059173583984, 0.09285163879394531, 0.09643268585205078, 0.10001373291015625, 0.10359477996826172, 0.10717582702636719, 0.11075687408447266, 0.11433792114257812, 0.1179189682006836, 0.12150001525878906, 0.12508106231689453, 0.128662109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 12.0, 14.0, 20.0, 10.0, 20.0, 16.0, 26.0, 28.0, 30.0, 40.0, 33.0, 61.0, 50.0, 48.0, 50.0, 43.0, 55.0, 41.0, 45.0, 37.0, 46.0, 42.0, 38.0, 25.0, 23.0, 20.0, 24.0, 12.0, 11.0, 8.0, 12.0, 5.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08428955078125, -0.08184432983398438, -0.07939910888671875, -0.07695388793945312, -0.0745086669921875, -0.07206344604492188, -0.06961822509765625, -0.06717300415039062, -0.064727783203125, -0.062282562255859375, -0.05983734130859375, -0.057392120361328125, -0.0549468994140625, -0.052501678466796875, -0.05005645751953125, -0.047611236572265625, -0.045166015625, -0.042720794677734375, -0.04027557373046875, -0.037830352783203125, -0.0353851318359375, -0.032939910888671875, -0.03049468994140625, -0.028049468994140625, -0.025604248046875, -0.023159027099609375, -0.02071380615234375, -0.018268585205078125, -0.0158233642578125, -0.013378143310546875, -0.01093292236328125, -0.008487701416015625, -0.00604248046875, -0.003597259521484375, -0.00115203857421875, 0.001293182373046875, 0.0037384033203125, 0.006183624267578125, 0.00862884521484375, 0.011074066162109375, 0.013519287109375, 0.015964508056640625, 0.01840972900390625, 0.020854949951171875, 0.0233001708984375, 0.025745391845703125, 0.02819061279296875, 0.030635833740234375, 0.0330810546875, 0.035526275634765625, 0.03797149658203125, 0.040416717529296875, 0.0428619384765625, 0.045307159423828125, 0.04775238037109375, 0.050197601318359375, 0.052642822265625, 0.055088043212890625, 0.05753326416015625, 0.059978485107421875, 0.0624237060546875, 0.06486892700195312, 0.06731414794921875, 0.06975936889648438, 0.07220458984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 16.0, 19.0, 18.0, 29.0, 41.0, 76.0, 97.0, 166.0, 296.0, 567.0, 1360.0, 3434.0, 9498.0, 26724.0, 85602.0, 415392.0, 386225.0, 79527.0, 25021.0, 8767.0, 3206.0, 1181.0, 533.0, 258.0, 157.0, 90.0, 75.0, 45.0, 34.0, 27.0, 21.0, 8.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.272216796875, -0.2642040252685547, -0.2561912536621094, -0.24817848205566406, -0.24016571044921875, -0.23215293884277344, -0.22414016723632812, -0.2161273956298828, -0.2081146240234375, -0.2001018524169922, -0.19208908081054688, -0.18407630920410156, -0.17606353759765625, -0.16805076599121094, -0.16003799438476562, -0.1520252227783203, -0.144012451171875, -0.1359996795654297, -0.12798690795898438, -0.11997413635253906, -0.11196136474609375, -0.10394859313964844, -0.09593582153320312, -0.08792304992675781, -0.0799102783203125, -0.07189750671386719, -0.06388473510742188, -0.05587196350097656, -0.04785919189453125, -0.03984642028808594, -0.031833648681640625, -0.023820877075195312, -0.01580810546875, -0.0077953338623046875, 0.000217437744140625, 0.008230209350585938, 0.01624298095703125, 0.024255752563476562, 0.032268524169921875, 0.04028129577636719, 0.0482940673828125, 0.05630683898925781, 0.06431961059570312, 0.07233238220214844, 0.08034515380859375, 0.08835792541503906, 0.09637069702148438, 0.10438346862792969, 0.112396240234375, 0.12040901184082031, 0.12842178344726562, 0.13643455505371094, 0.14444732666015625, 0.15246009826660156, 0.16047286987304688, 0.1684856414794922, 0.1764984130859375, 0.1845111846923828, 0.19252395629882812, 0.20053672790527344, 0.20854949951171875, 0.21656227111816406, 0.22457504272460938, 0.2325878143310547, 0.2406005859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 15.0, 13.0, 20.0, 27.0, 34.0, 52.0, 38.0, 54.0, 63.0, 74.0, 51.0, 56.0, 49.0, 49.0, 54.0, 48.0, 37.0, 28.0, 39.0, 33.0, 21.0, 14.0, 17.0, 17.0, 17.0, 10.0, 2.0, 2.0, 7.0, 6.0, 1.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2127685546875, -0.2040576934814453, -0.19534683227539062, -0.18663597106933594, -0.17792510986328125, -0.16921424865722656, -0.16050338745117188, -0.1517925262451172, -0.1430816650390625, -0.1343708038330078, -0.12565994262695312, -0.11694908142089844, -0.10823822021484375, -0.09952735900878906, -0.09081649780273438, -0.08210563659667969, -0.073394775390625, -0.06468391418457031, -0.055973052978515625, -0.04726219177246094, -0.03855133056640625, -0.029840469360351562, -0.021129608154296875, -0.012418746948242188, -0.0037078857421875, 0.0050029754638671875, 0.013713836669921875, 0.022424697875976562, 0.03113555908203125, 0.03984642028808594, 0.048557281494140625, 0.05726814270019531, 0.06597900390625, 0.07468986511230469, 0.08340072631835938, 0.09211158752441406, 0.10082244873046875, 0.10953330993652344, 0.11824417114257812, 0.1269550323486328, 0.1356658935546875, 0.1443767547607422, 0.15308761596679688, 0.16179847717285156, 0.17050933837890625, 0.17922019958496094, 0.18793106079101562, 0.1966419219970703, 0.205352783203125, 0.2140636444091797, 0.22277450561523438, 0.23148536682128906, 0.24019622802734375, 0.24890708923339844, 0.2576179504394531, 0.2663288116455078, 0.2750396728515625, 0.2837505340576172, 0.2924613952636719, 0.30117225646972656, 0.30988311767578125, 0.31859397888183594, 0.3273048400878906, 0.3360157012939453, 0.3447265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 10.0, 8.0, 6.0, 12.0, 21.0, 24.0, 34.0, 67.0, 81.0, 169.0, 275.0, 425.0, 783.0, 1429.0, 2356.0, 4013.0, 7373.0, 13270.0, 24543.0, 50602.0, 155829.0, 463295.0, 201443.0, 61092.0, 27784.0, 14610.0, 8106.0, 4689.0, 2566.0, 1466.0, 884.0, 501.0, 282.0, 178.0, 110.0, 72.0, 48.0, 28.0, 20.0, 10.0, 5.0, 5.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.0836181640625, -0.08112907409667969, -0.07863998413085938, -0.07615089416503906, -0.07366180419921875, -0.07117271423339844, -0.06868362426757812, -0.06619453430175781, -0.0637054443359375, -0.06121635437011719, -0.058727264404296875, -0.05623817443847656, -0.05374908447265625, -0.05125999450683594, -0.048770904541015625, -0.04628181457519531, -0.043792724609375, -0.04130363464355469, -0.038814544677734375, -0.03632545471191406, -0.03383636474609375, -0.03134727478027344, -0.028858184814453125, -0.026369094848632812, -0.0238800048828125, -0.021390914916992188, -0.018901824951171875, -0.016412734985351562, -0.01392364501953125, -0.011434555053710938, -0.008945465087890625, -0.0064563751220703125, -0.00396728515625, -0.0014781951904296875, 0.001010894775390625, 0.0034999847412109375, 0.00598907470703125, 0.008478164672851562, 0.010967254638671875, 0.013456344604492188, 0.0159454345703125, 0.018434524536132812, 0.020923614501953125, 0.023412704467773438, 0.02590179443359375, 0.028390884399414062, 0.030879974365234375, 0.03336906433105469, 0.035858154296875, 0.03834724426269531, 0.040836334228515625, 0.04332542419433594, 0.04581451416015625, 0.04830360412597656, 0.050792694091796875, 0.05328178405761719, 0.0557708740234375, 0.05825996398925781, 0.060749053955078125, 0.06323814392089844, 0.06572723388671875, 0.06821632385253906, 0.07070541381835938, 0.07319450378417969, 0.07568359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 14.0, 12.0, 18.0, 28.0, 32.0, 45.0, 70.0, 101.0, 124.0, 123.0, 78.0, 95.0, 75.0, 36.0, 36.0, 24.0, 15.0, 7.0, 10.0, 9.0, 9.0, 4.0, 4.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3484230041503906e-05, -2.262834459543228e-05, -2.1772459149360657e-05, -2.0916573703289032e-05, -2.0060688257217407e-05, -1.9204802811145782e-05, -1.8348917365074158e-05, -1.7493031919002533e-05, -1.6637146472930908e-05, -1.5781261026859283e-05, -1.4925375580787659e-05, -1.4069490134716034e-05, -1.321360468864441e-05, -1.2357719242572784e-05, -1.150183379650116e-05, -1.0645948350429535e-05, -9.79006290435791e-06, -8.934177458286285e-06, -8.07829201221466e-06, -7.222406566143036e-06, -6.366521120071411e-06, -5.510635673999786e-06, -4.654750227928162e-06, -3.798864781856537e-06, -2.942979335784912e-06, -2.0870938897132874e-06, -1.2312084436416626e-06, -3.7532299757003784e-07, 4.805624485015869e-07, 1.3364478945732117e-06, 2.1923333406448364e-06, 3.048218786716461e-06, 3.904104232788086e-06, 4.759989678859711e-06, 5.6158751249313354e-06, 6.47176057100296e-06, 7.327646017074585e-06, 8.18353146314621e-06, 9.039416909217834e-06, 9.89530235528946e-06, 1.0751187801361084e-05, 1.1607073247432709e-05, 1.2462958693504333e-05, 1.3318844139575958e-05, 1.4174729585647583e-05, 1.5030615031719208e-05, 1.5886500477790833e-05, 1.6742385923862457e-05, 1.7598271369934082e-05, 1.8454156816005707e-05, 1.931004226207733e-05, 2.0165927708148956e-05, 2.102181315422058e-05, 2.1877698600292206e-05, 2.273358404636383e-05, 2.3589469492435455e-05, 2.444535493850708e-05, 2.5301240384578705e-05, 2.615712583065033e-05, 2.7013011276721954e-05, 2.786889672279358e-05, 2.8724782168865204e-05, 2.958066761493683e-05, 3.0436553061008453e-05, 3.129243850708008e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 8.0, 5.0, 14.0, 18.0, 22.0, 33.0, 90.0, 100.0, 197.0, 344.0, 666.0, 1332.0, 2902.0, 5972.0, 12796.0, 28213.0, 74618.0, 298863.0, 440298.0, 112851.0, 37742.0, 16610.0, 7631.0, 3583.0, 1748.0, 896.0, 407.0, 247.0, 115.0, 77.0, 41.0, 34.0, 24.0, 21.0, 7.0, 17.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.08970260620117188, -0.08699798583984375, -0.08429336547851562, -0.0815887451171875, -0.07888412475585938, -0.07617950439453125, -0.07347488403320312, -0.070770263671875, -0.06806564331054688, -0.06536102294921875, -0.06265640258789062, -0.0599517822265625, -0.057247161865234375, -0.05454254150390625, -0.051837921142578125, -0.04913330078125, -0.046428680419921875, -0.04372406005859375, -0.041019439697265625, -0.0383148193359375, -0.035610198974609375, -0.03290557861328125, -0.030200958251953125, -0.027496337890625, -0.024791717529296875, -0.02208709716796875, -0.019382476806640625, -0.0166778564453125, -0.013973236083984375, -0.01126861572265625, -0.008563995361328125, -0.005859375, -0.003154754638671875, -0.00045013427734375, 0.002254486083984375, 0.0049591064453125, 0.007663726806640625, 0.01036834716796875, 0.013072967529296875, 0.015777587890625, 0.018482208251953125, 0.02118682861328125, 0.023891448974609375, 0.0265960693359375, 0.029300689697265625, 0.03200531005859375, 0.034709930419921875, 0.03741455078125, 0.040119171142578125, 0.04282379150390625, 0.045528411865234375, 0.0482330322265625, 0.050937652587890625, 0.05364227294921875, 0.056346893310546875, 0.059051513671875, 0.061756134033203125, 0.06446075439453125, 0.06716537475585938, 0.0698699951171875, 0.07257461547851562, 0.07527923583984375, 0.07798385620117188, 0.0806884765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 3.0, 8.0, 7.0, 8.0, 14.0, 15.0, 18.0, 27.0, 30.0, 49.0, 60.0, 93.0, 104.0, 132.0, 88.0, 82.0, 57.0, 49.0, 17.0, 20.0, 21.0, 12.0, 9.0, 11.0, 9.0, 8.0, 5.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0670166015625, -0.06473064422607422, -0.06244468688964844, -0.060158729553222656, -0.057872772216796875, -0.055586814880371094, -0.05330085754394531, -0.05101490020751953, -0.04872894287109375, -0.04644298553466797, -0.04415702819824219, -0.041871070861816406, -0.039585113525390625, -0.037299156188964844, -0.03501319885253906, -0.03272724151611328, -0.0304412841796875, -0.02815532684326172, -0.025869369506835938, -0.023583412170410156, -0.021297454833984375, -0.019011497497558594, -0.016725540161132812, -0.014439582824707031, -0.01215362548828125, -0.009867668151855469, -0.0075817108154296875, -0.005295753479003906, -0.003009796142578125, -0.0007238388061523438, 0.0015621185302734375, 0.0038480758666992188, 0.006134033203125, 0.008419990539550781, 0.010705947875976562, 0.012991905212402344, 0.015277862548828125, 0.017563819885253906, 0.019849777221679688, 0.02213573455810547, 0.02442169189453125, 0.02670764923095703, 0.028993606567382812, 0.031279563903808594, 0.033565521240234375, 0.035851478576660156, 0.03813743591308594, 0.04042339324951172, 0.0427093505859375, 0.04499530792236328, 0.04728126525878906, 0.049567222595214844, 0.051853179931640625, 0.054139137268066406, 0.05642509460449219, 0.05871105194091797, 0.06099700927734375, 0.06328296661376953, 0.06556892395019531, 0.0678548812866211, 0.07014083862304688, 0.07242679595947266, 0.07471275329589844, 0.07699871063232422, 0.07928466796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 16.0, 19.0, 28.0, 37.0, 55.0, 44.0, 82.0, 91.0, 88.0, 83.0, 79.0, 80.0, 65.0, 46.0, 37.0, 33.0, 28.0, 16.0, 17.0, 9.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5222840309143066, -0.5018109083175659, -0.4813377261161804, -0.4608645737171173, -0.4403914213180542, -0.4199182987213135, -0.39944514632225037, -0.37897199392318726, -0.35849884152412415, -0.33802568912506104, -0.3175525367259979, -0.2970793843269348, -0.2766062617301941, -0.2561330795288086, -0.23565995693206787, -0.21518680453300476, -0.19471365213394165, -0.17424049973487854, -0.15376734733581543, -0.1332942098379135, -0.1128210574388504, -0.09234790503978729, -0.07187476009130478, -0.051401615142822266, -0.030928462743759155, -0.010455314069986343, 0.010017834603786469, 0.03049098327755928, 0.05096413195133209, 0.0714372843503952, 0.09191042929887772, 0.11238357424736023, 0.13285678625106812, 0.15332993865013123, 0.17380309104919434, 0.19427622854709625, 0.21474938094615936, 0.23522253334522247, 0.2556956708431244, 0.2761688232421875, 0.2966419756412506, 0.3171151280403137, 0.33758828043937683, 0.35806143283843994, 0.37853455543518066, 0.39900773763656616, 0.4194808602333069, 0.43995401263237, 0.4604271650314331, 0.4809003174304962, 0.5013734698295593, 0.5218465924263, 0.5423197746276855, 0.5627928972244263, 0.5832660794258118, 0.6037392020225525, 0.624212384223938, 0.6446855068206787, 0.6651586890220642, 0.6856318116188049, 0.7061049938201904, 0.7265781164169312, 0.7470512986183167, 0.7675244212150574, 0.7879975438117981]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 11.0, 10.0, 11.0, 10.0, 17.0, 13.0, 21.0, 16.0, 30.0, 26.0, 25.0, 31.0, 31.0, 39.0, 36.0, 47.0, 31.0, 36.0, 45.0, 43.0, 42.0, 31.0, 30.0, 32.0, 34.0, 36.0, 31.0, 25.0, 25.0, 25.0, 20.0, 22.0, 16.0, 17.0, 10.0, 16.0, 10.0, 9.0, 7.0, 7.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.5383294224739075, -0.520634114742279, -0.5029388666152954, -0.485243558883667, -0.4675482511520386, -0.44985294342041016, -0.4321576654911041, -0.4144623875617981, -0.3967670798301697, -0.37907177209854126, -0.36137649416923523, -0.3436812162399292, -0.3259859085083008, -0.30829060077667236, -0.29059532284736633, -0.2729000449180603, -0.2552047371864319, -0.23750944435596466, -0.21981415152549744, -0.2021188586950302, -0.184423565864563, -0.16672827303409576, -0.14903298020362854, -0.13133768737316132, -0.11364239454269409, -0.09594710171222687, -0.07825180888175964, -0.06055651605129242, -0.042861223220825195, -0.02516593039035797, -0.007470637559890747, 0.010224655270576477, 0.027920007705688477, 0.0456153005361557, 0.06331059336662292, 0.08100588619709015, 0.09870117902755737, 0.1163964718580246, 0.13409176468849182, 0.15178705751895905, 0.16948235034942627, 0.1871776431798935, 0.20487293601036072, 0.22256822884082794, 0.24026352167129517, 0.2579588294029236, 0.2756541073322296, 0.29334938526153564, 0.31104469299316406, 0.3287400007247925, 0.3464352786540985, 0.36413055658340454, 0.38182586431503296, 0.3995211720466614, 0.4172164499759674, 0.43491172790527344, 0.45260703563690186, 0.4703023433685303, 0.4879976212978363, 0.5056928992271423, 0.5233882069587708, 0.5410835146903992, 0.5587787628173828, 0.5764740705490112, 0.5941693782806396]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 12.0, 18.0, 19.0, 25.0, 52.0, 71.0, 111.0, 176.0, 271.0, 476.0, 910.0, 1824.0, 3659.0, 8196.0, 20183.0, 54669.0, 175087.0, 781907.0, 2428191.0, 519374.0, 127768.0, 42106.0, 16098.0, 6947.0, 2951.0, 1349.0, 785.0, 412.0, 209.0, 150.0, 86.0, 63.0, 30.0, 31.0, 14.0, 15.0, 12.0, 10.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.142578125, -0.1385478973388672, -0.13451766967773438, -0.13048744201660156, -0.12645721435546875, -0.12242698669433594, -0.11839675903320312, -0.11436653137207031, -0.1103363037109375, -0.10630607604980469, -0.10227584838867188, -0.09824562072753906, -0.09421539306640625, -0.09018516540527344, -0.08615493774414062, -0.08212471008300781, -0.078094482421875, -0.07406425476074219, -0.07003402709960938, -0.06600379943847656, -0.06197357177734375, -0.05794334411621094, -0.053913116455078125, -0.04988288879394531, -0.0458526611328125, -0.04182243347167969, -0.037792205810546875, -0.03376197814941406, -0.02973175048828125, -0.025701522827148438, -0.021671295166015625, -0.017641067504882812, -0.01361083984375, -0.009580612182617188, -0.005550384521484375, -0.0015201568603515625, 0.00251007080078125, 0.0065402984619140625, 0.010570526123046875, 0.014600753784179688, 0.0186309814453125, 0.022661209106445312, 0.026691436767578125, 0.030721664428710938, 0.03475189208984375, 0.03878211975097656, 0.042812347412109375, 0.04684257507324219, 0.050872802734375, 0.05490303039550781, 0.058933258056640625, 0.06296348571777344, 0.06699371337890625, 0.07102394104003906, 0.07505416870117188, 0.07908439636230469, 0.0831146240234375, 0.08714485168457031, 0.09117507934570312, 0.09520530700683594, 0.09923553466796875, 0.10326576232910156, 0.10729598999023438, 0.11132621765136719, 0.1153564453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 14.0, 18.0, 11.0, 24.0, 22.0, 22.0, 29.0, 31.0, 26.0, 29.0, 42.0, 36.0, 40.0, 46.0, 51.0, 49.0, 47.0, 35.0, 43.0, 45.0, 31.0, 36.0, 28.0, 30.0, 30.0, 26.0, 24.0, 16.0, 22.0, 12.0, 9.0, 10.0, 10.0, 6.0, 5.0, 9.0, 6.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07720947265625, -0.07454204559326172, -0.07187461853027344, -0.06920719146728516, -0.06653976440429688, -0.0638723373413086, -0.06120491027832031, -0.05853748321533203, -0.05587005615234375, -0.05320262908935547, -0.05053520202636719, -0.047867774963378906, -0.045200347900390625, -0.042532920837402344, -0.03986549377441406, -0.03719806671142578, -0.0345306396484375, -0.03186321258544922, -0.029195785522460938, -0.026528358459472656, -0.023860931396484375, -0.021193504333496094, -0.018526077270507812, -0.01585865020751953, -0.01319122314453125, -0.010523796081542969, -0.007856369018554688, -0.005188941955566406, -0.002521514892578125, 0.00014591217041015625, 0.0028133392333984375, 0.005480766296386719, 0.008148193359375, 0.010815620422363281, 0.013483047485351562, 0.016150474548339844, 0.018817901611328125, 0.021485328674316406, 0.024152755737304688, 0.02682018280029297, 0.02948760986328125, 0.03215503692626953, 0.03482246398925781, 0.037489891052246094, 0.040157318115234375, 0.042824745178222656, 0.04549217224121094, 0.04815959930419922, 0.0508270263671875, 0.05349445343017578, 0.05616188049316406, 0.058829307556152344, 0.061496734619140625, 0.0641641616821289, 0.06683158874511719, 0.06949901580810547, 0.07216644287109375, 0.07483386993408203, 0.07750129699707031, 0.0801687240600586, 0.08283615112304688, 0.08550357818603516, 0.08817100524902344, 0.09083843231201172, 0.093505859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 13.0, 15.0, 14.0, 25.0, 38.0, 55.0, 66.0, 86.0, 128.0, 221.0, 349.0, 570.0, 905.0, 1591.0, 2834.0, 5769.0, 12501.0, 31583.0, 91128.0, 318455.0, 1590070.0, 1657637.0, 328848.0, 93287.0, 32282.0, 12892.0, 5810.0, 3030.0, 1552.0, 918.0, 537.0, 342.0, 214.0, 184.0, 95.0, 53.0, 54.0, 39.0, 24.0, 15.0, 14.0, 8.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1961669921875, -0.190399169921875, -0.18463134765625, -0.178863525390625, -0.173095703125, -0.167327880859375, -0.16156005859375, -0.155792236328125, -0.1500244140625, -0.144256591796875, -0.13848876953125, -0.132720947265625, -0.126953125, -0.121185302734375, -0.11541748046875, -0.109649658203125, -0.1038818359375, -0.098114013671875, -0.09234619140625, -0.086578369140625, -0.080810546875, -0.075042724609375, -0.06927490234375, -0.063507080078125, -0.0577392578125, -0.051971435546875, -0.04620361328125, -0.040435791015625, -0.03466796875, -0.028900146484375, -0.02313232421875, -0.017364501953125, -0.0115966796875, -0.005828857421875, -6.103515625e-05, 0.005706787109375, 0.011474609375, 0.017242431640625, 0.02301025390625, 0.028778076171875, 0.0345458984375, 0.040313720703125, 0.04608154296875, 0.051849365234375, 0.0576171875, 0.063385009765625, 0.06915283203125, 0.074920654296875, 0.0806884765625, 0.086456298828125, 0.09222412109375, 0.097991943359375, 0.103759765625, 0.109527587890625, 0.11529541015625, 0.121063232421875, 0.1268310546875, 0.132598876953125, 0.13836669921875, 0.144134521484375, 0.14990234375, 0.155670166015625, 0.16143798828125, 0.167205810546875, 0.1729736328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 7.0, 11.0, 16.0, 16.0, 34.0, 42.0, 73.0, 80.0, 128.0, 267.0, 447.0, 774.0, 886.0, 543.0, 272.0, 180.0, 92.0, 65.0, 45.0, 32.0, 19.0, 9.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376708984375, -0.23123741149902344, -0.22480392456054688, -0.2183704376220703, -0.21193695068359375, -0.2055034637451172, -0.19906997680664062, -0.19263648986816406, -0.1862030029296875, -0.17976951599121094, -0.17333602905273438, -0.1669025421142578, -0.16046905517578125, -0.1540355682373047, -0.14760208129882812, -0.14116859436035156, -0.134735107421875, -0.12830162048339844, -0.12186813354492188, -0.11543464660644531, -0.10900115966796875, -0.10256767272949219, -0.09613418579101562, -0.08970069885253906, -0.0832672119140625, -0.07683372497558594, -0.07040023803710938, -0.06396675109863281, -0.05753326416015625, -0.05109977722167969, -0.044666290283203125, -0.03823280334472656, -0.03179931640625, -0.025365829467773438, -0.018932342529296875, -0.012498855590820312, -0.00606536865234375, 0.0003681182861328125, 0.006801605224609375, 0.013235092163085938, 0.0196685791015625, 0.026102066040039062, 0.032535552978515625, 0.03896903991699219, 0.04540252685546875, 0.05183601379394531, 0.058269500732421875, 0.06470298767089844, 0.071136474609375, 0.07756996154785156, 0.08400344848632812, 0.09043693542480469, 0.09687042236328125, 0.10330390930175781, 0.10973739624023438, 0.11617088317871094, 0.1226043701171875, 0.12903785705566406, 0.13547134399414062, 0.1419048309326172, 0.14833831787109375, 0.1547718048095703, 0.16120529174804688, 0.16763877868652344, 0.174072265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 16.0, 18.0, 34.0, 69.0, 92.0, 117.0, 143.0, 144.0, 131.0, 93.0, 49.0, 41.0, 31.0, 11.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5276952981948853, -1.4954850673675537, -1.4632747173309326, -1.431064486503601, -1.39885413646698, -1.3666439056396484, -1.3344335556030273, -1.3022233247756958, -1.2700129747390747, -1.2378027439117432, -1.205592393875122, -1.1733821630477905, -1.1411718130111694, -1.108961582183838, -1.0767512321472168, -1.0445410013198853, -1.0123307704925537, -0.9801204800605774, -0.9479101896286011, -0.9156998991966248, -0.8834896087646484, -0.8512793183326721, -0.8190690279006958, -0.7868587970733643, -0.7546484470367432, -0.7224381566047668, -0.6902278661727905, -0.6580175757408142, -0.6258072853088379, -0.5935969948768616, -0.5613867044448853, -0.5291764736175537, -0.4969661831855774, -0.4647558927536011, -0.43254560232162476, -0.40033531188964844, -0.3681250214576721, -0.3359147310256958, -0.30370447039604187, -0.27149417996406555, -0.23928388953208923, -0.20707359910011292, -0.1748633086681366, -0.14265303313732147, -0.11044274270534515, -0.07823245227336884, -0.04602217674255371, -0.013811886310577393, 0.018398404121398926, 0.050608690828084946, 0.08281897753477097, 0.11502926051616669, 0.147239550948143, 0.17944984138011932, 0.21166011691093445, 0.24387040734291077, 0.2760806977748871, 0.3082909882068634, 0.3405012786388397, 0.37271153926849365, 0.40492182970046997, 0.4371321201324463, 0.4693424105644226, 0.5015527009963989, 0.5337629914283752]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 10.0, 14.0, 14.0, 24.0, 26.0, 17.0, 29.0, 31.0, 36.0, 33.0, 29.0, 44.0, 46.0, 47.0, 49.0, 38.0, 31.0, 47.0, 42.0, 43.0, 51.0, 30.0, 29.0, 27.0, 27.0, 23.0, 18.0, 26.0, 25.0, 14.0, 16.0, 11.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48495209217071533, -0.46984732151031494, -0.45474252104759216, -0.4396377503871918, -0.424532949924469, -0.4094281792640686, -0.3943234086036682, -0.37921860814094543, -0.36411380767822266, -0.34900903701782227, -0.3339042365550995, -0.3187994658946991, -0.3036946654319763, -0.2885898947715759, -0.27348512411117554, -0.25838032364845276, -0.24327555298805237, -0.22817076742649078, -0.2130659818649292, -0.1979612112045288, -0.18285641074180603, -0.16775164008140564, -0.15264685451984406, -0.13754206895828247, -0.12243728339672089, -0.1073324978351593, -0.09222771227359772, -0.07712293416261673, -0.062018148601055145, -0.04691336303949356, -0.03180858492851257, -0.01670379936695099, -0.0015990138053894043, 0.013505769893527031, 0.028610553592443466, 0.04371533542871475, 0.05882012099027634, 0.07392490655183792, 0.08902968466281891, 0.1041344702243805, 0.11923925578594208, 0.13434404134750366, 0.14944882690906525, 0.16455361247062683, 0.17965838313102722, 0.19476318359375, 0.2098679542541504, 0.22497273981571198, 0.24007752537727356, 0.25518229603767395, 0.27028709650039673, 0.2853918671607971, 0.3004966676235199, 0.3156014382839203, 0.33070623874664307, 0.34581100940704346, 0.36091578006744385, 0.37602055072784424, 0.391125351190567, 0.4062301218509674, 0.4213349223136902, 0.4364396929740906, 0.45154446363449097, 0.46664926409721375, 0.4817540645599365]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 9.0, 2.0, 11.0, 10.0, 10.0, 10.0, 18.0, 27.0, 54.0, 69.0, 123.0, 196.0, 361.0, 688.0, 1118.0, 2270.0, 4415.0, 8673.0, 17216.0, 35711.0, 76400.0, 172875.0, 316340.0, 223068.0, 99043.0, 45863.0, 21791.0, 10688.0, 5383.0, 2724.0, 1450.0, 775.0, 461.0, 271.0, 135.0, 106.0, 63.0, 48.0, 15.0, 29.0, 8.0, 10.0, 10.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.152587890625, -0.14818572998046875, -0.1437835693359375, -0.13938140869140625, -0.134979248046875, -0.13057708740234375, -0.1261749267578125, -0.12177276611328125, -0.11737060546875, -0.11296844482421875, -0.1085662841796875, -0.10416412353515625, -0.099761962890625, -0.09535980224609375, -0.0909576416015625, -0.08655548095703125, -0.0821533203125, -0.07775115966796875, -0.0733489990234375, -0.06894683837890625, -0.064544677734375, -0.06014251708984375, -0.0557403564453125, -0.05133819580078125, -0.04693603515625, -0.04253387451171875, -0.0381317138671875, -0.03372955322265625, -0.029327392578125, -0.02492523193359375, -0.0205230712890625, -0.01612091064453125, -0.01171875, -0.00731658935546875, -0.0029144287109375, 0.00148773193359375, 0.005889892578125, 0.01029205322265625, 0.0146942138671875, 0.01909637451171875, 0.02349853515625, 0.02790069580078125, 0.0323028564453125, 0.03670501708984375, 0.041107177734375, 0.04550933837890625, 0.0499114990234375, 0.05431365966796875, 0.0587158203125, 0.06311798095703125, 0.0675201416015625, 0.07192230224609375, 0.076324462890625, 0.08072662353515625, 0.0851287841796875, 0.08953094482421875, 0.09393310546875, 0.09833526611328125, 0.1027374267578125, 0.10713958740234375, 0.111541748046875, 0.11594390869140625, 0.1203460693359375, 0.12474822998046875, 0.129150390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 16.0, 14.0, 16.0, 22.0, 12.0, 22.0, 23.0, 25.0, 23.0, 26.0, 29.0, 44.0, 48.0, 55.0, 43.0, 50.0, 42.0, 61.0, 39.0, 39.0, 39.0, 33.0, 34.0, 35.0, 24.0, 23.0, 22.0, 13.0, 22.0, 13.0, 13.0, 15.0, 6.0, 6.0, 4.0, 9.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.0837850570678711, -0.08108329772949219, -0.07838153839111328, -0.07567977905273438, -0.07297801971435547, -0.07027626037597656, -0.06757450103759766, -0.06487274169921875, -0.062170982360839844, -0.05946922302246094, -0.05676746368408203, -0.054065704345703125, -0.05136394500732422, -0.04866218566894531, -0.045960426330566406, -0.0432586669921875, -0.040556907653808594, -0.03785514831542969, -0.03515338897705078, -0.032451629638671875, -0.02974987030029297, -0.027048110961914062, -0.024346351623535156, -0.02164459228515625, -0.018942832946777344, -0.016241073608398438, -0.013539314270019531, -0.010837554931640625, -0.008135795593261719, -0.0054340362548828125, -0.0027322769165039062, -3.0517578125e-05, 0.0026712417602539062, 0.0053730010986328125, 0.008074760437011719, 0.010776519775390625, 0.013478279113769531, 0.016180038452148438, 0.018881797790527344, 0.02158355712890625, 0.024285316467285156, 0.026987075805664062, 0.02968883514404297, 0.032390594482421875, 0.03509235382080078, 0.03779411315917969, 0.040495872497558594, 0.0431976318359375, 0.045899391174316406, 0.04860115051269531, 0.05130290985107422, 0.054004669189453125, 0.05670642852783203, 0.05940818786621094, 0.062109947204589844, 0.06481170654296875, 0.06751346588134766, 0.07021522521972656, 0.07291698455810547, 0.07561874389648438, 0.07832050323486328, 0.08102226257324219, 0.0837240219116211, 0.08642578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 15.0, 31.0, 16.0, 37.0, 50.0, 66.0, 99.0, 182.0, 258.0, 573.0, 1282.0, 3652.0, 12389.0, 45888.0, 205974.0, 575010.0, 151554.0, 36305.0, 9736.0, 3095.0, 1111.0, 503.0, 251.0, 138.0, 87.0, 65.0, 35.0, 37.0, 23.0, 16.0, 13.0, 12.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2864036560058594, -0.27666473388671875, -0.2669258117675781, -0.2571868896484375, -0.24744796752929688, -0.23770904541015625, -0.22797012329101562, -0.218231201171875, -0.20849227905273438, -0.19875335693359375, -0.18901443481445312, -0.1792755126953125, -0.16953659057617188, -0.15979766845703125, -0.15005874633789062, -0.14031982421875, -0.13058090209960938, -0.12084197998046875, -0.11110305786132812, -0.1013641357421875, -0.09162521362304688, -0.08188629150390625, -0.07214736938476562, -0.062408447265625, -0.052669525146484375, -0.04293060302734375, -0.033191680908203125, -0.0234527587890625, -0.013713836669921875, -0.00397491455078125, 0.005764007568359375, 0.0155029296875, 0.025241851806640625, 0.03498077392578125, 0.044719696044921875, 0.0544586181640625, 0.06419754028320312, 0.07393646240234375, 0.08367538452148438, 0.093414306640625, 0.10315322875976562, 0.11289215087890625, 0.12263107299804688, 0.1323699951171875, 0.14210891723632812, 0.15184783935546875, 0.16158676147460938, 0.17132568359375, 0.18106460571289062, 0.19080352783203125, 0.20054244995117188, 0.2102813720703125, 0.22002029418945312, 0.22975921630859375, 0.23949813842773438, 0.249237060546875, 0.2589759826660156, 0.26871490478515625, 0.2784538269042969, 0.2881927490234375, 0.2979316711425781, 0.30767059326171875, 0.3174095153808594, 0.3271484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 10.0, 14.0, 5.0, 16.0, 12.0, 20.0, 28.0, 34.0, 38.0, 45.0, 63.0, 54.0, 62.0, 68.0, 63.0, 67.0, 64.0, 48.0, 50.0, 38.0, 41.0, 42.0, 21.0, 16.0, 24.0, 13.0, 12.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.38525390625, -0.3737602233886719, -0.36226654052734375, -0.3507728576660156, -0.3392791748046875, -0.3277854919433594, -0.31629180908203125, -0.3047981262207031, -0.293304443359375, -0.2818107604980469, -0.27031707763671875, -0.2588233947753906, -0.2473297119140625, -0.23583602905273438, -0.22434234619140625, -0.21284866333007812, -0.20135498046875, -0.18986129760742188, -0.17836761474609375, -0.16687393188476562, -0.1553802490234375, -0.14388656616210938, -0.13239288330078125, -0.12089920043945312, -0.109405517578125, -0.09791183471679688, -0.08641815185546875, -0.07492446899414062, -0.0634307861328125, -0.051937103271484375, -0.04044342041015625, -0.028949737548828125, -0.0174560546875, -0.005962371826171875, 0.00553131103515625, 0.017024993896484375, 0.0285186767578125, 0.040012359619140625, 0.05150604248046875, 0.06299972534179688, 0.074493408203125, 0.08598709106445312, 0.09748077392578125, 0.10897445678710938, 0.1204681396484375, 0.13196182250976562, 0.14345550537109375, 0.15494918823242188, 0.16644287109375, 0.17793655395507812, 0.18943023681640625, 0.20092391967773438, 0.2124176025390625, 0.22391128540039062, 0.23540496826171875, 0.24689865112304688, 0.258392333984375, 0.2698860168457031, 0.28137969970703125, 0.2928733825683594, 0.3043670654296875, 0.3158607482910156, 0.32735443115234375, 0.3388481140136719, 0.350341796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 12.0, 22.0, 34.0, 63.0, 76.0, 110.0, 161.0, 282.0, 501.0, 1038.0, 2015.0, 4137.0, 8959.0, 19172.0, 41385.0, 94187.0, 292851.0, 371413.0, 118998.0, 49442.0, 23077.0, 10578.0, 5035.0, 2319.0, 1168.0, 597.0, 330.0, 199.0, 106.0, 78.0, 58.0, 36.0, 29.0, 14.0, 13.0, 14.0, 6.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08209228515625, -0.07953643798828125, -0.0769805908203125, -0.07442474365234375, -0.071868896484375, -0.06931304931640625, -0.0667572021484375, -0.06420135498046875, -0.0616455078125, -0.05908966064453125, -0.0565338134765625, -0.05397796630859375, -0.051422119140625, -0.04886627197265625, -0.0463104248046875, -0.04375457763671875, -0.04119873046875, -0.03864288330078125, -0.0360870361328125, -0.03353118896484375, -0.030975341796875, -0.02841949462890625, -0.0258636474609375, -0.02330780029296875, -0.020751953125, -0.01819610595703125, -0.0156402587890625, -0.01308441162109375, -0.010528564453125, -0.00797271728515625, -0.0054168701171875, -0.00286102294921875, -0.00030517578125, 0.00225067138671875, 0.0048065185546875, 0.00736236572265625, 0.009918212890625, 0.01247406005859375, 0.0150299072265625, 0.01758575439453125, 0.0201416015625, 0.02269744873046875, 0.0252532958984375, 0.02780914306640625, 0.030364990234375, 0.03292083740234375, 0.0354766845703125, 0.03803253173828125, 0.04058837890625, 0.04314422607421875, 0.0457000732421875, 0.04825592041015625, 0.050811767578125, 0.05336761474609375, 0.0559234619140625, 0.05847930908203125, 0.06103515625, 0.06359100341796875, 0.0661468505859375, 0.06870269775390625, 0.071258544921875, 0.07381439208984375, 0.0763702392578125, 0.07892608642578125, 0.08148193359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 10.0, 7.0, 6.0, 24.0, 14.0, 31.0, 40.0, 41.0, 61.0, 87.0, 89.0, 99.0, 82.0, 77.0, 92.0, 61.0, 42.0, 38.0, 16.0, 16.0, 15.0, 11.0, 9.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.478288322687149e-05, -1.4068558812141418e-05, -1.3354234397411346e-05, -1.2639909982681274e-05, -1.1925585567951202e-05, -1.121126115322113e-05, -1.0496936738491058e-05, -9.782612323760986e-06, -9.068287909030914e-06, -8.353963494300842e-06, -7.63963907957077e-06, -6.925314664840698e-06, -6.210990250110626e-06, -5.496665835380554e-06, -4.782341420650482e-06, -4.06801700592041e-06, -3.353692591190338e-06, -2.639368176460266e-06, -1.925043761730194e-06, -1.210719347000122e-06, -4.9639493227005e-07, 2.1792948246002197e-07, 9.32253897190094e-07, 1.646578311920166e-06, 2.360902726650238e-06, 3.07522714138031e-06, 3.789551556110382e-06, 4.503875970840454e-06, 5.218200385570526e-06, 5.932524800300598e-06, 6.64684921503067e-06, 7.361173629760742e-06, 8.075498044490814e-06, 8.789822459220886e-06, 9.504146873950958e-06, 1.021847128868103e-05, 1.0932795703411102e-05, 1.1647120118141174e-05, 1.2361444532871246e-05, 1.3075768947601318e-05, 1.379009336233139e-05, 1.4504417777061462e-05, 1.5218742191791534e-05, 1.5933066606521606e-05, 1.664739102125168e-05, 1.736171543598175e-05, 1.8076039850711823e-05, 1.8790364265441895e-05, 1.9504688680171967e-05, 2.021901309490204e-05, 2.093333750963211e-05, 2.1647661924362183e-05, 2.2361986339092255e-05, 2.3076310753822327e-05, 2.37906351685524e-05, 2.450495958328247e-05, 2.5219283998012543e-05, 2.5933608412742615e-05, 2.6647932827472687e-05, 2.736225724220276e-05, 2.807658165693283e-05, 2.8790906071662903e-05, 2.9505230486392975e-05, 3.0219554901123047e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 17.0, 14.0, 36.0, 57.0, 88.0, 179.0, 380.0, 1282.0, 6167.0, 39904.0, 314487.0, 597301.0, 74278.0, 11211.0, 2052.0, 556.0, 210.0, 124.0, 82.0, 47.0, 22.0, 9.0, 11.0, 5.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16275405883789062, -0.15717315673828125, -0.15159225463867188, -0.1460113525390625, -0.14043045043945312, -0.13484954833984375, -0.12926864624023438, -0.123687744140625, -0.11810684204101562, -0.11252593994140625, -0.10694503784179688, -0.1013641357421875, -0.09578323364257812, -0.09020233154296875, -0.08462142944335938, -0.07904052734375, -0.07345962524414062, -0.06787872314453125, -0.062297821044921875, -0.0567169189453125, -0.051136016845703125, -0.04555511474609375, -0.039974212646484375, -0.034393310546875, -0.028812408447265625, -0.02323150634765625, -0.017650604248046875, -0.0120697021484375, -0.006488800048828125, -0.00090789794921875, 0.004673004150390625, 0.01025390625, 0.015834808349609375, 0.02141571044921875, 0.026996612548828125, 0.0325775146484375, 0.038158416748046875, 0.04373931884765625, 0.049320220947265625, 0.054901123046875, 0.060482025146484375, 0.06606292724609375, 0.07164382934570312, 0.0772247314453125, 0.08280563354492188, 0.08838653564453125, 0.09396743774414062, 0.09954833984375, 0.10512924194335938, 0.11071014404296875, 0.11629104614257812, 0.1218719482421875, 0.12745285034179688, 0.13303375244140625, 0.13861465454101562, 0.144195556640625, 0.14977645874023438, 0.15535736083984375, 0.16093826293945312, 0.1665191650390625, 0.17210006713867188, 0.17768096923828125, 0.18326187133789062, 0.1888427734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 2.0, 8.0, 16.0, 19.0, 27.0, 30.0, 33.0, 39.0, 49.0, 76.0, 85.0, 97.0, 107.0, 88.0, 70.0, 42.0, 36.0, 26.0, 31.0, 31.0, 17.0, 11.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0738525390625, -0.07129096984863281, -0.06872940063476562, -0.06616783142089844, -0.06360626220703125, -0.06104469299316406, -0.058483123779296875, -0.05592155456542969, -0.0533599853515625, -0.05079841613769531, -0.048236846923828125, -0.04567527770996094, -0.04311370849609375, -0.04055213928222656, -0.037990570068359375, -0.03542900085449219, -0.032867431640625, -0.030305862426757812, -0.027744293212890625, -0.025182723999023438, -0.02262115478515625, -0.020059585571289062, -0.017498016357421875, -0.014936447143554688, -0.0123748779296875, -0.009813308715820312, -0.007251739501953125, -0.0046901702880859375, -0.00212860107421875, 0.0004329681396484375, 0.002994537353515625, 0.0055561065673828125, 0.00811767578125, 0.010679244995117188, 0.013240814208984375, 0.015802383422851562, 0.01836395263671875, 0.020925521850585938, 0.023487091064453125, 0.026048660278320312, 0.0286102294921875, 0.031171798706054688, 0.033733367919921875, 0.03629493713378906, 0.03885650634765625, 0.04141807556152344, 0.043979644775390625, 0.04654121398925781, 0.049102783203125, 0.05166435241699219, 0.054225921630859375, 0.05678749084472656, 0.05934906005859375, 0.06191062927246094, 0.06447219848632812, 0.06703376770019531, 0.0695953369140625, 0.07215690612792969, 0.07471847534179688, 0.07728004455566406, 0.07984161376953125, 0.08240318298339844, 0.08496475219726562, 0.08752632141113281, 0.090087890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 21.0, 24.0, 54.0, 52.0, 104.0, 135.0, 138.0, 133.0, 110.0, 71.0, 56.0, 45.0, 26.0, 11.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6030570268630981, -1.5689101219177246, -1.534763216972351, -1.5006163120269775, -1.4664695262908936, -1.43232262134552, -1.3981757164001465, -1.364028811454773, -1.3298819065093994, -1.2957350015640259, -1.2615880966186523, -1.2274411916732788, -1.1932942867279053, -1.1591475009918213, -1.1250005960464478, -1.0908536911010742, -1.0567067861557007, -1.0225598812103271, -0.9884129762649536, -0.9542661309242249, -0.9201192259788513, -0.8859723210334778, -0.851825475692749, -0.8176785707473755, -0.783531665802002, -0.7493847608566284, -0.7152378559112549, -0.6810910105705261, -0.6469441056251526, -0.612797200679779, -0.5786503553390503, -0.5445034503936768, -0.510356605052948, -0.47620970010757446, -0.4420628249645233, -0.40791594982147217, -0.37376904487609863, -0.3396221399307251, -0.30547526478767395, -0.2713283896446228, -0.23718148469924927, -0.20303459465503693, -0.16888770461082458, -0.13474081456661224, -0.1005939245223999, -0.06644703447818756, -0.03230014443397522, 0.0018467456102371216, 0.03599363565444946, 0.0701405256986618, 0.10428741574287415, 0.1384343057870865, 0.17258119583129883, 0.20672808587551117, 0.2408749759197235, 0.27502185106277466, 0.3091687560081482, 0.34331566095352173, 0.3774625360965729, 0.411609411239624, 0.44575631618499756, 0.4799032211303711, 0.5140501260757446, 0.5481969714164734, 0.5823438763618469]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 3.0, 2.0, 12.0, 10.0, 12.0, 7.0, 15.0, 15.0, 21.0, 25.0, 25.0, 36.0, 31.0, 50.0, 34.0, 44.0, 39.0, 49.0, 50.0, 35.0, 39.0, 29.0, 50.0, 49.0, 41.0, 38.0, 34.0, 23.0, 31.0, 22.0, 18.0, 20.0, 25.0, 9.0, 14.0, 9.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7246189117431641, -0.7017057538032532, -0.6787925958633423, -0.6558793783187866, -0.6329662203788757, -0.6100530624389648, -0.5871398448944092, -0.5642266869544983, -0.5413135290145874, -0.5184003710746765, -0.49548718333244324, -0.47257399559020996, -0.4496608376502991, -0.4267476797103882, -0.4038344919681549, -0.38092130422592163, -0.35800814628601074, -0.33509498834609985, -0.3121818006038666, -0.2892686128616333, -0.2663554549217224, -0.24344228208065033, -0.22052910923957825, -0.19761593639850616, -0.17470276355743408, -0.151789590716362, -0.12887641787528992, -0.10596324503421783, -0.08305007219314575, -0.06013689935207367, -0.03722372651100159, -0.014310553669929504, 0.008602678775787354, 0.031515851616859436, 0.05442902445793152, 0.0773421972990036, 0.10025537014007568, 0.12316854298114777, 0.14608171582221985, 0.16899488866329193, 0.191908061504364, 0.2148212343454361, 0.23773440718650818, 0.26064759492874146, 0.28356075286865234, 0.30647391080856323, 0.3293870985507965, 0.3523002862930298, 0.3752134442329407, 0.39812660217285156, 0.42103978991508484, 0.4439529776573181, 0.466866135597229, 0.4897792935371399, 0.5126924514770508, 0.5356056690216064, 0.5585188269615173, 0.5814319849014282, 0.6043452024459839, 0.6272583603858948, 0.6501715183258057, 0.6730846762657166, 0.6959978342056274, 0.7189110517501831, 0.741824209690094]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 15.0, 21.0, 36.0, 49.0, 54.0, 108.0, 169.0, 255.0, 355.0, 565.0, 807.0, 1444.0, 2304.0, 3959.0, 6973.0, 11933.0, 22423.0, 43802.0, 93367.0, 231508.0, 710391.0, 1689451.0, 872148.0, 283659.0, 110648.0, 50658.0, 25264.0, 13472.0, 7511.0, 4254.0, 2502.0, 1512.0, 891.0, 577.0, 391.0, 244.0, 170.0, 113.0, 86.0, 52.0, 41.0, 23.0, 20.0, 19.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09295654296875, -0.08981513977050781, -0.08667373657226562, -0.08353233337402344, -0.08039093017578125, -0.07724952697753906, -0.07410812377929688, -0.07096672058105469, -0.0678253173828125, -0.06468391418457031, -0.061542510986328125, -0.05840110778808594, -0.05525970458984375, -0.05211830139160156, -0.048976898193359375, -0.04583549499511719, -0.042694091796875, -0.03955268859863281, -0.036411285400390625, -0.03326988220214844, -0.03012847900390625, -0.026987075805664062, -0.023845672607421875, -0.020704269409179688, -0.0175628662109375, -0.014421463012695312, -0.011280059814453125, -0.008138656616210938, -0.00499725341796875, -0.0018558502197265625, 0.001285552978515625, 0.0044269561767578125, 0.007568359375, 0.010709762573242188, 0.013851165771484375, 0.016992568969726562, 0.02013397216796875, 0.023275375366210938, 0.026416778564453125, 0.029558181762695312, 0.0326995849609375, 0.03584098815917969, 0.038982391357421875, 0.04212379455566406, 0.04526519775390625, 0.04840660095214844, 0.051548004150390625, 0.05468940734863281, 0.057830810546875, 0.06097221374511719, 0.06411361694335938, 0.06725502014160156, 0.07039642333984375, 0.07353782653808594, 0.07667922973632812, 0.07982063293457031, 0.0829620361328125, 0.08610343933105469, 0.08924484252929688, 0.09238624572753906, 0.09552764892578125, 0.09866905212402344, 0.10181045532226562, 0.10495185852050781, 0.10809326171875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 10.0, 4.0, 6.0, 9.0, 10.0, 10.0, 12.0, 10.0, 17.0, 21.0, 17.0, 27.0, 26.0, 34.0, 33.0, 31.0, 33.0, 41.0, 42.0, 37.0, 41.0, 42.0, 39.0, 41.0, 40.0, 41.0, 41.0, 29.0, 45.0, 24.0, 28.0, 28.0, 24.0, 22.0, 16.0, 13.0, 23.0, 11.0, 3.0, 7.0, 4.0, 5.0, 5.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0980224609375, -0.09510993957519531, -0.09219741821289062, -0.08928489685058594, -0.08637237548828125, -0.08345985412597656, -0.08054733276367188, -0.07763481140136719, -0.0747222900390625, -0.07180976867675781, -0.06889724731445312, -0.06598472595214844, -0.06307220458984375, -0.06015968322753906, -0.057247161865234375, -0.05433464050292969, -0.051422119140625, -0.04850959777832031, -0.045597076416015625, -0.04268455505371094, -0.03977203369140625, -0.03685951232910156, -0.033946990966796875, -0.031034469604492188, -0.0281219482421875, -0.025209426879882812, -0.022296905517578125, -0.019384384155273438, -0.01647186279296875, -0.013559341430664062, -0.010646820068359375, -0.0077342987060546875, -0.00482177734375, -0.0019092559814453125, 0.001003265380859375, 0.0039157867431640625, 0.00682830810546875, 0.009740829467773438, 0.012653350830078125, 0.015565872192382812, 0.0184783935546875, 0.021390914916992188, 0.024303436279296875, 0.027215957641601562, 0.03012847900390625, 0.03304100036621094, 0.035953521728515625, 0.03886604309082031, 0.041778564453125, 0.04469108581542969, 0.047603607177734375, 0.05051612854003906, 0.05342864990234375, 0.05634117126464844, 0.059253692626953125, 0.06216621398925781, 0.0650787353515625, 0.06799125671386719, 0.07090377807617188, 0.07381629943847656, 0.07672882080078125, 0.07964134216308594, 0.08255386352539062, 0.08546638488769531, 0.08837890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 11.0, 5.0, 10.0, 13.0, 16.0, 17.0, 31.0, 52.0, 65.0, 104.0, 172.0, 256.0, 455.0, 829.0, 1349.0, 2527.0, 4949.0, 10100.0, 23008.0, 57743.0, 161115.0, 553992.0, 2117138.0, 896333.0, 229072.0, 78314.0, 30348.0, 12979.0, 6168.0, 3088.0, 1650.0, 885.0, 575.0, 324.0, 187.0, 139.0, 80.0, 49.0, 32.0, 25.0, 19.0, 12.0, 12.0, 9.0, 4.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.19677734375, -0.1910991668701172, -0.18542098999023438, -0.17974281311035156, -0.17406463623046875, -0.16838645935058594, -0.16270828247070312, -0.1570301055908203, -0.1513519287109375, -0.1456737518310547, -0.13999557495117188, -0.13431739807128906, -0.12863922119140625, -0.12296104431152344, -0.11728286743164062, -0.11160469055175781, -0.105926513671875, -0.10024833679199219, -0.09457015991210938, -0.08889198303222656, -0.08321380615234375, -0.07753562927246094, -0.07185745239257812, -0.06617927551269531, -0.0605010986328125, -0.05482292175292969, -0.049144744873046875, -0.04346656799316406, -0.03778839111328125, -0.03211021423339844, -0.026432037353515625, -0.020753860473632812, -0.01507568359375, -0.009397506713867188, -0.003719329833984375, 0.0019588470458984375, 0.00763702392578125, 0.013315200805664062, 0.018993377685546875, 0.024671554565429688, 0.0303497314453125, 0.03602790832519531, 0.041706085205078125, 0.04738426208496094, 0.05306243896484375, 0.05874061584472656, 0.06441879272460938, 0.07009696960449219, 0.075775146484375, 0.08145332336425781, 0.08713150024414062, 0.09280967712402344, 0.09848785400390625, 0.10416603088378906, 0.10984420776367188, 0.11552238464355469, 0.1212005615234375, 0.1268787384033203, 0.13255691528320312, 0.13823509216308594, 0.14391326904296875, 0.14959144592285156, 0.15526962280273438, 0.1609477996826172, 0.1666259765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 8.0, 23.0, 37.0, 40.0, 42.0, 100.0, 147.0, 242.0, 443.0, 847.0, 854.0, 437.0, 275.0, 193.0, 133.0, 72.0, 54.0, 36.0, 19.0, 14.0, 17.0, 4.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2088623046875, -0.20018959045410156, -0.19151687622070312, -0.1828441619873047, -0.17417144775390625, -0.1654987335205078, -0.15682601928710938, -0.14815330505371094, -0.1394805908203125, -0.13080787658691406, -0.12213516235351562, -0.11346244812011719, -0.10478973388671875, -0.09611701965332031, -0.08744430541992188, -0.07877159118652344, -0.070098876953125, -0.06142616271972656, -0.052753448486328125, -0.04408073425292969, -0.03540802001953125, -0.026735305786132812, -0.018062591552734375, -0.009389877319335938, -0.0007171630859375, 0.007955551147460938, 0.016628265380859375, 0.025300979614257812, 0.03397369384765625, 0.04264640808105469, 0.051319122314453125, 0.05999183654785156, 0.06866455078125, 0.07733726501464844, 0.08600997924804688, 0.09468269348144531, 0.10335540771484375, 0.11202812194824219, 0.12070083618164062, 0.12937355041503906, 0.1380462646484375, 0.14671897888183594, 0.15539169311523438, 0.1640644073486328, 0.17273712158203125, 0.1814098358154297, 0.19008255004882812, 0.19875526428222656, 0.207427978515625, 0.21610069274902344, 0.22477340698242188, 0.2334461212158203, 0.24211883544921875, 0.2507915496826172, 0.2594642639160156, 0.26813697814941406, 0.2768096923828125, 0.28548240661621094, 0.2941551208496094, 0.3028278350830078, 0.31150054931640625, 0.3201732635498047, 0.3288459777832031, 0.33751869201660156, 0.34619140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 11.0, 11.0, 20.0, 42.0, 43.0, 61.0, 65.0, 68.0, 88.0, 76.0, 97.0, 95.0, 67.0, 62.0, 58.0, 38.0, 29.0, 25.0, 12.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7179831862449646, -0.6891993284225464, -0.6604154706001282, -0.63163161277771, -0.6028477549552917, -0.5740638971328735, -0.5452800393104553, -0.5164961814880371, -0.4877123236656189, -0.4589284658432007, -0.43014460802078247, -0.40136075019836426, -0.37257689237594604, -0.34379303455352783, -0.3150091767311096, -0.2862253189086914, -0.2574414610862732, -0.22865760326385498, -0.19987374544143677, -0.17108988761901855, -0.14230602979660034, -0.11352217197418213, -0.08473831415176392, -0.0559544563293457, -0.02717059850692749, 0.0016132593154907227, 0.030397117137908936, 0.05918097496032715, 0.08796483278274536, 0.11674869060516357, 0.1455325484275818, 0.17431640625, 0.203100323677063, 0.2318841814994812, 0.2606680393218994, 0.2894518971443176, 0.31823575496673584, 0.34701961278915405, 0.37580347061157227, 0.4045873284339905, 0.4333711862564087, 0.4621550440788269, 0.4909389019012451, 0.5197227597236633, 0.5485066175460815, 0.5772904753684998, 0.606074333190918, 0.6348581910133362, 0.6636420488357544, 0.6924259066581726, 0.7212097644805908, 0.749993622303009, 0.7787774801254272, 0.8075613379478455, 0.8363451957702637, 0.8651290535926819, 0.8939129114151001, 0.9226967692375183, 0.9514806270599365, 0.9802644848823547, 1.009048342704773, 1.037832260131836, 1.0666160583496094, 1.0953998565673828, 1.1241837739944458]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 2.0, 4.0, 9.0, 7.0, 8.0, 11.0, 15.0, 11.0, 14.0, 16.0, 26.0, 20.0, 23.0, 33.0, 47.0, 38.0, 38.0, 44.0, 36.0, 52.0, 40.0, 42.0, 46.0, 37.0, 46.0, 39.0, 42.0, 25.0, 42.0, 26.0, 20.0, 24.0, 17.0, 17.0, 20.0, 22.0, 6.0, 6.0, 10.0, 5.0, 1.0, 5.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.7060321569442749, -0.6867572665214539, -0.6674823760986328, -0.648207426071167, -0.628932535648346, -0.6096576452255249, -0.5903827548027039, -0.5711078643798828, -0.551832914352417, -0.532558023929596, -0.5132831335067749, -0.49400821328163147, -0.47473329305648804, -0.455458402633667, -0.43618351221084595, -0.4169086217880249, -0.39763373136520386, -0.3783588409423828, -0.3590839207172394, -0.33980903029441833, -0.3205341100692749, -0.30125921964645386, -0.2819843292236328, -0.26270943880081177, -0.24343451857566833, -0.2241596132516861, -0.20488470792770386, -0.1856098175048828, -0.16633491218090057, -0.14706000685691833, -0.1277851164340973, -0.10851021111011505, -0.08923536539077759, -0.06996046006679535, -0.05068556219339371, -0.03141066059470177, -0.012135758996009827, 0.007139146327972412, 0.026414044201374054, 0.045688942074775696, 0.06496384739875793, 0.08423875272274017, 0.10351365059614182, 0.12278854846954346, 0.1420634537935257, 0.16133835911750793, 0.18061324954032898, 0.19988815486431122, 0.21916306018829346, 0.2384379655122757, 0.25771287083625793, 0.276987761259079, 0.2962626814842224, 0.31553757190704346, 0.3348124623298645, 0.35408735275268555, 0.373362272977829, 0.39263716340065, 0.41191208362579346, 0.4311869740486145, 0.45046186447143555, 0.469736784696579, 0.4890116751194, 0.5082865953445435, 0.5275614857673645]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 14.0, 15.0, 12.0, 36.0, 37.0, 58.0, 78.0, 138.0, 182.0, 290.0, 441.0, 648.0, 1023.0, 1579.0, 2470.0, 3808.0, 6063.0, 9441.0, 15051.0, 24500.0, 40044.0, 68297.0, 119027.0, 194994.0, 216051.0, 140948.0, 80324.0, 47138.0, 28047.0, 17388.0, 10976.0, 6989.0, 4484.0, 2800.0, 1795.0, 1152.0, 763.0, 475.0, 306.0, 225.0, 145.0, 98.0, 56.0, 41.0, 33.0, 23.0, 19.0, 6.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.10882568359375, -0.10544109344482422, -0.10205650329589844, -0.09867191314697266, -0.09528732299804688, -0.0919027328491211, -0.08851814270019531, -0.08513355255126953, -0.08174896240234375, -0.07836437225341797, -0.07497978210449219, -0.0715951919555664, -0.06821060180664062, -0.06482601165771484, -0.06144142150878906, -0.05805683135986328, -0.0546722412109375, -0.05128765106201172, -0.04790306091308594, -0.044518470764160156, -0.041133880615234375, -0.037749290466308594, -0.03436470031738281, -0.03098011016845703, -0.02759552001953125, -0.02421092987060547, -0.020826339721679688, -0.017441749572753906, -0.014057159423828125, -0.010672569274902344, -0.0072879791259765625, -0.0039033889770507812, -0.000518798828125, 0.0028657913208007812, 0.0062503814697265625, 0.009634971618652344, 0.013019561767578125, 0.016404151916503906, 0.019788742065429688, 0.02317333221435547, 0.02655792236328125, 0.02994251251220703, 0.03332710266113281, 0.036711692810058594, 0.040096282958984375, 0.043480873107910156, 0.04686546325683594, 0.05025005340576172, 0.0536346435546875, 0.05701923370361328, 0.06040382385253906, 0.06378841400146484, 0.06717300415039062, 0.0705575942993164, 0.07394218444824219, 0.07732677459716797, 0.08071136474609375, 0.08409595489501953, 0.08748054504394531, 0.0908651351928711, 0.09424972534179688, 0.09763431549072266, 0.10101890563964844, 0.10440349578857422, 0.1077880859375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 5.0, 7.0, 7.0, 9.0, 9.0, 12.0, 8.0, 19.0, 21.0, 17.0, 24.0, 27.0, 29.0, 36.0, 40.0, 45.0, 42.0, 46.0, 42.0, 34.0, 45.0, 49.0, 31.0, 42.0, 45.0, 31.0, 42.0, 33.0, 24.0, 25.0, 21.0, 16.0, 20.0, 13.0, 23.0, 10.0, 11.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.092041015625, -0.08898544311523438, -0.08592987060546875, -0.08287429809570312, -0.0798187255859375, -0.07676315307617188, -0.07370758056640625, -0.07065200805664062, -0.067596435546875, -0.06454086303710938, -0.06148529052734375, -0.058429718017578125, -0.0553741455078125, -0.052318572998046875, -0.04926300048828125, -0.046207427978515625, -0.04315185546875, -0.040096282958984375, -0.03704071044921875, -0.033985137939453125, -0.0309295654296875, -0.027873992919921875, -0.02481842041015625, -0.021762847900390625, -0.018707275390625, -0.015651702880859375, -0.01259613037109375, -0.009540557861328125, -0.0064849853515625, -0.003429412841796875, -0.00037384033203125, 0.002681732177734375, 0.0057373046875, 0.008792877197265625, 0.01184844970703125, 0.014904022216796875, 0.0179595947265625, 0.021015167236328125, 0.02407073974609375, 0.027126312255859375, 0.030181884765625, 0.033237457275390625, 0.03629302978515625, 0.039348602294921875, 0.0424041748046875, 0.045459747314453125, 0.04851531982421875, 0.051570892333984375, 0.05462646484375, 0.057682037353515625, 0.06073760986328125, 0.06379318237304688, 0.0668487548828125, 0.06990432739257812, 0.07295989990234375, 0.07601547241210938, 0.079071044921875, 0.08212661743164062, 0.08518218994140625, 0.08823776245117188, 0.0912933349609375, 0.09434890747070312, 0.09740447998046875, 0.10046005249023438, 0.103515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 7.0, 5.0, 6.0, 8.0, 15.0, 28.0, 33.0, 34.0, 50.0, 64.0, 118.0, 167.0, 280.0, 501.0, 1220.0, 3540.0, 13381.0, 52740.0, 228368.0, 530576.0, 163788.0, 38678.0, 9917.0, 2841.0, 968.0, 425.0, 251.0, 166.0, 105.0, 69.0, 61.0, 37.0, 24.0, 14.0, 17.0, 19.0, 8.0, 7.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3583984375, -0.3479766845703125, -0.337554931640625, -0.3271331787109375, -0.31671142578125, -0.3062896728515625, -0.295867919921875, -0.2854461669921875, -0.2750244140625, -0.2646026611328125, -0.254180908203125, -0.2437591552734375, -0.23333740234375, -0.2229156494140625, -0.212493896484375, -0.2020721435546875, -0.191650390625, -0.1812286376953125, -0.170806884765625, -0.1603851318359375, -0.14996337890625, -0.1395416259765625, -0.129119873046875, -0.1186981201171875, -0.1082763671875, -0.0978546142578125, -0.087432861328125, -0.0770111083984375, -0.06658935546875, -0.0561676025390625, -0.045745849609375, -0.0353240966796875, -0.02490234375, -0.0144805908203125, -0.004058837890625, 0.0063629150390625, 0.01678466796875, 0.0272064208984375, 0.037628173828125, 0.0480499267578125, 0.0584716796875, 0.0688934326171875, 0.079315185546875, 0.0897369384765625, 0.10015869140625, 0.1105804443359375, 0.121002197265625, 0.1314239501953125, 0.141845703125, 0.1522674560546875, 0.162689208984375, 0.1731109619140625, 0.18353271484375, 0.1939544677734375, 0.204376220703125, 0.2147979736328125, 0.2252197265625, 0.2356414794921875, 0.246063232421875, 0.2564849853515625, 0.26690673828125, 0.2773284912109375, 0.287750244140625, 0.2981719970703125, 0.30859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 3.0, 7.0, 4.0, 8.0, 7.0, 14.0, 17.0, 11.0, 13.0, 16.0, 16.0, 15.0, 26.0, 25.0, 30.0, 26.0, 37.0, 37.0, 39.0, 36.0, 60.0, 42.0, 39.0, 38.0, 33.0, 45.0, 27.0, 29.0, 45.0, 24.0, 25.0, 25.0, 26.0, 23.0, 22.0, 12.0, 15.0, 14.0, 10.0, 9.0, 9.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2918434143066406, -0.28217315673828125, -0.2725028991699219, -0.2628326416015625, -0.2531623840332031, -0.24349212646484375, -0.23382186889648438, -0.224151611328125, -0.21448135375976562, -0.20481109619140625, -0.19514083862304688, -0.1854705810546875, -0.17580032348632812, -0.16613006591796875, -0.15645980834960938, -0.14678955078125, -0.13711929321289062, -0.12744903564453125, -0.11777877807617188, -0.1081085205078125, -0.09843826293945312, -0.08876800537109375, -0.07909774780273438, -0.069427490234375, -0.059757232666015625, -0.05008697509765625, -0.040416717529296875, -0.0307464599609375, -0.021076202392578125, -0.01140594482421875, -0.001735687255859375, 0.0079345703125, 0.017604827880859375, 0.02727508544921875, 0.036945343017578125, 0.0466156005859375, 0.056285858154296875, 0.06595611572265625, 0.07562637329101562, 0.085296630859375, 0.09496688842773438, 0.10463714599609375, 0.11430740356445312, 0.1239776611328125, 0.13364791870117188, 0.14331817626953125, 0.15298843383789062, 0.16265869140625, 0.17232894897460938, 0.18199920654296875, 0.19166946411132812, 0.2013397216796875, 0.21100997924804688, 0.22068023681640625, 0.23035049438476562, 0.240020751953125, 0.24969100952148438, 0.25936126708984375, 0.2690315246582031, 0.2787017822265625, 0.2883720397949219, 0.29804229736328125, 0.3077125549316406, 0.3173828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 8.0, 4.0, 4.0, 9.0, 10.0, 16.0, 21.0, 41.0, 62.0, 111.0, 163.0, 276.0, 464.0, 853.0, 1563.0, 3000.0, 5891.0, 12000.0, 24741.0, 53800.0, 122987.0, 280158.0, 297353.0, 133822.0, 58071.0, 26899.0, 12659.0, 6418.0, 3224.0, 1712.0, 907.0, 516.0, 296.0, 184.0, 105.0, 70.0, 47.0, 25.0, 23.0, 15.0, 15.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.09271240234375, -0.0902099609375, -0.08770751953125, -0.085205078125, -0.08270263671875, -0.0802001953125, -0.07769775390625, -0.0751953125, -0.07269287109375, -0.0701904296875, -0.06768798828125, -0.065185546875, -0.06268310546875, -0.0601806640625, -0.05767822265625, -0.05517578125, -0.05267333984375, -0.0501708984375, -0.04766845703125, -0.045166015625, -0.04266357421875, -0.0401611328125, -0.03765869140625, -0.03515625, -0.03265380859375, -0.0301513671875, -0.02764892578125, -0.025146484375, -0.02264404296875, -0.0201416015625, -0.01763916015625, -0.01513671875, -0.01263427734375, -0.0101318359375, -0.00762939453125, -0.005126953125, -0.00262451171875, -0.0001220703125, 0.00238037109375, 0.0048828125, 0.00738525390625, 0.0098876953125, 0.01239013671875, 0.014892578125, 0.01739501953125, 0.0198974609375, 0.02239990234375, 0.02490234375, 0.02740478515625, 0.0299072265625, 0.03240966796875, 0.034912109375, 0.03741455078125, 0.0399169921875, 0.04241943359375, 0.044921875, 0.04742431640625, 0.0499267578125, 0.05242919921875, 0.054931640625, 0.05743408203125, 0.0599365234375, 0.06243896484375, 0.06494140625, 0.06744384765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 7.0, 7.0, 8.0, 6.0, 16.0, 9.0, 21.0, 26.0, 28.0, 26.0, 41.0, 54.0, 81.0, 78.0, 81.0, 72.0, 95.0, 61.0, 55.0, 59.0, 33.0, 28.0, 28.0, 16.0, 9.0, 8.0, 10.0, 13.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.8950551748275757e-05, -1.8231570720672607e-05, -1.7512589693069458e-05, -1.679360866546631e-05, -1.607462763786316e-05, -1.535564661026001e-05, -1.463666558265686e-05, -1.3917684555053711e-05, -1.3198703527450562e-05, -1.2479722499847412e-05, -1.1760741472244263e-05, -1.1041760444641113e-05, -1.0322779417037964e-05, -9.603798389434814e-06, -8.884817361831665e-06, -8.165836334228516e-06, -7.446855306625366e-06, -6.727874279022217e-06, -6.008893251419067e-06, -5.289912223815918e-06, -4.5709311962127686e-06, -3.851950168609619e-06, -3.1329691410064697e-06, -2.4139881134033203e-06, -1.695007085800171e-06, -9.760260581970215e-07, -2.5704503059387207e-07, 4.6193599700927734e-07, 1.1809170246124268e-06, 1.8998980522155762e-06, 2.6188790798187256e-06, 3.337860107421875e-06, 4.056841135025024e-06, 4.775822162628174e-06, 5.494803190231323e-06, 6.213784217834473e-06, 6.932765245437622e-06, 7.651746273040771e-06, 8.370727300643921e-06, 9.08970832824707e-06, 9.80868935585022e-06, 1.0527670383453369e-05, 1.1246651411056519e-05, 1.1965632438659668e-05, 1.2684613466262817e-05, 1.3403594493865967e-05, 1.4122575521469116e-05, 1.4841556549072266e-05, 1.5560537576675415e-05, 1.6279518604278564e-05, 1.6998499631881714e-05, 1.7717480659484863e-05, 1.8436461687088013e-05, 1.9155442714691162e-05, 1.987442374229431e-05, 2.059340476989746e-05, 2.131238579750061e-05, 2.203136682510376e-05, 2.275034785270691e-05, 2.346932888031006e-05, 2.4188309907913208e-05, 2.4907290935516357e-05, 2.5626271963119507e-05, 2.6345252990722656e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 6.0, 21.0, 25.0, 20.0, 44.0, 60.0, 92.0, 119.0, 256.0, 388.0, 799.0, 1476.0, 3159.0, 7165.0, 17992.0, 45949.0, 115350.0, 273312.0, 328109.0, 152045.0, 60644.0, 23916.0, 9785.0, 3872.0, 1782.0, 896.0, 470.0, 277.0, 163.0, 121.0, 64.0, 43.0, 28.0, 24.0, 17.0, 17.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.07962989807128906, -0.07680130004882812, -0.07397270202636719, -0.07114410400390625, -0.06831550598144531, -0.06548690795898438, -0.06265830993652344, -0.0598297119140625, -0.05700111389160156, -0.054172515869140625, -0.05134391784667969, -0.04851531982421875, -0.04568672180175781, -0.042858123779296875, -0.04002952575683594, -0.037200927734375, -0.03437232971191406, -0.031543731689453125, -0.028715133666992188, -0.02588653564453125, -0.023057937622070312, -0.020229339599609375, -0.017400741577148438, -0.0145721435546875, -0.011743545532226562, -0.008914947509765625, -0.0060863494873046875, -0.00325775146484375, -0.0004291534423828125, 0.002399444580078125, 0.0052280426025390625, 0.008056640625, 0.010885238647460938, 0.013713836669921875, 0.016542434692382812, 0.01937103271484375, 0.022199630737304688, 0.025028228759765625, 0.027856826782226562, 0.0306854248046875, 0.03351402282714844, 0.036342620849609375, 0.03917121887207031, 0.04199981689453125, 0.04482841491699219, 0.047657012939453125, 0.05048561096191406, 0.053314208984375, 0.05614280700683594, 0.058971405029296875, 0.06180000305175781, 0.06462860107421875, 0.06745719909667969, 0.07028579711914062, 0.07311439514160156, 0.0759429931640625, 0.07877159118652344, 0.08160018920898438, 0.08442878723144531, 0.08725738525390625, 0.09008598327636719, 0.09291458129882812, 0.09574317932128906, 0.09857177734375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 12.0, 7.0, 6.0, 17.0, 15.0, 16.0, 18.0, 18.0, 20.0, 21.0, 46.0, 34.0, 37.0, 53.0, 51.0, 51.0, 65.0, 45.0, 59.0, 56.0, 52.0, 42.0, 38.0, 32.0, 22.0, 12.0, 22.0, 19.0, 8.0, 14.0, 11.0, 16.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05950927734375, -0.057511329650878906, -0.05551338195800781, -0.05351543426513672, -0.051517486572265625, -0.04951953887939453, -0.04752159118652344, -0.045523643493652344, -0.04352569580078125, -0.041527748107910156, -0.03952980041503906, -0.03753185272216797, -0.035533905029296875, -0.03353595733642578, -0.03153800964355469, -0.029540061950683594, -0.0275421142578125, -0.025544166564941406, -0.023546218872070312, -0.02154827117919922, -0.019550323486328125, -0.01755237579345703, -0.015554428100585938, -0.013556480407714844, -0.01155853271484375, -0.009560585021972656, -0.0075626373291015625, -0.005564689636230469, -0.003566741943359375, -0.0015687942504882812, 0.0004291534423828125, 0.0024271011352539062, 0.004425048828125, 0.006422996520996094, 0.008420944213867188, 0.010418891906738281, 0.012416839599609375, 0.014414787292480469, 0.016412734985351562, 0.018410682678222656, 0.02040863037109375, 0.022406578063964844, 0.024404525756835938, 0.02640247344970703, 0.028400421142578125, 0.03039836883544922, 0.03239631652832031, 0.034394264221191406, 0.0363922119140625, 0.038390159606933594, 0.04038810729980469, 0.04238605499267578, 0.044384002685546875, 0.04638195037841797, 0.04837989807128906, 0.050377845764160156, 0.05237579345703125, 0.054373741149902344, 0.05637168884277344, 0.05836963653564453, 0.060367584228515625, 0.06236553192138672, 0.06436347961425781, 0.0663614273071289, 0.068359375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 10.0, 23.0, 33.0, 51.0, 88.0, 112.0, 144.0, 142.0, 133.0, 93.0, 66.0, 44.0, 26.0, 17.0, 8.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.3549394607543945, -2.309924840927124, -2.2649102210998535, -2.219895601272583, -2.1748809814453125, -2.129866361618042, -2.0848517417907715, -2.03983736038208, -1.99482262134552, -1.9498080015182495, -1.904793381690979, -1.8597787618637085, -1.8147642612457275, -1.769749641418457, -1.7247350215911865, -1.679720401763916, -1.6347057819366455, -1.589691162109375, -1.5446765422821045, -1.499661922454834, -1.4546473026275635, -1.4096328020095825, -1.364618182182312, -1.3196035623550415, -1.274588942527771, -1.2295743227005005, -1.18455970287323, -1.1395450830459595, -1.0945305824279785, -1.049515962600708, -1.0045013427734375, -0.959486722946167, -0.9144719839096069, -0.8694573640823364, -0.8244427442550659, -0.7794281840324402, -0.7344135642051697, -0.6893989443778992, -0.6443843841552734, -0.5993697643280029, -0.5543551445007324, -0.5093405246734619, -0.4643259346485138, -0.4193113446235657, -0.37429672479629517, -0.32928210496902466, -0.28426751494407654, -0.23925292491912842, -0.1942383050918579, -0.1492237001657486, -0.10420909523963928, -0.05919449031352997, -0.014179885387420654, 0.03083471953868866, 0.07584932446479797, 0.1208639144897461, 0.1658785343170166, 0.21089313924312592, 0.25590774416923523, 0.30092233419418335, 0.34593695402145386, 0.39095157384872437, 0.4359661638736725, 0.4809807538986206, 0.5259953737258911]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 12.0, 13.0, 15.0, 7.0, 22.0, 12.0, 17.0, 23.0, 22.0, 19.0, 22.0, 37.0, 31.0, 31.0, 30.0, 41.0, 32.0, 35.0, 35.0, 40.0, 37.0, 42.0, 42.0, 45.0, 40.0, 37.0, 29.0, 31.0, 22.0, 14.0, 16.0, 14.0, 20.0, 18.0, 13.0, 12.0, 9.0, 7.0, 8.0, 7.0, 6.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.9691280126571655, -0.9407927989959717, -0.9124576449394226, -0.8841224312782288, -0.8557872176170349, -0.8274520635604858, -0.799116849899292, -0.7707816362380981, -0.7424464225769043, -0.7141112089157104, -0.6857760548591614, -0.6574408411979675, -0.6291056275367737, -0.6007704734802246, -0.5724352598190308, -0.5441000461578369, -0.5157648921012878, -0.4874297082424164, -0.45909449458122253, -0.4307593107223511, -0.4024240970611572, -0.37408891320228577, -0.3457537293434143, -0.31741851568222046, -0.289083331823349, -0.26074814796447754, -0.2324129343032837, -0.20407775044441223, -0.17574255168437958, -0.14740735292434692, -0.11907216906547546, -0.09073697030544281, -0.06240183115005493, -0.034066636115312576, -0.005731441080570221, 0.022603750228881836, 0.05093894898891449, 0.07927414774894714, 0.1076093316078186, 0.13594453036785126, 0.1642797291278839, 0.19261492788791656, 0.22095012664794922, 0.24928531050682068, 0.27762049436569214, 0.305955708026886, 0.33429089188575745, 0.3626260757446289, 0.39096128940582275, 0.4192964732646942, 0.44763168692588806, 0.4759668707847595, 0.5043020844459534, 0.5326372385025024, 0.5609724521636963, 0.5893076658248901, 0.617642879486084, 0.6459780931472778, 0.6743132472038269, 0.7026484608650208, 0.7309836745262146, 0.7593188285827637, 0.7876540422439575, 0.8159892559051514, 0.8443244099617004]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 12.0, 23.0, 37.0, 62.0, 69.0, 116.0, 186.0, 301.0, 566.0, 914.0, 1681.0, 2881.0, 5438.0, 10303.0, 19970.0, 40644.0, 87958.0, 210742.0, 600209.0, 1556215.0, 1042441.0, 356942.0, 136372.0, 59774.0, 29248.0, 14404.0, 7658.0, 3963.0, 2213.0, 1198.0, 665.0, 413.0, 244.0, 140.0, 94.0, 63.0, 36.0, 24.0, 18.0, 9.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11224365234375, -0.10870933532714844, -0.10517501831054688, -0.10164070129394531, -0.09810638427734375, -0.09457206726074219, -0.09103775024414062, -0.08750343322753906, -0.0839691162109375, -0.08043479919433594, -0.07690048217773438, -0.07336616516113281, -0.06983184814453125, -0.06629753112792969, -0.06276321411132812, -0.05922889709472656, -0.055694580078125, -0.05216026306152344, -0.048625946044921875, -0.04509162902832031, -0.04155731201171875, -0.03802299499511719, -0.034488677978515625, -0.030954360961914062, -0.0274200439453125, -0.023885726928710938, -0.020351409912109375, -0.016817092895507812, -0.01328277587890625, -0.009748458862304688, -0.006214141845703125, -0.0026798248291015625, 0.0008544921875, 0.0043888092041015625, 0.007923126220703125, 0.011457443237304688, 0.01499176025390625, 0.018526077270507812, 0.022060394287109375, 0.025594711303710938, 0.0291290283203125, 0.03266334533691406, 0.036197662353515625, 0.03973197937011719, 0.04326629638671875, 0.04680061340332031, 0.050334930419921875, 0.05386924743652344, 0.057403564453125, 0.06093788146972656, 0.06447219848632812, 0.06800651550292969, 0.07154083251953125, 0.07507514953613281, 0.07860946655273438, 0.08214378356933594, 0.0856781005859375, 0.08921241760253906, 0.09274673461914062, 0.09628105163574219, 0.09981536865234375, 0.10334968566894531, 0.10688400268554688, 0.11041831970214844, 0.11395263671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 13.0, 7.0, 10.0, 12.0, 13.0, 16.0, 21.0, 23.0, 21.0, 36.0, 29.0, 31.0, 39.0, 40.0, 49.0, 40.0, 44.0, 43.0, 42.0, 56.0, 50.0, 41.0, 44.0, 40.0, 39.0, 25.0, 31.0, 24.0, 20.0, 15.0, 19.0, 13.0, 8.0, 15.0, 8.0, 12.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10894775390625, -0.10504627227783203, -0.10114479064941406, -0.0972433090209961, -0.09334182739257812, -0.08944034576416016, -0.08553886413574219, -0.08163738250732422, -0.07773590087890625, -0.07383441925048828, -0.06993293762207031, -0.06603145599365234, -0.062129974365234375, -0.058228492736816406, -0.05432701110839844, -0.05042552947998047, -0.0465240478515625, -0.04262256622314453, -0.03872108459472656, -0.034819602966308594, -0.030918121337890625, -0.027016639709472656, -0.023115158081054688, -0.01921367645263672, -0.01531219482421875, -0.011410713195800781, -0.0075092315673828125, -0.0036077499389648438, 0.000293731689453125, 0.004195213317871094, 0.008096694946289062, 0.011998176574707031, 0.015899658203125, 0.01980113983154297, 0.023702621459960938, 0.027604103088378906, 0.031505584716796875, 0.035407066345214844, 0.03930854797363281, 0.04321002960205078, 0.04711151123046875, 0.05101299285888672, 0.05491447448730469, 0.058815956115722656, 0.06271743774414062, 0.0666189193725586, 0.07052040100097656, 0.07442188262939453, 0.0783233642578125, 0.08222484588623047, 0.08612632751464844, 0.0900278091430664, 0.09392929077148438, 0.09783077239990234, 0.10173225402832031, 0.10563373565673828, 0.10953521728515625, 0.11343669891357422, 0.11733818054199219, 0.12123966217041016, 0.12514114379882812, 0.1290426254272461, 0.13294410705566406, 0.13684558868408203, 0.1407470703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 6.0, 11.0, 11.0, 15.0, 30.0, 47.0, 63.0, 92.0, 149.0, 252.0, 425.0, 759.0, 1273.0, 2455.0, 4547.0, 8794.0, 17678.0, 36095.0, 77088.0, 173153.0, 433088.0, 1291568.0, 1354873.0, 454928.0, 181546.0, 80245.0, 37627.0, 18107.0, 9018.0, 4657.0, 2447.0, 1298.0, 790.0, 437.0, 247.0, 148.0, 102.0, 67.0, 42.0, 33.0, 20.0, 16.0, 9.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1562786102294922, -0.15154647827148438, -0.14681434631347656, -0.14208221435546875, -0.13735008239746094, -0.13261795043945312, -0.1278858184814453, -0.1231536865234375, -0.11842155456542969, -0.11368942260742188, -0.10895729064941406, -0.10422515869140625, -0.09949302673339844, -0.09476089477539062, -0.09002876281738281, -0.085296630859375, -0.08056449890136719, -0.07583236694335938, -0.07110023498535156, -0.06636810302734375, -0.06163597106933594, -0.056903839111328125, -0.05217170715332031, -0.0474395751953125, -0.04270744323730469, -0.037975311279296875, -0.03324317932128906, -0.02851104736328125, -0.023778915405273438, -0.019046783447265625, -0.014314651489257812, -0.00958251953125, -0.0048503875732421875, -0.000118255615234375, 0.0046138763427734375, 0.00934600830078125, 0.014078140258789062, 0.018810272216796875, 0.023542404174804688, 0.0282745361328125, 0.03300666809082031, 0.037738800048828125, 0.04247093200683594, 0.04720306396484375, 0.05193519592285156, 0.056667327880859375, 0.06139945983886719, 0.066131591796875, 0.07086372375488281, 0.07559585571289062, 0.08032798767089844, 0.08506011962890625, 0.08979225158691406, 0.09452438354492188, 0.09925651550292969, 0.1039886474609375, 0.10872077941894531, 0.11345291137695312, 0.11818504333496094, 0.12291717529296875, 0.12764930725097656, 0.13238143920898438, 0.1371135711669922, 0.141845703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 11.0, 15.0, 23.0, 31.0, 37.0, 47.0, 66.0, 86.0, 104.0, 165.0, 202.0, 327.0, 472.0, 612.0, 528.0, 385.0, 263.0, 178.0, 129.0, 92.0, 60.0, 72.0, 37.0, 29.0, 25.0, 15.0, 14.0, 5.0, 7.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.2237548828125, -0.2166748046875, -0.2095947265625, -0.2025146484375, -0.1954345703125, -0.1883544921875, -0.1812744140625, -0.1741943359375, -0.1671142578125, -0.1600341796875, -0.1529541015625, -0.1458740234375, -0.1387939453125, -0.1317138671875, -0.1246337890625, -0.1175537109375, -0.1104736328125, -0.1033935546875, -0.0963134765625, -0.0892333984375, -0.0821533203125, -0.0750732421875, -0.0679931640625, -0.0609130859375, -0.0538330078125, -0.0467529296875, -0.0396728515625, -0.0325927734375, -0.0255126953125, -0.0184326171875, -0.0113525390625, -0.0042724609375, 0.0028076171875, 0.0098876953125, 0.0169677734375, 0.0240478515625, 0.0311279296875, 0.0382080078125, 0.0452880859375, 0.0523681640625, 0.0594482421875, 0.0665283203125, 0.0736083984375, 0.0806884765625, 0.0877685546875, 0.0948486328125, 0.1019287109375, 0.1090087890625, 0.1160888671875, 0.1231689453125, 0.1302490234375, 0.1373291015625, 0.1444091796875, 0.1514892578125, 0.1585693359375, 0.1656494140625, 0.1727294921875, 0.1798095703125, 0.1868896484375, 0.1939697265625, 0.2010498046875, 0.2081298828125, 0.2152099609375, 0.2222900390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 11.0, 14.0, 27.0, 33.0, 47.0, 57.0, 76.0, 83.0, 80.0, 94.0, 87.0, 82.0, 77.0, 68.0, 50.0, 34.0, 27.0, 20.0, 10.0, 3.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2320847511291504, -1.2008845806121826, -1.1696845293045044, -1.1384843587875366, -1.1072843074798584, -1.0760841369628906, -1.0448839664459229, -1.0136839151382446, -0.9824837446212769, -0.9512836337089539, -0.9200835227966309, -0.8888833522796631, -0.8576832413673401, -0.8264831304550171, -0.7952830195426941, -0.7640829086303711, -0.7328827381134033, -0.7016826272010803, -0.6704825162887573, -0.6392823457717896, -0.6080822348594666, -0.5768821239471436, -0.5456820130348206, -0.5144819021224976, -0.48328179121017456, -0.45208168029785156, -0.4208815395832062, -0.3896814286708832, -0.3584812879562378, -0.3272811770439148, -0.2960810661315918, -0.2648809254169464, -0.23368078470230103, -0.20248065888881683, -0.17128053307533264, -0.14008042216300964, -0.10888028889894485, -0.07768017053604126, -0.04648004472255707, -0.015279918909072876, 0.015920206904411316, 0.04712033271789551, 0.0783204585313797, 0.1095205768942833, 0.1407206952571869, 0.17192082107067108, 0.20312094688415527, 0.23432107269763947, 0.26552119851112366, 0.29672130942344666, 0.32792145013809204, 0.35912156105041504, 0.3903217017650604, 0.4215218126773834, 0.4527219533920288, 0.4839220643043518, 0.5151221752166748, 0.5463222861289978, 0.5775223970413208, 0.6087225675582886, 0.6399226784706116, 0.6711227893829346, 0.7023229002952576, 0.7335230112075806, 0.7647231817245483]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 1.0, 3.0, 11.0, 2.0, 9.0, 10.0, 11.0, 9.0, 8.0, 20.0, 20.0, 20.0, 20.0, 26.0, 22.0, 28.0, 31.0, 43.0, 29.0, 39.0, 34.0, 44.0, 30.0, 35.0, 50.0, 34.0, 45.0, 39.0, 34.0, 27.0, 20.0, 31.0, 27.0, 25.0, 27.0, 21.0, 16.0, 17.0, 18.0, 12.0, 10.0, 6.0, 9.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.5972824096679688, -0.5777754187583923, -0.5582684278488159, -0.5387613773345947, -0.5192543864250183, -0.4997473955154419, -0.4802403748035431, -0.4607333540916443, -0.44122636318206787, -0.42171937227249146, -0.40221235156059265, -0.38270533084869385, -0.36319833993911743, -0.343691349029541, -0.3241843283176422, -0.3046773076057434, -0.285170316696167, -0.2656633257865906, -0.24615630507469177, -0.22664929926395416, -0.20714229345321655, -0.18763528764247894, -0.16812828183174133, -0.14862127602100372, -0.1291142702102661, -0.1096072643995285, -0.0901002585887909, -0.07059325277805328, -0.051086246967315674, -0.031579241156578064, -0.012072235345840454, 0.007434770464897156, 0.02694183588027954, 0.04644884169101715, 0.06595584750175476, 0.08546285331249237, 0.10496985912322998, 0.12447686493396759, 0.1439838707447052, 0.1634908765554428, 0.18299788236618042, 0.20250488817691803, 0.22201189398765564, 0.24151889979839325, 0.26102590560913086, 0.2805328965187073, 0.3000399172306061, 0.3195469379425049, 0.3390539288520813, 0.3585609197616577, 0.3780679404735565, 0.3975749611854553, 0.41708195209503174, 0.43658894300460815, 0.45609596371650696, 0.47560298442840576, 0.4951099753379822, 0.5146169662475586, 0.5341240167617798, 0.5536310076713562, 0.5731379985809326, 0.592644989490509, 0.6121519804000854, 0.6316590309143066, 0.6511660218238831]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 11.0, 14.0, 17.0, 34.0, 42.0, 65.0, 90.0, 135.0, 169.0, 306.0, 465.0, 618.0, 939.0, 1534.0, 2260.0, 3533.0, 5439.0, 8378.0, 13110.0, 21035.0, 35799.0, 67459.0, 147278.0, 288174.0, 225953.0, 101065.0, 49497.0, 27861.0, 16857.0, 10595.0, 6844.0, 4492.0, 2872.0, 1911.0, 1219.0, 854.0, 521.0, 379.0, 253.0, 150.0, 102.0, 65.0, 54.0, 30.0, 29.0, 19.0, 13.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11358642578125, -0.1097707748413086, -0.10595512390136719, -0.10213947296142578, -0.09832382202148438, -0.09450817108154297, -0.09069252014160156, -0.08687686920166016, -0.08306121826171875, -0.07924556732177734, -0.07542991638183594, -0.07161426544189453, -0.06779861450195312, -0.06398296356201172, -0.06016731262207031, -0.056351661682128906, -0.0525360107421875, -0.048720359802246094, -0.04490470886230469, -0.04108905792236328, -0.037273406982421875, -0.03345775604248047, -0.029642105102539062, -0.025826454162597656, -0.02201080322265625, -0.018195152282714844, -0.014379501342773438, -0.010563850402832031, -0.006748199462890625, -0.0029325485229492188, 0.0008831024169921875, 0.004698753356933594, 0.008514404296875, 0.012330055236816406, 0.016145706176757812, 0.01996135711669922, 0.023777008056640625, 0.02759265899658203, 0.03140830993652344, 0.035223960876464844, 0.03903961181640625, 0.042855262756347656, 0.04667091369628906, 0.05048656463623047, 0.054302215576171875, 0.05811786651611328, 0.06193351745605469, 0.0657491683959961, 0.0695648193359375, 0.0733804702758789, 0.07719612121582031, 0.08101177215576172, 0.08482742309570312, 0.08864307403564453, 0.09245872497558594, 0.09627437591552734, 0.10009002685546875, 0.10390567779541016, 0.10772132873535156, 0.11153697967529297, 0.11535263061523438, 0.11916828155517578, 0.12298393249511719, 0.1267995834350586, 0.130615234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 10.0, 6.0, 5.0, 13.0, 12.0, 13.0, 26.0, 19.0, 19.0, 31.0, 34.0, 35.0, 46.0, 56.0, 31.0, 49.0, 42.0, 37.0, 50.0, 49.0, 38.0, 43.0, 61.0, 42.0, 33.0, 24.0, 24.0, 21.0, 24.0, 20.0, 20.0, 10.0, 11.0, 10.0, 7.0, 8.0, 1.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.1134805679321289, -0.10983467102050781, -0.10618877410888672, -0.10254287719726562, -0.09889698028564453, -0.09525108337402344, -0.09160518646240234, -0.08795928955078125, -0.08431339263916016, -0.08066749572753906, -0.07702159881591797, -0.07337570190429688, -0.06972980499267578, -0.06608390808105469, -0.062438011169433594, -0.0587921142578125, -0.055146217346191406, -0.05150032043457031, -0.04785442352294922, -0.044208526611328125, -0.04056262969970703, -0.03691673278808594, -0.033270835876464844, -0.02962493896484375, -0.025979042053222656, -0.022333145141601562, -0.01868724822998047, -0.015041351318359375, -0.011395454406738281, -0.0077495574951171875, -0.004103660583496094, -0.000457763671875, 0.0031881332397460938, 0.0068340301513671875, 0.010479927062988281, 0.014125823974609375, 0.01777172088623047, 0.021417617797851562, 0.025063514709472656, 0.02870941162109375, 0.032355308532714844, 0.03600120544433594, 0.03964710235595703, 0.043292999267578125, 0.04693889617919922, 0.05058479309082031, 0.054230690002441406, 0.0578765869140625, 0.061522483825683594, 0.06516838073730469, 0.06881427764892578, 0.07246017456054688, 0.07610607147216797, 0.07975196838378906, 0.08339786529541016, 0.08704376220703125, 0.09068965911865234, 0.09433555603027344, 0.09798145294189453, 0.10162734985351562, 0.10527324676513672, 0.10891914367675781, 0.1125650405883789, 0.1162109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 4.0, 11.0, 9.0, 13.0, 24.0, 31.0, 29.0, 53.0, 76.0, 100.0, 155.0, 291.0, 507.0, 1119.0, 2375.0, 5595.0, 12790.0, 30672.0, 83868.0, 334928.0, 409340.0, 103309.0, 36415.0, 14903.0, 6386.0, 2795.0, 1332.0, 562.0, 300.0, 179.0, 108.0, 80.0, 51.0, 38.0, 29.0, 19.0, 16.0, 9.0, 10.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2198657989501953, -0.21255874633789062, -0.20525169372558594, -0.19794464111328125, -0.19063758850097656, -0.18333053588867188, -0.1760234832763672, -0.1687164306640625, -0.1614093780517578, -0.15410232543945312, -0.14679527282714844, -0.13948822021484375, -0.13218116760253906, -0.12487411499023438, -0.11756706237792969, -0.110260009765625, -0.10295295715332031, -0.09564590454101562, -0.08833885192871094, -0.08103179931640625, -0.07372474670410156, -0.06641769409179688, -0.05911064147949219, -0.0518035888671875, -0.04449653625488281, -0.037189483642578125, -0.029882431030273438, -0.02257537841796875, -0.015268325805664062, -0.007961273193359375, -0.0006542205810546875, 0.00665283203125, 0.013959884643554688, 0.021266937255859375, 0.028573989868164062, 0.03588104248046875, 0.04318809509277344, 0.050495147705078125, 0.05780220031738281, 0.0651092529296875, 0.07241630554199219, 0.07972335815429688, 0.08703041076660156, 0.09433746337890625, 0.10164451599121094, 0.10895156860351562, 0.11625862121582031, 0.123565673828125, 0.1308727264404297, 0.13817977905273438, 0.14548683166503906, 0.15279388427734375, 0.16010093688964844, 0.16740798950195312, 0.1747150421142578, 0.1820220947265625, 0.1893291473388672, 0.19663619995117188, 0.20394325256347656, 0.21125030517578125, 0.21855735778808594, 0.22586441040039062, 0.2331714630126953, 0.240478515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 7.0, 4.0, 8.0, 11.0, 17.0, 11.0, 19.0, 27.0, 27.0, 28.0, 33.0, 41.0, 31.0, 35.0, 41.0, 33.0, 54.0, 60.0, 47.0, 41.0, 40.0, 45.0, 40.0, 36.0, 38.0, 38.0, 26.0, 35.0, 22.0, 15.0, 12.0, 16.0, 13.0, 13.0, 8.0, 8.0, 8.0, 6.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.36474609375, -0.3546714782714844, -0.34459686279296875, -0.3345222473144531, -0.3244476318359375, -0.3143730163574219, -0.30429840087890625, -0.2942237854003906, -0.284149169921875, -0.2740745544433594, -0.26399993896484375, -0.2539253234863281, -0.2438507080078125, -0.23377609252929688, -0.22370147705078125, -0.21362686157226562, -0.20355224609375, -0.19347763061523438, -0.18340301513671875, -0.17332839965820312, -0.1632537841796875, -0.15317916870117188, -0.14310455322265625, -0.13302993774414062, -0.122955322265625, -0.11288070678710938, -0.10280609130859375, -0.09273147583007812, -0.0826568603515625, -0.07258224487304688, -0.06250762939453125, -0.052433013916015625, -0.0423583984375, -0.032283782958984375, -0.02220916748046875, -0.012134552001953125, -0.0020599365234375, 0.008014678955078125, 0.01808929443359375, 0.028163909912109375, 0.038238525390625, 0.048313140869140625, 0.05838775634765625, 0.06846237182617188, 0.0785369873046875, 0.08861160278320312, 0.09868621826171875, 0.10876083374023438, 0.11883544921875, 0.12891006469726562, 0.13898468017578125, 0.14905929565429688, 0.1591339111328125, 0.16920852661132812, 0.17928314208984375, 0.18935775756835938, 0.199432373046875, 0.20950698852539062, 0.21958160400390625, 0.22965621948242188, 0.2397308349609375, 0.24980545043945312, 0.25988006591796875, 0.2699546813964844, 0.280029296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 13.0, 27.0, 24.0, 65.0, 78.0, 131.0, 258.0, 418.0, 775.0, 1534.0, 3008.0, 6152.0, 12925.0, 29036.0, 69745.0, 191529.0, 444882.0, 172713.0, 64238.0, 26992.0, 12207.0, 5767.0, 2896.0, 1419.0, 774.0, 399.0, 231.0, 129.0, 70.0, 43.0, 29.0, 14.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0894775390625, -0.08688068389892578, -0.08428382873535156, -0.08168697357177734, -0.07909011840820312, -0.0764932632446289, -0.07389640808105469, -0.07129955291748047, -0.06870269775390625, -0.06610584259033203, -0.06350898742675781, -0.060912132263183594, -0.058315277099609375, -0.055718421936035156, -0.05312156677246094, -0.05052471160888672, -0.0479278564453125, -0.04533100128173828, -0.04273414611816406, -0.040137290954589844, -0.037540435791015625, -0.034943580627441406, -0.03234672546386719, -0.02974987030029297, -0.02715301513671875, -0.02455615997314453, -0.021959304809570312, -0.019362449645996094, -0.016765594482421875, -0.014168739318847656, -0.011571884155273438, -0.008975028991699219, -0.006378173828125, -0.0037813186645507812, -0.0011844635009765625, 0.0014123916625976562, 0.004009246826171875, 0.006606101989746094, 0.009202957153320312, 0.011799812316894531, 0.01439666748046875, 0.01699352264404297, 0.019590377807617188, 0.022187232971191406, 0.024784088134765625, 0.027380943298339844, 0.029977798461914062, 0.03257465362548828, 0.0351715087890625, 0.03776836395263672, 0.04036521911621094, 0.042962074279785156, 0.045558929443359375, 0.048155784606933594, 0.05075263977050781, 0.05334949493408203, 0.05594635009765625, 0.05854320526123047, 0.06114006042480469, 0.0637369155883789, 0.06633377075195312, 0.06893062591552734, 0.07152748107910156, 0.07412433624267578, 0.07672119140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 6.0, 7.0, 11.0, 14.0, 23.0, 27.0, 48.0, 65.0, 98.0, 110.0, 123.0, 108.0, 106.0, 61.0, 52.0, 22.0, 26.0, 20.0, 12.0, 6.0, 6.0, 11.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8431415557861328e-05, -2.7553178369998932e-05, -2.6674941182136536e-05, -2.579670399427414e-05, -2.4918466806411743e-05, -2.4040229618549347e-05, -2.316199243068695e-05, -2.2283755242824554e-05, -2.1405518054962158e-05, -2.0527280867099762e-05, -1.9649043679237366e-05, -1.877080649137497e-05, -1.7892569303512573e-05, -1.7014332115650177e-05, -1.613609492778778e-05, -1.5257857739925385e-05, -1.4379620552062988e-05, -1.3501383364200592e-05, -1.2623146176338196e-05, -1.17449089884758e-05, -1.0866671800613403e-05, -9.988434612751007e-06, -9.11019742488861e-06, -8.231960237026215e-06, -7.353723049163818e-06, -6.475485861301422e-06, -5.597248673439026e-06, -4.71901148557663e-06, -3.840774297714233e-06, -2.962537109851837e-06, -2.084299921989441e-06, -1.2060627341270447e-06, -3.2782554626464844e-07, 5.504116415977478e-07, 1.428648829460144e-06, 2.3068860173225403e-06, 3.1851232051849365e-06, 4.063360393047333e-06, 4.941597580909729e-06, 5.819834768772125e-06, 6.6980719566345215e-06, 7.576309144496918e-06, 8.454546332359314e-06, 9.33278352022171e-06, 1.0211020708084106e-05, 1.1089257895946503e-05, 1.1967495083808899e-05, 1.2845732271671295e-05, 1.3723969459533691e-05, 1.4602206647396088e-05, 1.5480443835258484e-05, 1.635868102312088e-05, 1.7236918210983276e-05, 1.8115155398845673e-05, 1.899339258670807e-05, 1.9871629774570465e-05, 2.074986696243286e-05, 2.1628104150295258e-05, 2.2506341338157654e-05, 2.338457852602005e-05, 2.4262815713882446e-05, 2.5141052901744843e-05, 2.601929008960724e-05, 2.6897527277469635e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 6.0, 18.0, 23.0, 22.0, 43.0, 66.0, 92.0, 117.0, 201.0, 326.0, 645.0, 1306.0, 2974.0, 7903.0, 24932.0, 93267.0, 428567.0, 373177.0, 80419.0, 21983.0, 7156.0, 2680.0, 1166.0, 621.0, 284.0, 203.0, 105.0, 85.0, 40.0, 49.0, 28.0, 18.0, 12.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11431884765625, -0.11036968231201172, -0.10642051696777344, -0.10247135162353516, -0.09852218627929688, -0.0945730209350586, -0.09062385559082031, -0.08667469024658203, -0.08272552490234375, -0.07877635955810547, -0.07482719421386719, -0.0708780288696289, -0.06692886352539062, -0.06297969818115234, -0.05903053283691406, -0.05508136749267578, -0.0511322021484375, -0.04718303680419922, -0.04323387145996094, -0.039284706115722656, -0.035335540771484375, -0.031386375427246094, -0.027437210083007812, -0.02348804473876953, -0.01953887939453125, -0.015589714050292969, -0.011640548706054688, -0.007691383361816406, -0.003742218017578125, 0.00020694732666015625, 0.0041561126708984375, 0.008105278015136719, 0.012054443359375, 0.01600360870361328, 0.019952774047851562, 0.023901939392089844, 0.027851104736328125, 0.031800270080566406, 0.03574943542480469, 0.03969860076904297, 0.04364776611328125, 0.04759693145751953, 0.05154609680175781, 0.055495262145996094, 0.059444427490234375, 0.06339359283447266, 0.06734275817871094, 0.07129192352294922, 0.0752410888671875, 0.07919025421142578, 0.08313941955566406, 0.08708858489990234, 0.09103775024414062, 0.0949869155883789, 0.09893608093261719, 0.10288524627685547, 0.10683441162109375, 0.11078357696533203, 0.11473274230957031, 0.1186819076538086, 0.12263107299804688, 0.12658023834228516, 0.13052940368652344, 0.13447856903076172, 0.138427734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 6.0, 13.0, 14.0, 11.0, 14.0, 14.0, 21.0, 31.0, 43.0, 38.0, 54.0, 54.0, 84.0, 89.0, 93.0, 74.0, 69.0, 40.0, 50.0, 36.0, 30.0, 17.0, 24.0, 17.0, 15.0, 7.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0833740234375, -0.08090877532958984, -0.07844352722167969, -0.07597827911376953, -0.07351303100585938, -0.07104778289794922, -0.06858253479003906, -0.0661172866821289, -0.06365203857421875, -0.061186790466308594, -0.05872154235839844, -0.05625629425048828, -0.053791046142578125, -0.05132579803466797, -0.04886054992675781, -0.046395301818847656, -0.0439300537109375, -0.041464805603027344, -0.03899955749511719, -0.03653430938720703, -0.034069061279296875, -0.03160381317138672, -0.029138565063476562, -0.026673316955566406, -0.02420806884765625, -0.021742820739746094, -0.019277572631835938, -0.01681232452392578, -0.014347076416015625, -0.011881828308105469, -0.009416580200195312, -0.006951332092285156, -0.004486083984375, -0.0020208358764648438, 0.0004444122314453125, 0.0029096603393554688, 0.005374908447265625, 0.007840156555175781, 0.010305404663085938, 0.012770652770996094, 0.01523590087890625, 0.017701148986816406, 0.020166397094726562, 0.02263164520263672, 0.025096893310546875, 0.02756214141845703, 0.030027389526367188, 0.032492637634277344, 0.0349578857421875, 0.037423133850097656, 0.03988838195800781, 0.04235363006591797, 0.044818878173828125, 0.04728412628173828, 0.04974937438964844, 0.052214622497558594, 0.05467987060546875, 0.057145118713378906, 0.05961036682128906, 0.06207561492919922, 0.06454086303710938, 0.06700611114501953, 0.06947135925292969, 0.07193660736083984, 0.07440185546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 14.0, 21.0, 56.0, 73.0, 101.0, 131.0, 163.0, 155.0, 104.0, 81.0, 45.0, 20.0, 14.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.010113000869751, -1.9697915315628052, -1.9294699430465698, -1.889148473739624, -1.8488268852233887, -1.8085054159164429, -1.768183946609497, -1.7278623580932617, -1.687540888786316, -1.6472194194793701, -1.6068978309631348, -1.566576361656189, -1.5262548923492432, -1.4859333038330078, -1.445611834526062, -1.4052903652191162, -1.3649687767028809, -1.324647307395935, -1.2843257188796997, -1.244004249572754, -1.2036826610565186, -1.1633611917495728, -1.123039722442627, -1.0827181339263916, -1.0423966646194458, -1.0020751953125, -0.9617536067962646, -0.9214321374893188, -0.8811106085777283, -0.8407890796661377, -0.8004676103591919, -0.7601460814476013, -0.7198245525360107, -0.6795030236244202, -0.6391814947128296, -0.5988600254058838, -0.5585384964942932, -0.5182169675827026, -0.47789546847343445, -0.43757396936416626, -0.3972524404525757, -0.3569309115409851, -0.3166094124317169, -0.27628791332244873, -0.23596638441085815, -0.19564487040042877, -0.1553233563899994, -0.1150018572807312, -0.07468032836914062, -0.03435881435871124, 0.00596269965171814, 0.04628421366214752, 0.0866057276725769, 0.1269272416830063, 0.16724875569343567, 0.20757025480270386, 0.24789178371429443, 0.288213312625885, 0.3285348117351532, 0.3688563108444214, 0.40917783975601196, 0.44949936866760254, 0.4898208677768707, 0.5301423668861389, 0.5704638957977295]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 1.0, 5.0, 1.0, 7.0, 7.0, 13.0, 19.0, 26.0, 19.0, 23.0, 13.0, 36.0, 32.0, 28.0, 45.0, 39.0, 35.0, 52.0, 46.0, 39.0, 51.0, 50.0, 42.0, 41.0, 38.0, 34.0, 38.0, 28.0, 24.0, 37.0, 35.0, 23.0, 17.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.9345296621322632, -0.909970760345459, -0.8854118585586548, -0.8608529567718506, -0.8362940549850464, -0.8117351531982422, -0.787176251411438, -0.7626173496246338, -0.7380584478378296, -0.7134995460510254, -0.6889406442642212, -0.664381742477417, -0.6398228406906128, -0.6152639389038086, -0.5907050371170044, -0.5661461353302002, -0.541587233543396, -0.5170283317565918, -0.4924694299697876, -0.4679105281829834, -0.4433516263961792, -0.418792724609375, -0.3942338228225708, -0.3696749210357666, -0.3451159596443176, -0.3205570578575134, -0.29599815607070923, -0.27143925428390503, -0.24688035249710083, -0.22232145071029663, -0.19776253402233124, -0.17320363223552704, -0.14864474534988403, -0.12408584356307983, -0.09952694177627563, -0.07496803253889084, -0.05040913075208664, -0.02585022896528244, -0.001291319727897644, 0.023267582058906555, 0.047826483845710754, 0.07238538563251495, 0.09694428741931915, 0.12150319665670395, 0.14606210589408875, 0.17062100768089294, 0.19517990946769714, 0.21973881125450134, 0.24429771304130554, 0.26885661482810974, 0.29341551661491394, 0.31797441840171814, 0.34253332018852234, 0.36709222197532654, 0.3916511535644531, 0.4162100553512573, 0.4407689571380615, 0.4653278589248657, 0.4898867607116699, 0.5144456624984741, 0.5390045642852783, 0.5635634660720825, 0.5881223678588867, 0.6126812696456909, 0.6372401714324951]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 2.0, 1.0, 7.0, 13.0, 23.0, 24.0, 52.0, 78.0, 76.0, 145.0, 247.0, 388.0, 627.0, 1076.0, 1737.0, 3101.0, 5087.0, 9056.0, 16377.0, 30152.0, 58160.0, 120450.0, 291675.0, 926038.0, 1696154.0, 618978.0, 214516.0, 94726.0, 47652.0, 25307.0, 13977.0, 7674.0, 4385.0, 2530.0, 1459.0, 885.0, 567.0, 363.0, 208.0, 117.0, 75.0, 50.0, 28.0, 20.0, 10.0, 1.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09246826171875, -0.0889577865600586, -0.08544731140136719, -0.08193683624267578, -0.07842636108398438, -0.07491588592529297, -0.07140541076660156, -0.06789493560791016, -0.06438446044921875, -0.060873985290527344, -0.05736351013183594, -0.05385303497314453, -0.050342559814453125, -0.04683208465576172, -0.04332160949707031, -0.039811134338378906, -0.0363006591796875, -0.032790184020996094, -0.029279708862304688, -0.02576923370361328, -0.022258758544921875, -0.01874828338623047, -0.015237808227539062, -0.011727333068847656, -0.00821685791015625, -0.004706382751464844, -0.0011959075927734375, 0.0023145675659179688, 0.005825042724609375, 0.009335517883300781, 0.012845993041992188, 0.016356468200683594, 0.019866943359375, 0.023377418518066406, 0.026887893676757812, 0.03039836883544922, 0.033908843994140625, 0.03741931915283203, 0.04092979431152344, 0.044440269470214844, 0.04795074462890625, 0.051461219787597656, 0.05497169494628906, 0.05848217010498047, 0.061992645263671875, 0.06550312042236328, 0.06901359558105469, 0.0725240707397461, 0.0760345458984375, 0.0795450210571289, 0.08305549621582031, 0.08656597137451172, 0.09007644653320312, 0.09358692169189453, 0.09709739685058594, 0.10060787200927734, 0.10411834716796875, 0.10762882232666016, 0.11113929748535156, 0.11464977264404297, 0.11816024780273438, 0.12167072296142578, 0.1251811981201172, 0.1286916732788086, 0.1322021484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 6.0, 7.0, 11.0, 16.0, 17.0, 15.0, 13.0, 24.0, 19.0, 23.0, 35.0, 20.0, 24.0, 30.0, 38.0, 49.0, 51.0, 44.0, 40.0, 57.0, 45.0, 41.0, 32.0, 36.0, 35.0, 31.0, 35.0, 44.0, 14.0, 24.0, 21.0, 21.0, 12.0, 16.0, 6.0, 8.0, 12.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096923828125, -0.0936574935913086, -0.09039115905761719, -0.08712482452392578, -0.08385848999023438, -0.08059215545654297, -0.07732582092285156, -0.07405948638916016, -0.07079315185546875, -0.06752681732177734, -0.06426048278808594, -0.06099414825439453, -0.057727813720703125, -0.05446147918701172, -0.05119514465332031, -0.047928810119628906, -0.0446624755859375, -0.041396141052246094, -0.03812980651855469, -0.03486347198486328, -0.031597137451171875, -0.02833080291748047, -0.025064468383789062, -0.021798133850097656, -0.01853179931640625, -0.015265464782714844, -0.011999130249023438, -0.008732795715332031, -0.005466461181640625, -0.0022001266479492188, 0.0010662078857421875, 0.004332542419433594, 0.007598876953125, 0.010865211486816406, 0.014131546020507812, 0.01739788055419922, 0.020664215087890625, 0.02393054962158203, 0.027196884155273438, 0.030463218688964844, 0.03372955322265625, 0.036995887756347656, 0.04026222229003906, 0.04352855682373047, 0.046794891357421875, 0.05006122589111328, 0.05332756042480469, 0.056593894958496094, 0.0598602294921875, 0.0631265640258789, 0.06639289855957031, 0.06965923309326172, 0.07292556762695312, 0.07619190216064453, 0.07945823669433594, 0.08272457122802734, 0.08599090576171875, 0.08925724029541016, 0.09252357482910156, 0.09578990936279297, 0.09905624389648438, 0.10232257843017578, 0.10558891296386719, 0.1088552474975586, 0.11212158203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 23.0, 9.0, 32.0, 35.0, 48.0, 62.0, 113.0, 153.0, 200.0, 367.0, 499.0, 818.0, 1190.0, 1942.0, 3034.0, 5287.0, 8538.0, 14711.0, 25626.0, 46330.0, 86720.0, 170527.0, 389847.0, 1161608.0, 1385018.0, 473022.0, 197845.0, 98441.0, 52690.0, 28852.0, 16387.0, 9433.0, 5631.0, 3339.0, 2048.0, 1275.0, 887.0, 558.0, 341.0, 267.0, 151.0, 107.0, 73.0, 46.0, 41.0, 31.0, 20.0, 20.0, 7.0, 10.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.1219482421875, -0.1180267333984375, -0.114105224609375, -0.1101837158203125, -0.10626220703125, -0.1023406982421875, -0.098419189453125, -0.0944976806640625, -0.090576171875, -0.0866546630859375, -0.082733154296875, -0.0788116455078125, -0.07489013671875, -0.0709686279296875, -0.067047119140625, -0.0631256103515625, -0.0592041015625, -0.0552825927734375, -0.051361083984375, -0.0474395751953125, -0.04351806640625, -0.0395965576171875, -0.035675048828125, -0.0317535400390625, -0.02783203125, -0.0239105224609375, -0.019989013671875, -0.0160675048828125, -0.01214599609375, -0.0082244873046875, -0.004302978515625, -0.0003814697265625, 0.0035400390625, 0.0074615478515625, 0.011383056640625, 0.0153045654296875, 0.01922607421875, 0.0231475830078125, 0.027069091796875, 0.0309906005859375, 0.034912109375, 0.0388336181640625, 0.042755126953125, 0.0466766357421875, 0.05059814453125, 0.0545196533203125, 0.058441162109375, 0.0623626708984375, 0.0662841796875, 0.0702056884765625, 0.074127197265625, 0.0780487060546875, 0.08197021484375, 0.0858917236328125, 0.089813232421875, 0.0937347412109375, 0.09765625, 0.1015777587890625, 0.105499267578125, 0.1094207763671875, 0.11334228515625, 0.1172637939453125, 0.121185302734375, 0.1251068115234375, 0.1290283203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 17.0, 15.0, 19.0, 25.0, 23.0, 39.0, 34.0, 54.0, 88.0, 120.0, 152.0, 259.0, 345.0, 545.0, 623.0, 508.0, 304.0, 217.0, 168.0, 113.0, 87.0, 69.0, 40.0, 34.0, 32.0, 24.0, 22.0, 18.0, 10.0, 9.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.1827411651611328, -0.17651748657226562, -0.17029380798339844, -0.16407012939453125, -0.15784645080566406, -0.15162277221679688, -0.1453990936279297, -0.1391754150390625, -0.1329517364501953, -0.12672805786132812, -0.12050437927246094, -0.11428070068359375, -0.10805702209472656, -0.10183334350585938, -0.09560966491699219, -0.089385986328125, -0.08316230773925781, -0.07693862915039062, -0.07071495056152344, -0.06449127197265625, -0.05826759338378906, -0.052043914794921875, -0.04582023620605469, -0.0395965576171875, -0.03337287902832031, -0.027149200439453125, -0.020925521850585938, -0.01470184326171875, -0.008478164672851562, -0.002254486083984375, 0.0039691925048828125, 0.01019287109375, 0.016416549682617188, 0.022640228271484375, 0.028863906860351562, 0.03508758544921875, 0.04131126403808594, 0.047534942626953125, 0.05375862121582031, 0.0599822998046875, 0.06620597839355469, 0.07242965698242188, 0.07865333557128906, 0.08487701416015625, 0.09110069274902344, 0.09732437133789062, 0.10354804992675781, 0.109771728515625, 0.11599540710449219, 0.12221908569335938, 0.12844276428222656, 0.13466644287109375, 0.14089012145996094, 0.14711380004882812, 0.1533374786376953, 0.1595611572265625, 0.1657848358154297, 0.17200851440429688, 0.17823219299316406, 0.18445587158203125, 0.19067955017089844, 0.19690322875976562, 0.2031269073486328, 0.2093505859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 22.0, 47.0, 68.0, 123.0, 147.0, 148.0, 158.0, 123.0, 68.0, 39.0, 19.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935222625732422, -1.3399029970169067, -1.2862837314605713, -1.2326644659042358, -1.1790452003479004, -1.1254260540008545, -1.071806788444519, -1.0181875228881836, -0.9645682573318481, -0.9109489917755127, -0.8573297262191772, -0.8037105202674866, -0.7500912547111511, -0.6964719891548157, -0.642852783203125, -0.5892335176467896, -0.5356142520904541, -0.48199498653411865, -0.4283757507801056, -0.37475651502609253, -0.3211372494697571, -0.26751798391342163, -0.21389874815940857, -0.1602795124053955, -0.10666024684906006, -0.0530409961938858, 0.0005782544612884521, 0.05419750511646271, 0.10781675577163696, 0.1614360213279724, 0.21505525708198547, 0.26867449283599854, 0.322293758392334, 0.37591302394866943, 0.4295322597026825, 0.48315149545669556, 0.536770761013031, 0.5903900265693665, 0.6440092325210571, 0.6976284980773926, 0.751247763633728, 0.8048670291900635, 0.8584862947463989, 0.9121055006980896, 0.965724766254425, 1.0193440914154053, 1.0729632377624512, 1.1265825033187866, 1.180201768875122, 1.2338210344314575, 1.287440299987793, 1.3410595655441284, 1.3946788311004639, 1.4482979774475098, 1.5019172430038452, 1.5555365085601807, 1.6091557741165161, 1.6627750396728516, 1.716394305229187, 1.7700135707855225, 1.8236327171325684, 1.8772521018981934, 1.9308712482452393, 1.9844905138015747, 2.03810977935791]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 6.0, 5.0, 9.0, 13.0, 17.0, 15.0, 17.0, 17.0, 18.0, 28.0, 39.0, 27.0, 38.0, 23.0, 52.0, 38.0, 37.0, 38.0, 37.0, 48.0, 46.0, 37.0, 43.0, 41.0, 32.0, 33.0, 21.0, 35.0, 26.0, 26.0, 12.0, 19.0, 14.0, 13.0, 9.0, 8.0, 17.0, 6.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6053301095962524, -0.5854455828666687, -0.5655609965324402, -0.5456764698028564, -0.5257918834686279, -0.5059073567390442, -0.48602283000946045, -0.4661382734775543, -0.4462537169456482, -0.42636916041374207, -0.40648460388183594, -0.3866000771522522, -0.36671552062034607, -0.34683096408843994, -0.3269464373588562, -0.3070618808269501, -0.28717732429504395, -0.2672927677631378, -0.24740822613239288, -0.22752368450164795, -0.20763912796974182, -0.1877545714378357, -0.16787002980709076, -0.14798548817634583, -0.1281009316444397, -0.10821638256311417, -0.08833183348178864, -0.0684472844004631, -0.04856273531913757, -0.028678186237812042, -0.008793637156486511, 0.011090904474258423, 0.03097546100616455, 0.05086001008749008, 0.07074455916881561, 0.09062910825014114, 0.11051365733146667, 0.1303982138633728, 0.15028275549411774, 0.17016729712486267, 0.1900518536567688, 0.20993641018867493, 0.22982095181941986, 0.2497054934501648, 0.2695900499820709, 0.28947460651397705, 0.3093591332435608, 0.3292436897754669, 0.34912824630737305, 0.3690128028392792, 0.3888973593711853, 0.40878188610076904, 0.42866644263267517, 0.4485509991645813, 0.46843552589416504, 0.48832008242607117, 0.5082046389579773, 0.528089165687561, 0.5479737520217896, 0.5678582787513733, 0.587742805480957, 0.6076273918151855, 0.6275119185447693, 0.647396445274353, 0.6672810316085815]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 8.0, 10.0, 19.0, 22.0, 53.0, 49.0, 93.0, 141.0, 233.0, 315.0, 484.0, 743.0, 1112.0, 1741.0, 2446.0, 3375.0, 5458.0, 8369.0, 13729.0, 23788.0, 47070.0, 101016.0, 215417.0, 286510.0, 169797.0, 77491.0, 37002.0, 19414.0, 11265.0, 7145.0, 4656.0, 3150.0, 2042.0, 1472.0, 979.0, 643.0, 420.0, 307.0, 222.0, 116.0, 96.0, 52.0, 33.0, 19.0, 13.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1141357421875, -0.11049270629882812, -0.10684967041015625, -0.10320663452148438, -0.0995635986328125, -0.09592056274414062, -0.09227752685546875, -0.08863449096679688, -0.084991455078125, -0.08134841918945312, -0.07770538330078125, -0.07406234741210938, -0.0704193115234375, -0.06677627563476562, -0.06313323974609375, -0.059490203857421875, -0.05584716796875, -0.052204132080078125, -0.04856109619140625, -0.044918060302734375, -0.0412750244140625, -0.037631988525390625, -0.03398895263671875, -0.030345916748046875, -0.026702880859375, -0.023059844970703125, -0.01941680908203125, -0.015773773193359375, -0.0121307373046875, -0.008487701416015625, -0.00484466552734375, -0.001201629638671875, 0.00244140625, 0.006084442138671875, 0.00972747802734375, 0.013370513916015625, 0.0170135498046875, 0.020656585693359375, 0.02429962158203125, 0.027942657470703125, 0.031585693359375, 0.035228729248046875, 0.03887176513671875, 0.042514801025390625, 0.0461578369140625, 0.049800872802734375, 0.05344390869140625, 0.057086944580078125, 0.06072998046875, 0.06437301635742188, 0.06801605224609375, 0.07165908813476562, 0.0753021240234375, 0.07894515991210938, 0.08258819580078125, 0.08623123168945312, 0.089874267578125, 0.09351730346679688, 0.09716033935546875, 0.10080337524414062, 0.1044464111328125, 0.10808944702148438, 0.11173248291015625, 0.11537551879882812, 0.1190185546875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 7.0, 11.0, 5.0, 10.0, 6.0, 15.0, 21.0, 15.0, 31.0, 22.0, 30.0, 32.0, 27.0, 36.0, 30.0, 45.0, 34.0, 43.0, 53.0, 45.0, 44.0, 39.0, 38.0, 41.0, 33.0, 37.0, 39.0, 34.0, 23.0, 31.0, 15.0, 10.0, 9.0, 19.0, 11.0, 7.0, 13.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1126708984375, -0.1093902587890625, -0.106109619140625, -0.1028289794921875, -0.09954833984375, -0.0962677001953125, -0.092987060546875, -0.0897064208984375, -0.08642578125, -0.0831451416015625, -0.079864501953125, -0.0765838623046875, -0.07330322265625, -0.0700225830078125, -0.066741943359375, -0.0634613037109375, -0.0601806640625, -0.0569000244140625, -0.053619384765625, -0.0503387451171875, -0.04705810546875, -0.0437774658203125, -0.040496826171875, -0.0372161865234375, -0.033935546875, -0.0306549072265625, -0.027374267578125, -0.0240936279296875, -0.02081298828125, -0.0175323486328125, -0.014251708984375, -0.0109710693359375, -0.0076904296875, -0.0044097900390625, -0.001129150390625, 0.0021514892578125, 0.00543212890625, 0.0087127685546875, 0.011993408203125, 0.0152740478515625, 0.0185546875, 0.0218353271484375, 0.025115966796875, 0.0283966064453125, 0.03167724609375, 0.0349578857421875, 0.038238525390625, 0.0415191650390625, 0.0447998046875, 0.0480804443359375, 0.051361083984375, 0.0546417236328125, 0.05792236328125, 0.0612030029296875, 0.064483642578125, 0.0677642822265625, 0.071044921875, 0.0743255615234375, 0.077606201171875, 0.0808868408203125, 0.08416748046875, 0.0874481201171875, 0.090728759765625, 0.0940093994140625, 0.0972900390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 9.0, 10.0, 13.0, 18.0, 23.0, 38.0, 44.0, 80.0, 130.0, 211.0, 456.0, 953.0, 1863.0, 4118.0, 9656.0, 26288.0, 89065.0, 351518.0, 405284.0, 108093.0, 30656.0, 11104.0, 4608.0, 2102.0, 1009.0, 510.0, 238.0, 145.0, 99.0, 67.0, 28.0, 26.0, 22.0, 12.0, 18.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.2147674560546875, -0.207855224609375, -0.2009429931640625, -0.19403076171875, -0.1871185302734375, -0.180206298828125, -0.1732940673828125, -0.1663818359375, -0.1594696044921875, -0.152557373046875, -0.1456451416015625, -0.13873291015625, -0.1318206787109375, -0.124908447265625, -0.1179962158203125, -0.111083984375, -0.1041717529296875, -0.097259521484375, -0.0903472900390625, -0.08343505859375, -0.0765228271484375, -0.069610595703125, -0.0626983642578125, -0.0557861328125, -0.0488739013671875, -0.041961669921875, -0.0350494384765625, -0.02813720703125, -0.0212249755859375, -0.014312744140625, -0.0074005126953125, -0.00048828125, 0.0064239501953125, 0.013336181640625, 0.0202484130859375, 0.02716064453125, 0.0340728759765625, 0.040985107421875, 0.0478973388671875, 0.0548095703125, 0.0617218017578125, 0.068634033203125, 0.0755462646484375, 0.08245849609375, 0.0893707275390625, 0.096282958984375, 0.1031951904296875, 0.110107421875, 0.1170196533203125, 0.123931884765625, 0.1308441162109375, 0.13775634765625, 0.1446685791015625, 0.151580810546875, 0.1584930419921875, 0.1654052734375, 0.1723175048828125, 0.179229736328125, 0.1861419677734375, 0.19305419921875, 0.1999664306640625, 0.206878662109375, 0.2137908935546875, 0.220703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 8.0, 11.0, 8.0, 11.0, 13.0, 12.0, 16.0, 13.0, 26.0, 29.0, 32.0, 34.0, 31.0, 46.0, 45.0, 43.0, 45.0, 52.0, 62.0, 44.0, 36.0, 37.0, 38.0, 29.0, 32.0, 26.0, 29.0, 26.0, 29.0, 25.0, 16.0, 15.0, 14.0, 9.0, 17.0, 7.0, 3.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.298583984375, -0.2895927429199219, -0.28060150146484375, -0.2716102600097656, -0.2626190185546875, -0.2536277770996094, -0.24463653564453125, -0.23564529418945312, -0.226654052734375, -0.21766281127929688, -0.20867156982421875, -0.19968032836914062, -0.1906890869140625, -0.18169784545898438, -0.17270660400390625, -0.16371536254882812, -0.15472412109375, -0.14573287963867188, -0.13674163818359375, -0.12775039672851562, -0.1187591552734375, -0.10976791381835938, -0.10077667236328125, -0.09178543090820312, -0.082794189453125, -0.07380294799804688, -0.06481170654296875, -0.055820465087890625, -0.0468292236328125, -0.037837982177734375, -0.02884674072265625, -0.019855499267578125, -0.0108642578125, -0.001873016357421875, 0.00711822509765625, 0.016109466552734375, 0.0251007080078125, 0.034091949462890625, 0.04308319091796875, 0.052074432373046875, 0.061065673828125, 0.07005691528320312, 0.07904815673828125, 0.08803939819335938, 0.0970306396484375, 0.10602188110351562, 0.11501312255859375, 0.12400436401367188, 0.13299560546875, 0.14198684692382812, 0.15097808837890625, 0.15996932983398438, 0.1689605712890625, 0.17795181274414062, 0.18694305419921875, 0.19593429565429688, 0.204925537109375, 0.21391677856445312, 0.22290802001953125, 0.23189926147460938, 0.2408905029296875, 0.24988174438476562, 0.25887298583984375, 0.2678642272949219, 0.27685546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 7.0, 4.0, 9.0, 11.0, 23.0, 36.0, 44.0, 88.0, 111.0, 198.0, 368.0, 789.0, 1660.0, 4061.0, 9941.0, 25878.0, 72219.0, 220432.0, 420701.0, 190191.0, 63084.0, 23052.0, 8969.0, 3577.0, 1534.0, 734.0, 349.0, 166.0, 122.0, 61.0, 38.0, 32.0, 19.0, 13.0, 7.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0814208984375, -0.07891082763671875, -0.0764007568359375, -0.07389068603515625, -0.071380615234375, -0.06887054443359375, -0.0663604736328125, -0.06385040283203125, -0.06134033203125, -0.05883026123046875, -0.0563201904296875, -0.05381011962890625, -0.051300048828125, -0.04878997802734375, -0.0462799072265625, -0.04376983642578125, -0.041259765625, -0.03874969482421875, -0.0362396240234375, -0.03372955322265625, -0.031219482421875, -0.02870941162109375, -0.0261993408203125, -0.02368927001953125, -0.02117919921875, -0.01866912841796875, -0.0161590576171875, -0.01364898681640625, -0.011138916015625, -0.00862884521484375, -0.0061187744140625, -0.00360870361328125, -0.0010986328125, 0.00141143798828125, 0.0039215087890625, 0.00643157958984375, 0.008941650390625, 0.01145172119140625, 0.0139617919921875, 0.01647186279296875, 0.01898193359375, 0.02149200439453125, 0.0240020751953125, 0.02651214599609375, 0.029022216796875, 0.03153228759765625, 0.0340423583984375, 0.03655242919921875, 0.0390625, 0.04157257080078125, 0.0440826416015625, 0.04659271240234375, 0.049102783203125, 0.05161285400390625, 0.0541229248046875, 0.05663299560546875, 0.05914306640625, 0.06165313720703125, 0.0641632080078125, 0.06667327880859375, 0.069183349609375, 0.07169342041015625, 0.0742034912109375, 0.07671356201171875, 0.0792236328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 5.0, 20.0, 13.0, 20.0, 31.0, 33.0, 55.0, 58.0, 64.0, 63.0, 81.0, 84.0, 97.0, 76.0, 56.0, 37.0, 40.0, 20.0, 22.0, 27.0, 13.0, 10.0, 13.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633167266845703e-05, -1.5737488865852356e-05, -1.514330506324768e-05, -1.4549121260643005e-05, -1.395493745803833e-05, -1.3360753655433655e-05, -1.276656985282898e-05, -1.2172386050224304e-05, -1.1578202247619629e-05, -1.0984018445014954e-05, -1.0389834642410278e-05, -9.795650839805603e-06, -9.201467037200928e-06, -8.607283234596252e-06, -8.013099431991577e-06, -7.418915629386902e-06, -6.8247318267822266e-06, -6.230548024177551e-06, -5.636364221572876e-06, -5.042180418968201e-06, -4.447996616363525e-06, -3.85381281375885e-06, -3.259629011154175e-06, -2.6654452085494995e-06, -2.0712614059448242e-06, -1.477077603340149e-06, -8.828938007354736e-07, -2.8870999813079834e-07, 3.0547380447387695e-07, 8.996576070785522e-07, 1.4938414096832275e-06, 2.088025212287903e-06, 2.682209014892578e-06, 3.2763928174972534e-06, 3.870576620101929e-06, 4.464760422706604e-06, 5.058944225311279e-06, 5.653128027915955e-06, 6.24731183052063e-06, 6.841495633125305e-06, 7.4356794357299805e-06, 8.029863238334656e-06, 8.624047040939331e-06, 9.218230843544006e-06, 9.812414646148682e-06, 1.0406598448753357e-05, 1.1000782251358032e-05, 1.1594966053962708e-05, 1.2189149856567383e-05, 1.2783333659172058e-05, 1.3377517461776733e-05, 1.3971701264381409e-05, 1.4565885066986084e-05, 1.516006886959076e-05, 1.5754252672195435e-05, 1.634843647480011e-05, 1.6942620277404785e-05, 1.753680408000946e-05, 1.8130987882614136e-05, 1.872517168521881e-05, 1.9319355487823486e-05, 1.991353929042816e-05, 2.0507723093032837e-05, 2.1101906895637512e-05, 2.1696090698242188e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 9.0, 20.0, 28.0, 58.0, 88.0, 140.0, 288.0, 620.0, 1652.0, 5230.0, 20276.0, 93368.0, 408385.0, 399957.0, 90578.0, 19802.0, 5183.0, 1622.0, 636.0, 307.0, 121.0, 76.0, 45.0, 25.0, 16.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11260986328125, -0.10872554779052734, -0.10484123229980469, -0.10095691680908203, -0.09707260131835938, -0.09318828582763672, -0.08930397033691406, -0.0854196548461914, -0.08153533935546875, -0.0776510238647461, -0.07376670837402344, -0.06988239288330078, -0.06599807739257812, -0.06211376190185547, -0.05822944641113281, -0.054345130920410156, -0.0504608154296875, -0.046576499938964844, -0.04269218444824219, -0.03880786895751953, -0.034923553466796875, -0.03103923797607422, -0.027154922485351562, -0.023270606994628906, -0.01938629150390625, -0.015501976013183594, -0.011617660522460938, -0.007733345031738281, -0.003849029541015625, 3.528594970703125e-05, 0.0039196014404296875, 0.007803916931152344, 0.011688232421875, 0.015572547912597656, 0.019456863403320312, 0.02334117889404297, 0.027225494384765625, 0.03110980987548828, 0.03499412536621094, 0.038878440856933594, 0.04276275634765625, 0.046647071838378906, 0.05053138732910156, 0.05441570281982422, 0.058300018310546875, 0.06218433380126953, 0.06606864929199219, 0.06995296478271484, 0.0738372802734375, 0.07772159576416016, 0.08160591125488281, 0.08549022674560547, 0.08937454223632812, 0.09325885772705078, 0.09714317321777344, 0.1010274887084961, 0.10491180419921875, 0.1087961196899414, 0.11268043518066406, 0.11656475067138672, 0.12044906616210938, 0.12433338165283203, 0.1282176971435547, 0.13210201263427734, 0.135986328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 4.0, 9.0, 13.0, 11.0, 22.0, 19.0, 22.0, 29.0, 24.0, 41.0, 71.0, 66.0, 70.0, 80.0, 85.0, 66.0, 80.0, 55.0, 44.0, 38.0, 28.0, 29.0, 15.0, 25.0, 9.0, 6.0, 11.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062286376953125, -0.05999422073364258, -0.057702064514160156, -0.055409908294677734, -0.05311775207519531, -0.05082559585571289, -0.04853343963623047, -0.04624128341674805, -0.043949127197265625, -0.0416569709777832, -0.03936481475830078, -0.03707265853881836, -0.03478050231933594, -0.032488346099853516, -0.030196189880371094, -0.027904033660888672, -0.02561187744140625, -0.023319721221923828, -0.021027565002441406, -0.018735408782958984, -0.016443252563476562, -0.01415109634399414, -0.011858940124511719, -0.009566783905029297, -0.007274627685546875, -0.004982471466064453, -0.0026903152465820312, -0.0003981590270996094, 0.0018939971923828125, 0.004186153411865234, 0.006478309631347656, 0.008770465850830078, 0.0110626220703125, 0.013354778289794922, 0.015646934509277344, 0.017939090728759766, 0.020231246948242188, 0.02252340316772461, 0.02481555938720703, 0.027107715606689453, 0.029399871826171875, 0.0316920280456543, 0.03398418426513672, 0.03627634048461914, 0.03856849670410156, 0.040860652923583984, 0.043152809143066406, 0.04544496536254883, 0.04773712158203125, 0.05002927780151367, 0.052321434020996094, 0.054613590240478516, 0.05690574645996094, 0.05919790267944336, 0.06149005889892578, 0.0637822151184082, 0.06607437133789062, 0.06836652755737305, 0.07065868377685547, 0.07295083999633789, 0.07524299621582031, 0.07753515243530273, 0.07982730865478516, 0.08211946487426758, 0.08441162109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 11.0, 8.0, 41.0, 47.0, 79.0, 153.0, 179.0, 175.0, 113.0, 90.0, 53.0, 24.0, 14.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2466351985931396, -1.2071583271026611, -1.1676814556121826, -1.1282047033309937, -1.0887278318405151, -1.0492509603500366, -1.0097742080688477, -0.9702973365783691, -0.9308204650878906, -0.8913435935974121, -0.8518667817115784, -0.8123899698257446, -0.7729130983352661, -0.7334362268447876, -0.6939594149589539, -0.6544826030731201, -0.6150057315826416, -0.5755288600921631, -0.5360520482063293, -0.4965752065181732, -0.4570983648300171, -0.41762152314186096, -0.37814468145370483, -0.3386678397655487, -0.2991909980773926, -0.25971415638923645, -0.22023731470108032, -0.1807604730129242, -0.14128363132476807, -0.10180678963661194, -0.06232994794845581, -0.022853106260299683, 0.016623735427856445, 0.05610057711601257, 0.0955774188041687, 0.13505426049232483, 0.17453110218048096, 0.21400794386863708, 0.2534847855567932, 0.29296162724494934, 0.33243846893310547, 0.3719153106212616, 0.4113921523094177, 0.45086899399757385, 0.49034583568573, 0.5298227071762085, 0.5692995190620422, 0.608776330947876, 0.6482532024383545, 0.687730073928833, 0.7272068858146667, 0.7666836977005005, 0.806160569190979, 0.8456374406814575, 0.8851142525672913, 0.924591064453125, 0.9640679359436035, 1.003544807434082, 1.0430216789245605, 1.0824984312057495, 1.121975302696228, 1.1614521741867065, 1.2009289264678955, 1.240405797958374, 1.2798826694488525]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 11.0, 7.0, 12.0, 9.0, 9.0, 12.0, 16.0, 13.0, 21.0, 29.0, 25.0, 30.0, 39.0, 37.0, 29.0, 35.0, 37.0, 45.0, 38.0, 45.0, 38.0, 33.0, 40.0, 45.0, 25.0, 33.0, 30.0, 28.0, 18.0, 22.0, 26.0, 18.0, 16.0, 20.0, 18.0, 13.0, 7.0, 9.0, 10.0, 6.0, 5.0, 13.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.6316085457801819, -0.6122825741767883, -0.5929566025733948, -0.5736305713653564, -0.5543045997619629, -0.5349786281585693, -0.5156526565551758, -0.49632665514945984, -0.4770006537437439, -0.45767468214035034, -0.4383486807346344, -0.41902270913124084, -0.3996967077255249, -0.38037073612213135, -0.3610447645187378, -0.34171876311302185, -0.3223927915096283, -0.30306681990623474, -0.2837408185005188, -0.26441484689712524, -0.2450888454914093, -0.22576287388801575, -0.206436887383461, -0.18711090087890625, -0.1677849143743515, -0.14845892786979675, -0.129132941365242, -0.10980696231126785, -0.0904809758067131, -0.07115498930215836, -0.051829010248184204, -0.032503023743629456, -0.013177037239074707, 0.006148947402834892, 0.02547493204474449, 0.04480091482400894, 0.06412690132856369, 0.08345288783311844, 0.10277886688709259, 0.12210485339164734, 0.1414308398962021, 0.16075682640075684, 0.18008281290531158, 0.19940879940986633, 0.2187347710132599, 0.23806077241897583, 0.2573867440223694, 0.27671271562576294, 0.2960387170314789, 0.31536468863487244, 0.3346906900405884, 0.35401666164398193, 0.3733426630496979, 0.39266863465309143, 0.4119946360588074, 0.4313206076622009, 0.4506465792655945, 0.46997255086898804, 0.489298552274704, 0.5086245536804199, 0.5279505252838135, 0.547276496887207, 0.5666024684906006, 0.5859284400939941, 0.6052544713020325]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 7.0, 14.0, 12.0, 14.0, 25.0, 36.0, 48.0, 39.0, 59.0, 83.0, 118.0, 187.0, 244.0, 410.0, 601.0, 875.0, 1545.0, 2636.0, 4837.0, 8976.0, 17593.0, 34855.0, 74868.0, 178487.0, 523403.0, 1476474.0, 1205430.0, 395181.0, 143552.0, 61976.0, 29398.0, 14637.0, 7683.0, 3975.0, 2208.0, 1323.0, 803.0, 516.0, 329.0, 249.0, 158.0, 102.0, 80.0, 64.0, 47.0, 32.0, 23.0, 17.0, 14.0, 10.0, 10.0, 7.0, 3.0, 0.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.126953125, -0.1229705810546875, -0.118988037109375, -0.1150054931640625, -0.11102294921875, -0.1070404052734375, -0.103057861328125, -0.0990753173828125, -0.0950927734375, -0.0911102294921875, -0.087127685546875, -0.0831451416015625, -0.07916259765625, -0.0751800537109375, -0.071197509765625, -0.0672149658203125, -0.063232421875, -0.0592498779296875, -0.055267333984375, -0.0512847900390625, -0.04730224609375, -0.0433197021484375, -0.039337158203125, -0.0353546142578125, -0.0313720703125, -0.0273895263671875, -0.023406982421875, -0.0194244384765625, -0.01544189453125, -0.0114593505859375, -0.007476806640625, -0.0034942626953125, 0.00048828125, 0.0044708251953125, 0.008453369140625, 0.0124359130859375, 0.01641845703125, 0.0204010009765625, 0.024383544921875, 0.0283660888671875, 0.0323486328125, 0.0363311767578125, 0.040313720703125, 0.0442962646484375, 0.04827880859375, 0.0522613525390625, 0.056243896484375, 0.0602264404296875, 0.064208984375, 0.0681915283203125, 0.072174072265625, 0.0761566162109375, 0.08013916015625, 0.0841217041015625, 0.088104248046875, 0.0920867919921875, 0.0960693359375, 0.1000518798828125, 0.104034423828125, 0.1080169677734375, 0.11199951171875, 0.1159820556640625, 0.119964599609375, 0.1239471435546875, 0.1279296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 13.0, 14.0, 14.0, 17.0, 11.0, 14.0, 26.0, 28.0, 29.0, 29.0, 40.0, 39.0, 28.0, 42.0, 41.0, 43.0, 55.0, 38.0, 40.0, 39.0, 47.0, 29.0, 33.0, 33.0, 41.0, 27.0, 21.0, 24.0, 18.0, 21.0, 14.0, 15.0, 14.0, 10.0, 5.0, 10.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1046142578125, -0.10133075714111328, -0.09804725646972656, -0.09476375579833984, -0.09148025512695312, -0.0881967544555664, -0.08491325378417969, -0.08162975311279297, -0.07834625244140625, -0.07506275177001953, -0.07177925109863281, -0.0684957504272461, -0.06521224975585938, -0.061928749084472656, -0.05864524841308594, -0.05536174774169922, -0.0520782470703125, -0.04879474639892578, -0.04551124572753906, -0.042227745056152344, -0.038944244384765625, -0.035660743713378906, -0.03237724304199219, -0.02909374237060547, -0.02581024169921875, -0.02252674102783203, -0.019243240356445312, -0.015959739685058594, -0.012676239013671875, -0.009392738342285156, -0.0061092376708984375, -0.0028257369995117188, 0.000457763671875, 0.0037412643432617188, 0.0070247650146484375, 0.010308265686035156, 0.013591766357421875, 0.016875267028808594, 0.020158767700195312, 0.02344226837158203, 0.02672576904296875, 0.03000926971435547, 0.03329277038574219, 0.036576271057128906, 0.039859771728515625, 0.043143272399902344, 0.04642677307128906, 0.04971027374267578, 0.0529937744140625, 0.05627727508544922, 0.05956077575683594, 0.06284427642822266, 0.06612777709960938, 0.0694112777709961, 0.07269477844238281, 0.07597827911376953, 0.07926177978515625, 0.08254528045654297, 0.08582878112792969, 0.0891122817993164, 0.09239578247070312, 0.09567928314208984, 0.09896278381347656, 0.10224628448486328, 0.10552978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 11.0, 12.0, 20.0, 20.0, 33.0, 48.0, 61.0, 138.0, 194.0, 293.0, 526.0, 989.0, 1744.0, 3603.0, 7216.0, 16320.0, 38239.0, 94795.0, 267441.0, 1086910.0, 1942587.0, 481207.0, 150027.0, 57639.0, 23772.0, 10423.0, 4741.0, 2323.0, 1174.0, 709.0, 364.0, 246.0, 149.0, 90.0, 58.0, 47.0, 33.0, 22.0, 21.0, 10.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14647674560546875, -0.1410980224609375, -0.13571929931640625, -0.130340576171875, -0.12496185302734375, -0.1195831298828125, -0.11420440673828125, -0.10882568359375, -0.10344696044921875, -0.0980682373046875, -0.09268951416015625, -0.087310791015625, -0.08193206787109375, -0.0765533447265625, -0.07117462158203125, -0.0657958984375, -0.06041717529296875, -0.0550384521484375, -0.04965972900390625, -0.044281005859375, -0.03890228271484375, -0.0335235595703125, -0.02814483642578125, -0.02276611328125, -0.01738739013671875, -0.0120086669921875, -0.00662994384765625, -0.001251220703125, 0.00412750244140625, 0.0095062255859375, 0.01488494873046875, 0.020263671875, 0.02564239501953125, 0.0310211181640625, 0.03639984130859375, 0.041778564453125, 0.04715728759765625, 0.0525360107421875, 0.05791473388671875, 0.06329345703125, 0.06867218017578125, 0.0740509033203125, 0.07942962646484375, 0.084808349609375, 0.09018707275390625, 0.0955657958984375, 0.10094451904296875, 0.1063232421875, 0.11170196533203125, 0.1170806884765625, 0.12245941162109375, 0.127838134765625, 0.13321685791015625, 0.1385955810546875, 0.14397430419921875, 0.14935302734375, 0.15473175048828125, 0.1601104736328125, 0.16548919677734375, 0.170867919921875, 0.17624664306640625, 0.1816253662109375, 0.18700408935546875, 0.1923828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 5.0, 5.0, 12.0, 20.0, 20.0, 18.0, 40.0, 37.0, 47.0, 66.0, 67.0, 135.0, 162.0, 253.0, 347.0, 511.0, 611.0, 511.0, 351.0, 230.0, 152.0, 110.0, 95.0, 62.0, 43.0, 36.0, 29.0, 20.0, 16.0, 16.0, 5.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1730194091796875, -0.166473388671875, -0.1599273681640625, -0.15338134765625, -0.1468353271484375, -0.140289306640625, -0.1337432861328125, -0.127197265625, -0.1206512451171875, -0.114105224609375, -0.1075592041015625, -0.10101318359375, -0.0944671630859375, -0.087921142578125, -0.0813751220703125, -0.0748291015625, -0.0682830810546875, -0.061737060546875, -0.0551910400390625, -0.04864501953125, -0.0420989990234375, -0.035552978515625, -0.0290069580078125, -0.0224609375, -0.0159149169921875, -0.009368896484375, -0.0028228759765625, 0.00372314453125, 0.0102691650390625, 0.016815185546875, 0.0233612060546875, 0.0299072265625, 0.0364532470703125, 0.042999267578125, 0.0495452880859375, 0.05609130859375, 0.0626373291015625, 0.069183349609375, 0.0757293701171875, 0.082275390625, 0.0888214111328125, 0.095367431640625, 0.1019134521484375, 0.10845947265625, 0.1150054931640625, 0.121551513671875, 0.1280975341796875, 0.1346435546875, 0.1411895751953125, 0.147735595703125, 0.1542816162109375, 0.16082763671875, 0.1673736572265625, 0.173919677734375, 0.1804656982421875, 0.18701171875, 0.1935577392578125, 0.200103759765625, 0.2066497802734375, 0.21319580078125, 0.2197418212890625, 0.226287841796875, 0.2328338623046875, 0.2393798828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 15.0, 40.0, 92.0, 185.0, 225.0, 218.0, 147.0, 57.0, 17.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6309990882873535, -1.5492908954620361, -1.4675827026367188, -1.3858745098114014, -1.304166316986084, -1.2224581241607666, -1.1407500505447388, -1.0590418577194214, -0.977333664894104, -0.8956254720687866, -0.8139172792434692, -0.7322091460227966, -0.6505009531974792, -0.5687927603721619, -0.48708459734916687, -0.4053764343261719, -0.3236682415008545, -0.2419600635766983, -0.16025188565254211, -0.07854370772838593, 0.0031644701957702637, 0.08487266302108765, 0.16658082604408264, 0.24828898906707764, 0.329997181892395, 0.4117053747177124, 0.4934135377407074, 0.5751217007637024, 0.6568298935890198, 0.7385380864143372, 0.8202462196350098, 0.9019544124603271, 0.9836626052856445, 1.065370798110962, 1.1470789909362793, 1.2287871837615967, 1.310495376586914, 1.3922035694122314, 1.4739116430282593, 1.5556198358535767, 1.637328028678894, 1.7190362215042114, 1.8007444143295288, 1.8824526071548462, 1.964160680770874, 2.0458688735961914, 2.127577066421509, 2.209285259246826, 2.2909934520721436, 2.372701644897461, 2.4544098377227783, 2.5361180305480957, 2.617826223373413, 2.6995344161987305, 2.781242609024048, 2.8629508018493652, 2.9446587562561035, 3.026366949081421, 3.1080751419067383, 3.1897833347320557, 3.271491527557373, 3.3531997203826904, 3.434907913208008, 3.516615867614746, 3.5983242988586426]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 11.0, 8.0, 13.0, 14.0, 16.0, 18.0, 28.0, 18.0, 22.0, 21.0, 30.0, 43.0, 34.0, 34.0, 39.0, 40.0, 37.0, 46.0, 45.0, 28.0, 28.0, 49.0, 45.0, 21.0, 31.0, 32.0, 29.0, 29.0, 33.0, 19.0, 22.0, 21.0, 12.0, 19.0, 11.0, 11.0, 6.0, 8.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.7219914793968201, -0.7021827697753906, -0.6823740005493164, -0.662565290927887, -0.6427565217018127, -0.6229478120803833, -0.6031390428543091, -0.5833303332328796, -0.5635216236114502, -0.5437129139900208, -0.5239041447639465, -0.5040954351425171, -0.48428669571876526, -0.4644779562950134, -0.4446692168712616, -0.42486047744750977, -0.40505173802375793, -0.3852429986000061, -0.3654342591762543, -0.34562551975250244, -0.325816810131073, -0.30600807070732117, -0.28619933128356934, -0.2663906216621399, -0.24658186733722687, -0.22677312791347504, -0.2069644033908844, -0.18715566396713257, -0.16734692454338074, -0.1475382000207901, -0.12772946059703827, -0.10792073607444763, -0.0881119966506958, -0.06830326467752457, -0.048494528979063034, -0.0286857932806015, -0.008877061307430267, 0.010931670665740967, 0.030740410089492798, 0.050549134612083435, 0.07035787403583527, 0.0901666060090065, 0.10997533798217773, 0.12978407740592957, 0.1495928168296814, 0.16940154135227203, 0.18921028077602386, 0.2090190052986145, 0.22882774472236633, 0.24863648414611816, 0.26844522356987, 0.2882539629936218, 0.30806267261505127, 0.3278714120388031, 0.34768015146255493, 0.3674888610839844, 0.3872976303100586, 0.4071063697338104, 0.42691510915756226, 0.4467238187789917, 0.46653255820274353, 0.48634129762649536, 0.5061500072479248, 0.525958776473999, 0.5457674860954285]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 8.0, 20.0, 18.0, 32.0, 49.0, 61.0, 110.0, 160.0, 193.0, 319.0, 429.0, 683.0, 922.0, 1332.0, 1898.0, 2852.0, 3944.0, 5847.0, 8584.0, 13260.0, 22869.0, 48716.0, 136404.0, 348240.0, 270209.0, 92215.0, 35750.0, 18462.0, 11030.0, 7346.0, 5001.0, 3629.0, 2437.0, 1650.0, 1183.0, 818.0, 559.0, 374.0, 308.0, 210.0, 131.0, 94.0, 70.0, 61.0, 15.0, 19.0, 11.0, 7.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15436935424804688, -0.14919281005859375, -0.14401626586914062, -0.1388397216796875, -0.13366317749023438, -0.12848663330078125, -0.12331008911132812, -0.118133544921875, -0.11295700073242188, -0.10778045654296875, -0.10260391235351562, -0.0974273681640625, -0.09225082397460938, -0.08707427978515625, -0.08189773559570312, -0.07672119140625, -0.07154464721679688, -0.06636810302734375, -0.061191558837890625, -0.0560150146484375, -0.050838470458984375, -0.04566192626953125, -0.040485382080078125, -0.035308837890625, -0.030132293701171875, -0.02495574951171875, -0.019779205322265625, -0.0146026611328125, -0.009426116943359375, -0.00424957275390625, 0.000926971435546875, 0.006103515625, 0.011280059814453125, 0.01645660400390625, 0.021633148193359375, 0.0268096923828125, 0.031986236572265625, 0.03716278076171875, 0.042339324951171875, 0.047515869140625, 0.052692413330078125, 0.05786895751953125, 0.06304550170898438, 0.0682220458984375, 0.07339859008789062, 0.07857513427734375, 0.08375167846679688, 0.08892822265625, 0.09410476684570312, 0.09928131103515625, 0.10445785522460938, 0.1096343994140625, 0.11481094360351562, 0.11998748779296875, 0.12516403198242188, 0.130340576171875, 0.13551712036132812, 0.14069366455078125, 0.14587020874023438, 0.1510467529296875, 0.15622329711914062, 0.16139984130859375, 0.16657638549804688, 0.1717529296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 2.0, 7.0, 16.0, 15.0, 12.0, 13.0, 25.0, 21.0, 22.0, 29.0, 34.0, 31.0, 33.0, 36.0, 48.0, 28.0, 43.0, 42.0, 42.0, 41.0, 40.0, 42.0, 27.0, 37.0, 31.0, 26.0, 34.0, 33.0, 24.0, 28.0, 20.0, 16.0, 16.0, 8.0, 9.0, 12.0, 8.0, 8.0, 9.0, 3.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10955810546875, -0.10638427734375, -0.10321044921875, -0.10003662109375, -0.09686279296875, -0.09368896484375, -0.09051513671875, -0.08734130859375, -0.08416748046875, -0.08099365234375, -0.07781982421875, -0.07464599609375, -0.07147216796875, -0.06829833984375, -0.06512451171875, -0.06195068359375, -0.05877685546875, -0.05560302734375, -0.05242919921875, -0.04925537109375, -0.04608154296875, -0.04290771484375, -0.03973388671875, -0.03656005859375, -0.03338623046875, -0.03021240234375, -0.02703857421875, -0.02386474609375, -0.02069091796875, -0.01751708984375, -0.01434326171875, -0.01116943359375, -0.00799560546875, -0.00482177734375, -0.00164794921875, 0.00152587890625, 0.00469970703125, 0.00787353515625, 0.01104736328125, 0.01422119140625, 0.01739501953125, 0.02056884765625, 0.02374267578125, 0.02691650390625, 0.03009033203125, 0.03326416015625, 0.03643798828125, 0.03961181640625, 0.04278564453125, 0.04595947265625, 0.04913330078125, 0.05230712890625, 0.05548095703125, 0.05865478515625, 0.06182861328125, 0.06500244140625, 0.06817626953125, 0.07135009765625, 0.07452392578125, 0.07769775390625, 0.08087158203125, 0.08404541015625, 0.08721923828125, 0.09039306640625, 0.09356689453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 14.0, 23.0, 25.0, 49.0, 48.0, 72.0, 129.0, 185.0, 388.0, 688.0, 1419.0, 3359.0, 8594.0, 24478.0, 79511.0, 464894.0, 366803.0, 63964.0, 20441.0, 7582.0, 3066.0, 1251.0, 643.0, 347.0, 196.0, 122.0, 68.0, 56.0, 32.0, 25.0, 19.0, 12.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.29250335693359375, -0.2820281982421875, -0.27155303955078125, -0.261077880859375, -0.25060272216796875, -0.2401275634765625, -0.22965240478515625, -0.21917724609375, -0.20870208740234375, -0.1982269287109375, -0.18775177001953125, -0.177276611328125, -0.16680145263671875, -0.1563262939453125, -0.14585113525390625, -0.1353759765625, -0.12490081787109375, -0.1144256591796875, -0.10395050048828125, -0.093475341796875, -0.08300018310546875, -0.0725250244140625, -0.06204986572265625, -0.05157470703125, -0.04109954833984375, -0.0306243896484375, -0.02014923095703125, -0.009674072265625, 0.00080108642578125, 0.0112762451171875, 0.02175140380859375, 0.0322265625, 0.04270172119140625, 0.0531768798828125, 0.06365203857421875, 0.074127197265625, 0.08460235595703125, 0.0950775146484375, 0.10555267333984375, 0.11602783203125, 0.12650299072265625, 0.1369781494140625, 0.14745330810546875, 0.157928466796875, 0.16840362548828125, 0.1788787841796875, 0.18935394287109375, 0.1998291015625, 0.21030426025390625, 0.2207794189453125, 0.23125457763671875, 0.241729736328125, 0.25220489501953125, 0.2626800537109375, 0.27315521240234375, 0.28363037109375, 0.29410552978515625, 0.3045806884765625, 0.31505584716796875, 0.325531005859375, 0.33600616455078125, 0.3464813232421875, 0.35695648193359375, 0.367431640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 11.0, 18.0, 18.0, 21.0, 31.0, 26.0, 40.0, 33.0, 41.0, 46.0, 42.0, 38.0, 41.0, 48.0, 37.0, 42.0, 49.0, 53.0, 42.0, 31.0, 50.0, 31.0, 27.0, 17.0, 28.0, 18.0, 22.0, 18.0, 12.0, 10.0, 5.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.335205078125, -0.32517242431640625, -0.3151397705078125, -0.30510711669921875, -0.295074462890625, -0.28504180908203125, -0.2750091552734375, -0.26497650146484375, -0.25494384765625, -0.24491119384765625, -0.2348785400390625, -0.22484588623046875, -0.214813232421875, -0.20478057861328125, -0.1947479248046875, -0.18471527099609375, -0.1746826171875, -0.16464996337890625, -0.1546173095703125, -0.14458465576171875, -0.134552001953125, -0.12451934814453125, -0.1144866943359375, -0.10445404052734375, -0.09442138671875, -0.08438873291015625, -0.0743560791015625, -0.06432342529296875, -0.054290771484375, -0.04425811767578125, -0.0342254638671875, -0.02419281005859375, -0.01416015625, -0.00412750244140625, 0.0059051513671875, 0.01593780517578125, 0.025970458984375, 0.03600311279296875, 0.0460357666015625, 0.05606842041015625, 0.06610107421875, 0.07613372802734375, 0.0861663818359375, 0.09619903564453125, 0.106231689453125, 0.11626434326171875, 0.1262969970703125, 0.13632965087890625, 0.1463623046875, 0.15639495849609375, 0.1664276123046875, 0.17646026611328125, 0.186492919921875, 0.19652557373046875, 0.2065582275390625, 0.21659088134765625, 0.22662353515625, 0.23665618896484375, 0.2466888427734375, 0.25672149658203125, 0.266754150390625, 0.27678680419921875, 0.2868194580078125, 0.29685211181640625, 0.306884765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 6.0, 10.0, 14.0, 41.0, 30.0, 67.0, 94.0, 184.0, 253.0, 415.0, 626.0, 1045.0, 1777.0, 2726.0, 4390.0, 7065.0, 11889.0, 22422.0, 50067.0, 141150.0, 364062.0, 271221.0, 91526.0, 35209.0, 17059.0, 9501.0, 5803.0, 3706.0, 2341.0, 1444.0, 867.0, 556.0, 360.0, 228.0, 118.0, 89.0, 69.0, 38.0, 29.0, 5.0, 14.0, 8.0, 6.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.06531333923339844, -0.06312179565429688, -0.06093025207519531, -0.05873870849609375, -0.05654716491699219, -0.054355621337890625, -0.05216407775878906, -0.0499725341796875, -0.04778099060058594, -0.045589447021484375, -0.04339790344238281, -0.04120635986328125, -0.03901481628417969, -0.036823272705078125, -0.03463172912597656, -0.032440185546875, -0.030248641967773438, -0.028057098388671875, -0.025865554809570312, -0.02367401123046875, -0.021482467651367188, -0.019290924072265625, -0.017099380493164062, -0.0149078369140625, -0.012716293334960938, -0.010524749755859375, -0.008333206176757812, -0.00614166259765625, -0.0039501190185546875, -0.001758575439453125, 0.0004329681396484375, 0.00262451171875, 0.0048160552978515625, 0.007007598876953125, 0.009199142456054688, 0.01139068603515625, 0.013582229614257812, 0.015773773193359375, 0.017965316772460938, 0.0201568603515625, 0.022348403930664062, 0.024539947509765625, 0.026731491088867188, 0.02892303466796875, 0.031114578247070312, 0.033306121826171875, 0.03549766540527344, 0.037689208984375, 0.03988075256347656, 0.042072296142578125, 0.04426383972167969, 0.04645538330078125, 0.04864692687988281, 0.050838470458984375, 0.05303001403808594, 0.0552215576171875, 0.05741310119628906, 0.059604644775390625, 0.06179618835449219, 0.06398773193359375, 0.06617927551269531, 0.06837081909179688, 0.07056236267089844, 0.07275390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 5.0, 14.0, 13.0, 18.0, 33.0, 63.0, 107.0, 179.0, 213.0, 137.0, 84.0, 45.0, 22.0, 19.0, 10.0, 4.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4776668548583984e-05, -5.330517888069153e-05, -5.183368921279907e-05, -5.0362199544906616e-05, -4.889070987701416e-05, -4.7419220209121704e-05, -4.594773054122925e-05, -4.447624087333679e-05, -4.3004751205444336e-05, -4.153326153755188e-05, -4.0061771869659424e-05, -3.859028220176697e-05, -3.711879253387451e-05, -3.5647302865982056e-05, -3.41758131980896e-05, -3.2704323530197144e-05, -3.123283386230469e-05, -2.976134419441223e-05, -2.8289854526519775e-05, -2.681836485862732e-05, -2.5346875190734863e-05, -2.3875385522842407e-05, -2.240389585494995e-05, -2.0932406187057495e-05, -1.946091651916504e-05, -1.7989426851272583e-05, -1.6517937183380127e-05, -1.5046447515487671e-05, -1.3574957847595215e-05, -1.2103468179702759e-05, -1.0631978511810303e-05, -9.160488843917847e-06, -7.68899917602539e-06, -6.2175095081329346e-06, -4.7460198402404785e-06, -3.2745301723480225e-06, -1.8030405044555664e-06, -3.3155083656311035e-07, 1.1399388313293457e-06, 2.6114284992218018e-06, 4.082918167114258e-06, 5.554407835006714e-06, 7.02589750289917e-06, 8.497387170791626e-06, 9.968876838684082e-06, 1.1440366506576538e-05, 1.2911856174468994e-05, 1.438334584236145e-05, 1.5854835510253906e-05, 1.7326325178146362e-05, 1.879781484603882e-05, 2.0269304513931274e-05, 2.174079418182373e-05, 2.3212283849716187e-05, 2.4683773517608643e-05, 2.61552631855011e-05, 2.7626752853393555e-05, 2.909824252128601e-05, 3.056973218917847e-05, 3.204122185707092e-05, 3.351271152496338e-05, 3.4984201192855835e-05, 3.645569086074829e-05, 3.792718052864075e-05, 3.93986701965332e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 9.0, 14.0, 28.0, 46.0, 58.0, 95.0, 157.0, 355.0, 745.0, 1794.0, 4671.0, 12836.0, 41780.0, 208976.0, 533179.0, 186131.0, 38395.0, 11722.0, 4449.0, 1687.0, 654.0, 345.0, 151.0, 108.0, 63.0, 39.0, 18.0, 16.0, 10.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1112060546875, -0.10767173767089844, -0.10413742065429688, -0.10060310363769531, -0.09706878662109375, -0.09353446960449219, -0.09000015258789062, -0.08646583557128906, -0.0829315185546875, -0.07939720153808594, -0.07586288452148438, -0.07232856750488281, -0.06879425048828125, -0.06525993347167969, -0.061725616455078125, -0.05819129943847656, -0.054656982421875, -0.05112266540527344, -0.047588348388671875, -0.04405403137207031, -0.04051971435546875, -0.03698539733886719, -0.033451080322265625, -0.029916763305664062, -0.0263824462890625, -0.022848129272460938, -0.019313812255859375, -0.015779495239257812, -0.01224517822265625, -0.008710861206054688, -0.005176544189453125, -0.0016422271728515625, 0.00189208984375, 0.0054264068603515625, 0.008960723876953125, 0.012495040893554688, 0.01602935791015625, 0.019563674926757812, 0.023097991943359375, 0.026632308959960938, 0.0301666259765625, 0.03370094299316406, 0.037235260009765625, 0.04076957702636719, 0.04430389404296875, 0.04783821105957031, 0.051372528076171875, 0.05490684509277344, 0.058441162109375, 0.06197547912597656, 0.06550979614257812, 0.06904411315917969, 0.07257843017578125, 0.07611274719238281, 0.07964706420898438, 0.08318138122558594, 0.0867156982421875, 0.09025001525878906, 0.09378433227539062, 0.09731864929199219, 0.10085296630859375, 0.10438728332519531, 0.10792160034179688, 0.11145591735839844, 0.114990234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 8.0, 13.0, 12.0, 17.0, 19.0, 31.0, 27.0, 36.0, 46.0, 57.0, 48.0, 85.0, 72.0, 64.0, 77.0, 60.0, 58.0, 36.0, 39.0, 37.0, 31.0, 21.0, 13.0, 13.0, 12.0, 10.0, 7.0, 4.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.06573486328125, -0.06371688842773438, -0.06169891357421875, -0.059680938720703125, -0.0576629638671875, -0.055644989013671875, -0.05362701416015625, -0.051609039306640625, -0.049591064453125, -0.047573089599609375, -0.04555511474609375, -0.043537139892578125, -0.0415191650390625, -0.039501190185546875, -0.03748321533203125, -0.035465240478515625, -0.033447265625, -0.031429290771484375, -0.02941131591796875, -0.027393341064453125, -0.0253753662109375, -0.023357391357421875, -0.02133941650390625, -0.019321441650390625, -0.017303466796875, -0.015285491943359375, -0.01326751708984375, -0.011249542236328125, -0.0092315673828125, -0.007213592529296875, -0.00519561767578125, -0.003177642822265625, -0.00115966796875, 0.000858306884765625, 0.00287628173828125, 0.004894256591796875, 0.0069122314453125, 0.008930206298828125, 0.01094818115234375, 0.012966156005859375, 0.014984130859375, 0.017002105712890625, 0.01902008056640625, 0.021038055419921875, 0.0230560302734375, 0.025074005126953125, 0.02709197998046875, 0.029109954833984375, 0.0311279296875, 0.033145904541015625, 0.03516387939453125, 0.037181854248046875, 0.0391998291015625, 0.041217803955078125, 0.04323577880859375, 0.045253753662109375, 0.047271728515625, 0.049289703369140625, 0.05130767822265625, 0.053325653076171875, 0.0553436279296875, 0.057361602783203125, 0.05937957763671875, 0.061397552490234375, 0.06341552734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 26.0, 61.0, 77.0, 169.0, 182.0, 161.0, 128.0, 82.0, 39.0, 25.0, 10.0, 9.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6487930417060852, -0.6004930734634399, -0.5521931052207947, -0.5038931369781494, -0.4555931091308594, -0.4072931408882141, -0.35899317264556885, -0.3106931746006012, -0.26239320635795593, -0.21409322321414948, -0.16579324007034302, -0.11749327182769775, -0.0691932886838913, -0.02089330554008484, 0.027406662702560425, 0.07570666074752808, 0.12400662899017334, 0.1723066121339798, 0.22060659527778625, 0.2689065635204315, 0.31720656156539917, 0.36550652980804443, 0.4138064980506897, 0.46210649609565735, 0.510406494140625, 0.5587064623832703, 0.6070064306259155, 0.6553064584732056, 0.7036064267158508, 0.7519063949584961, 0.8002063632011414, 0.8485063314437866, 0.8968063592910767, 0.9451063275337219, 0.9934062957763672, 1.0417063236236572, 1.0900062322616577, 1.1383062601089478, 1.1866061687469482, 1.2349061965942383, 1.2832062244415283, 1.3315062522888184, 1.3798061609268188, 1.4281061887741089, 1.4764060974121094, 1.5247061252593994, 1.5730061531066895, 1.62130606174469, 1.6696059703826904, 1.7179059982299805, 1.766205906867981, 1.814505934715271, 1.8628058433532715, 1.9111058712005615, 1.9594058990478516, 2.0077059268951416, 2.0560059547424316, 2.1043059825897217, 2.1526060104370117, 2.2009057998657227, 2.2492058277130127, 2.2975058555603027, 2.3458058834075928, 2.394105911254883, 2.4424057006835938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 8.0, 3.0, 6.0, 14.0, 15.0, 14.0, 23.0, 20.0, 20.0, 19.0, 22.0, 24.0, 37.0, 31.0, 31.0, 34.0, 41.0, 46.0, 52.0, 35.0, 35.0, 46.0, 39.0, 31.0, 32.0, 34.0, 24.0, 32.0, 23.0, 20.0, 27.0, 26.0, 28.0, 15.0, 18.0, 10.0, 6.0, 7.0, 11.0, 6.0, 4.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.717904269695282, -0.6953877210617065, -0.6728712320327759, -0.6503546833992004, -0.627838134765625, -0.6053216457366943, -0.5828050971031189, -0.5602885484695435, -0.5377720594406128, -0.5152555108070374, -0.4927389919757843, -0.47022247314453125, -0.4477059245109558, -0.42518940567970276, -0.4026728868484497, -0.38015633821487427, -0.35763978958129883, -0.3351232707500458, -0.31260672211647034, -0.2900902032852173, -0.26757365465164185, -0.2450571358203888, -0.22254061698913574, -0.2000240832567215, -0.17750754952430725, -0.154991015791893, -0.13247448205947876, -0.10995796322822571, -0.08744142949581146, -0.06492489576339722, -0.042408376932144165, -0.01989184319972992, 0.002624690532684326, 0.025141220539808273, 0.04765775054693222, 0.07017427682876587, 0.09269081056118011, 0.11520734429359436, 0.1377238631248474, 0.16024039685726166, 0.1827569305896759, 0.20527346432209015, 0.2277899980545044, 0.25030651688575745, 0.2728230357170105, 0.29533958435058594, 0.317856103181839, 0.34037262201309204, 0.3628891706466675, 0.38540568947792053, 0.40792223811149597, 0.430438756942749, 0.45295530557632446, 0.4754718244075775, 0.49798834323883057, 0.520504891872406, 0.5430214405059814, 0.5655379891395569, 0.5880544781684875, 0.610571026802063, 0.6330875754356384, 0.6556041240692139, 0.6781206130981445, 0.70063716173172, 0.7231536507606506]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 3.0, 10.0, 22.0, 26.0, 43.0, 49.0, 59.0, 86.0, 141.0, 221.0, 329.0, 515.0, 807.0, 1442.0, 2449.0, 4382.0, 7913.0, 14878.0, 29022.0, 62745.0, 154527.0, 465585.0, 1352727.0, 1342342.0, 471229.0, 157614.0, 62805.0, 29336.0, 14949.0, 7827.0, 4169.0, 2448.0, 1343.0, 849.0, 477.0, 323.0, 197.0, 106.0, 91.0, 63.0, 36.0, 26.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.1326904296875, -0.12854385375976562, -0.12439727783203125, -0.12025070190429688, -0.1161041259765625, -0.11195755004882812, -0.10781097412109375, -0.10366439819335938, -0.099517822265625, -0.09537124633789062, -0.09122467041015625, -0.08707809448242188, -0.0829315185546875, -0.07878494262695312, -0.07463836669921875, -0.07049179077148438, -0.06634521484375, -0.062198638916015625, -0.05805206298828125, -0.053905487060546875, -0.0497589111328125, -0.045612335205078125, -0.04146575927734375, -0.037319183349609375, -0.033172607421875, -0.029026031494140625, -0.02487945556640625, -0.020732879638671875, -0.0165863037109375, -0.012439727783203125, -0.00829315185546875, -0.004146575927734375, 0.0, 0.004146575927734375, 0.00829315185546875, 0.012439727783203125, 0.0165863037109375, 0.020732879638671875, 0.02487945556640625, 0.029026031494140625, 0.033172607421875, 0.037319183349609375, 0.04146575927734375, 0.045612335205078125, 0.0497589111328125, 0.053905487060546875, 0.05805206298828125, 0.062198638916015625, 0.06634521484375, 0.07049179077148438, 0.07463836669921875, 0.07878494262695312, 0.0829315185546875, 0.08707809448242188, 0.09122467041015625, 0.09537124633789062, 0.099517822265625, 0.10366439819335938, 0.10781097412109375, 0.11195755004882812, 0.1161041259765625, 0.12025070190429688, 0.12439727783203125, 0.12854385375976562, 0.1326904296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 8.0, 17.0, 27.0, 16.0, 30.0, 14.0, 31.0, 31.0, 27.0, 36.0, 39.0, 41.0, 46.0, 52.0, 53.0, 46.0, 41.0, 42.0, 48.0, 43.0, 35.0, 31.0, 35.0, 33.0, 22.0, 28.0, 19.0, 14.0, 12.0, 8.0, 9.0, 5.0, 6.0, 11.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.118408203125, -0.11446189880371094, -0.11051559448242188, -0.10656929016113281, -0.10262298583984375, -0.09867668151855469, -0.09473037719726562, -0.09078407287597656, -0.0868377685546875, -0.08289146423339844, -0.07894515991210938, -0.07499885559082031, -0.07105255126953125, -0.06710624694824219, -0.06315994262695312, -0.05921363830566406, -0.055267333984375, -0.05132102966308594, -0.047374725341796875, -0.04342842102050781, -0.03948211669921875, -0.03553581237792969, -0.031589508056640625, -0.027643203735351562, -0.0236968994140625, -0.019750595092773438, -0.015804290771484375, -0.011857986450195312, -0.00791168212890625, -0.0039653778076171875, -1.9073486328125e-05, 0.0039272308349609375, 0.00787353515625, 0.011819839477539062, 0.015766143798828125, 0.019712448120117188, 0.02365875244140625, 0.027605056762695312, 0.031551361083984375, 0.03549766540527344, 0.0394439697265625, 0.04339027404785156, 0.047336578369140625, 0.05128288269042969, 0.05522918701171875, 0.05917549133300781, 0.06312179565429688, 0.06706809997558594, 0.071014404296875, 0.07496070861816406, 0.07890701293945312, 0.08285331726074219, 0.08679962158203125, 0.09074592590332031, 0.09469223022460938, 0.09863853454589844, 0.1025848388671875, 0.10653114318847656, 0.11047744750976562, 0.11442375183105469, 0.11837005615234375, 0.12231636047363281, 0.12626266479492188, 0.13020896911621094, 0.1341552734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 20.0, 29.0, 56.0, 56.0, 89.0, 177.0, 390.0, 661.0, 1606.0, 4762.0, 18684.0, 90418.0, 731318.0, 2970468.0, 308852.0, 49804.0, 11175.0, 3234.0, 1254.0, 534.0, 274.0, 156.0, 101.0, 51.0, 38.0, 21.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3769569396972656, -0.36597442626953125, -0.3549919128417969, -0.3440093994140625, -0.3330268859863281, -0.32204437255859375, -0.3110618591308594, -0.300079345703125, -0.2890968322753906, -0.27811431884765625, -0.2671318054199219, -0.2561492919921875, -0.24516677856445312, -0.23418426513671875, -0.22320175170898438, -0.21221923828125, -0.20123672485351562, -0.19025421142578125, -0.17927169799804688, -0.1682891845703125, -0.15730667114257812, -0.14632415771484375, -0.13534164428710938, -0.124359130859375, -0.11337661743164062, -0.10239410400390625, -0.09141159057617188, -0.0804290771484375, -0.06944656372070312, -0.05846405029296875, -0.047481536865234375, -0.0364990234375, -0.025516510009765625, -0.01453399658203125, -0.003551483154296875, 0.0074310302734375, 0.018413543701171875, 0.02939605712890625, 0.040378570556640625, 0.051361083984375, 0.062343597412109375, 0.07332611083984375, 0.08430862426757812, 0.0952911376953125, 0.10627365112304688, 0.11725616455078125, 0.12823867797851562, 0.13922119140625, 0.15020370483398438, 0.16118621826171875, 0.17216873168945312, 0.1831512451171875, 0.19413375854492188, 0.20511627197265625, 0.21609878540039062, 0.227081298828125, 0.23806381225585938, 0.24904632568359375, 0.2600288391113281, 0.2710113525390625, 0.2819938659667969, 0.29297637939453125, 0.3039588928222656, 0.31494140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 14.0, 29.0, 45.0, 53.0, 69.0, 122.0, 157.0, 283.0, 509.0, 762.0, 799.0, 498.0, 242.0, 153.0, 109.0, 68.0, 42.0, 28.0, 13.0, 18.0, 11.0, 2.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.364013671875, -0.3536109924316406, -0.34320831298828125, -0.3328056335449219, -0.3224029541015625, -0.3120002746582031, -0.30159759521484375, -0.2911949157714844, -0.280792236328125, -0.2703895568847656, -0.25998687744140625, -0.24958419799804688, -0.2391815185546875, -0.22877883911132812, -0.21837615966796875, -0.20797348022460938, -0.19757080078125, -0.18716812133789062, -0.17676544189453125, -0.16636276245117188, -0.1559600830078125, -0.14555740356445312, -0.13515472412109375, -0.12475204467773438, -0.114349365234375, -0.10394668579101562, -0.09354400634765625, -0.08314132690429688, -0.0727386474609375, -0.062335968017578125, -0.05193328857421875, -0.041530609130859375, -0.0311279296875, -0.020725250244140625, -0.01032257080078125, 8.0108642578125e-05, 0.0104827880859375, 0.020885467529296875, 0.03128814697265625, 0.041690826416015625, 0.052093505859375, 0.062496185302734375, 0.07289886474609375, 0.08330154418945312, 0.0937042236328125, 0.10410690307617188, 0.11450958251953125, 0.12491226196289062, 0.13531494140625, 0.14571762084960938, 0.15612030029296875, 0.16652297973632812, 0.1769256591796875, 0.18732833862304688, 0.19773101806640625, 0.20813369750976562, 0.218536376953125, 0.22893905639648438, 0.23934173583984375, 0.24974441528320312, 0.2601470947265625, 0.2705497741699219, 0.28095245361328125, 0.2913551330566406, 0.3017578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 29.0, 65.0, 140.0, 196.0, 223.0, 164.0, 100.0, 45.0, 14.0, 11.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835303783416748, -1.805909514427185, -1.7282886505126953, -1.6506679058074951, -1.5730470418930054, -1.4954261779785156, -1.4178054332733154, -1.3401845693588257, -1.262563705444336, -1.1849428415298462, -1.1073219776153564, -1.0297012329101562, -0.9520803689956665, -0.8744595050811768, -0.7968387007713318, -0.7192178964614868, -0.6415970325469971, -0.5639761686325073, -0.48635536432266235, -0.408734530210495, -0.33111369609832764, -0.2534928619861603, -0.17587202787399292, -0.09825122356414795, -0.020630359649658203, 0.056990474462509155, 0.1346113085746765, 0.21223214268684387, 0.28985297679901123, 0.3674738109111786, 0.44509464502334595, 0.5227154493331909, 0.6003363132476807, 0.6779571771621704, 0.7555779814720154, 0.8331987857818604, 0.9108196496963501, 0.9884405136108398, 1.06606125831604, 1.1436821222305298, 1.2213029861450195, 1.2989238500595093, 1.376544713973999, 1.4541654586791992, 1.531786322593689, 1.6094071865081787, 1.687027931213379, 1.7646487951278687, 1.8422696590423584, 1.9198905229568481, 1.997511386871338, 2.075132131576538, 2.1527528762817383, 2.2303738594055176, 2.3079946041107178, 2.385615348815918, 2.4632363319396973, 2.5408570766448975, 2.6184780597686768, 2.696098804473877, 2.7737197875976562, 2.8513405323028564, 2.9289612770080566, 3.006582260131836, 3.084203004837036]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 10.0, 13.0, 17.0, 19.0, 26.0, 22.0, 24.0, 36.0, 37.0, 35.0, 36.0, 49.0, 42.0, 53.0, 51.0, 54.0, 42.0, 50.0, 52.0, 33.0, 34.0, 40.0, 25.0, 31.0, 22.0, 18.0, 16.0, 25.0, 20.0, 8.0, 4.0, 8.0, 6.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.9486741423606873, -0.9223785996437073, -0.8960829973220825, -0.8697874546051025, -0.8434919118881226, -0.8171963095664978, -0.7909007668495178, -0.7646051645278931, -0.7383096218109131, -0.7120140790939331, -0.6857184767723083, -0.6594229340553284, -0.6331273317337036, -0.6068317890167236, -0.5805362462997437, -0.5542407035827637, -0.5279451012611389, -0.5016495585441589, -0.4753539562225342, -0.4490584135055542, -0.42276284098625183, -0.39646726846694946, -0.3701717257499695, -0.3438761532306671, -0.31758058071136475, -0.2912850081920624, -0.26498943567276, -0.23869389295578003, -0.21239832043647766, -0.1861027479171753, -0.15980719029903412, -0.13351163268089294, -0.10721606016159058, -0.0809204950928688, -0.054624930024147034, -0.028329364955425262, -0.002033799886703491, 0.024261772632598877, 0.05055733025074005, 0.07685288786888123, 0.1031484603881836, 0.12944403290748596, 0.15573959052562714, 0.1820351481437683, 0.20833072066307068, 0.23462629318237305, 0.260921835899353, 0.2872174084186554, 0.31351298093795776, 0.33980855345726013, 0.3661041259765625, 0.3923996686935425, 0.41869524121284485, 0.4449908137321472, 0.4712863564491272, 0.49758192896842957, 0.5238775014877319, 0.5501730442047119, 0.5764686465263367, 0.6027641892433167, 0.6290597915649414, 0.6553553342819214, 0.6816508769989014, 0.7079464197158813, 0.7342420220375061]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 6.0, 11.0, 16.0, 29.0, 53.0, 57.0, 107.0, 159.0, 276.0, 426.0, 721.0, 1181.0, 1899.0, 3057.0, 5000.0, 8060.0, 12760.0, 21578.0, 39007.0, 88152.0, 240203.0, 340697.0, 153230.0, 58605.0, 28941.0, 16946.0, 10506.0, 6456.0, 4076.0, 2340.0, 1556.0, 900.0, 560.0, 360.0, 223.0, 139.0, 87.0, 55.0, 39.0, 19.0, 20.0, 5.0, 9.0, 1.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.180908203125, -0.17530250549316406, -0.16969680786132812, -0.1640911102294922, -0.15848541259765625, -0.1528797149658203, -0.14727401733398438, -0.14166831970214844, -0.1360626220703125, -0.13045692443847656, -0.12485122680664062, -0.11924552917480469, -0.11363983154296875, -0.10803413391113281, -0.10242843627929688, -0.09682273864746094, -0.091217041015625, -0.08561134338378906, -0.08000564575195312, -0.07439994812011719, -0.06879425048828125, -0.06318855285644531, -0.057582855224609375, -0.05197715759277344, -0.0463714599609375, -0.04076576232910156, -0.035160064697265625, -0.029554367065429688, -0.02394866943359375, -0.018342971801757812, -0.012737274169921875, -0.0071315765380859375, -0.00152587890625, 0.0040798187255859375, 0.009685516357421875, 0.015291213989257812, 0.02089691162109375, 0.026502609252929688, 0.032108306884765625, 0.03771400451660156, 0.0433197021484375, 0.04892539978027344, 0.054531097412109375, 0.06013679504394531, 0.06574249267578125, 0.07134819030761719, 0.07695388793945312, 0.08255958557128906, 0.088165283203125, 0.09377098083496094, 0.09937667846679688, 0.10498237609863281, 0.11058807373046875, 0.11619377136230469, 0.12179946899414062, 0.12740516662597656, 0.1330108642578125, 0.13861656188964844, 0.14422225952148438, 0.1498279571533203, 0.15543365478515625, 0.1610393524169922, 0.16664505004882812, 0.17225074768066406, 0.1778564453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 2.0, 11.0, 6.0, 4.0, 17.0, 14.0, 18.0, 18.0, 19.0, 21.0, 29.0, 20.0, 23.0, 35.0, 42.0, 37.0, 39.0, 44.0, 49.0, 44.0, 28.0, 41.0, 51.0, 34.0, 35.0, 38.0, 31.0, 26.0, 34.0, 25.0, 24.0, 25.0, 22.0, 20.0, 10.0, 13.0, 12.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.12310791015625, -0.11937522888183594, -0.11564254760742188, -0.11190986633300781, -0.10817718505859375, -0.10444450378417969, -0.10071182250976562, -0.09697914123535156, -0.0932464599609375, -0.08951377868652344, -0.08578109741210938, -0.08204841613769531, -0.07831573486328125, -0.07458305358886719, -0.07085037231445312, -0.06711769104003906, -0.063385009765625, -0.05965232849121094, -0.055919647216796875, -0.05218696594238281, -0.04845428466796875, -0.04472160339355469, -0.040988922119140625, -0.03725624084472656, -0.0335235595703125, -0.029790878295898438, -0.026058197021484375, -0.022325515747070312, -0.01859283447265625, -0.014860153198242188, -0.011127471923828125, -0.0073947906494140625, -0.003662109375, 7.05718994140625e-05, 0.003803253173828125, 0.0075359344482421875, 0.01126861572265625, 0.015001296997070312, 0.018733978271484375, 0.022466659545898438, 0.0261993408203125, 0.029932022094726562, 0.033664703369140625, 0.03739738464355469, 0.04113006591796875, 0.04486274719238281, 0.048595428466796875, 0.05232810974121094, 0.056060791015625, 0.05979347229003906, 0.06352615356445312, 0.06725883483886719, 0.07099151611328125, 0.07472419738769531, 0.07845687866210938, 0.08218955993652344, 0.0859222412109375, 0.08965492248535156, 0.09338760375976562, 0.09712028503417969, 0.10085296630859375, 0.10458564758300781, 0.10831832885742188, 0.11205101013183594, 0.11578369140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 10.0, 6.0, 14.0, 17.0, 21.0, 41.0, 48.0, 62.0, 98.0, 161.0, 260.0, 471.0, 866.0, 1653.0, 3720.0, 9364.0, 25559.0, 91191.0, 548435.0, 285467.0, 52052.0, 16807.0, 6495.0, 2730.0, 1303.0, 680.0, 374.0, 237.0, 131.0, 74.0, 77.0, 42.0, 25.0, 17.0, 8.0, 11.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34765625, -0.334686279296875, -0.32171630859375, -0.308746337890625, -0.2957763671875, -0.282806396484375, -0.26983642578125, -0.256866455078125, -0.243896484375, -0.230926513671875, -0.21795654296875, -0.204986572265625, -0.1920166015625, -0.179046630859375, -0.16607666015625, -0.153106689453125, -0.14013671875, -0.127166748046875, -0.11419677734375, -0.101226806640625, -0.0882568359375, -0.075286865234375, -0.06231689453125, -0.049346923828125, -0.036376953125, -0.023406982421875, -0.01043701171875, 0.002532958984375, 0.0155029296875, 0.028472900390625, 0.04144287109375, 0.054412841796875, 0.0673828125, 0.080352783203125, 0.09332275390625, 0.106292724609375, 0.1192626953125, 0.132232666015625, 0.14520263671875, 0.158172607421875, 0.171142578125, 0.184112548828125, 0.19708251953125, 0.210052490234375, 0.2230224609375, 0.235992431640625, 0.24896240234375, 0.261932373046875, 0.27490234375, 0.287872314453125, 0.30084228515625, 0.313812255859375, 0.3267822265625, 0.339752197265625, 0.35272216796875, 0.365692138671875, 0.378662109375, 0.391632080078125, 0.40460205078125, 0.417572021484375, 0.4305419921875, 0.443511962890625, 0.45648193359375, 0.469451904296875, 0.482421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 9.0, 11.0, 13.0, 15.0, 28.0, 21.0, 32.0, 28.0, 24.0, 44.0, 48.0, 41.0, 56.0, 47.0, 59.0, 53.0, 62.0, 55.0, 55.0, 47.0, 33.0, 30.0, 42.0, 24.0, 24.0, 15.0, 9.0, 10.0, 12.0, 9.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.4349822998046875, -0.419769287109375, -0.4045562744140625, -0.38934326171875, -0.3741302490234375, -0.358917236328125, -0.3437042236328125, -0.3284912109375, -0.3132781982421875, -0.298065185546875, -0.2828521728515625, -0.26763916015625, -0.2524261474609375, -0.237213134765625, -0.2220001220703125, -0.206787109375, -0.1915740966796875, -0.176361083984375, -0.1611480712890625, -0.14593505859375, -0.1307220458984375, -0.115509033203125, -0.1002960205078125, -0.0850830078125, -0.0698699951171875, -0.054656982421875, -0.0394439697265625, -0.02423095703125, -0.0090179443359375, 0.006195068359375, 0.0214080810546875, 0.03662109375, 0.0518341064453125, 0.067047119140625, 0.0822601318359375, 0.09747314453125, 0.1126861572265625, 0.127899169921875, 0.1431121826171875, 0.1583251953125, 0.1735382080078125, 0.188751220703125, 0.2039642333984375, 0.21917724609375, 0.2343902587890625, 0.249603271484375, 0.2648162841796875, 0.280029296875, 0.2952423095703125, 0.310455322265625, 0.3256683349609375, 0.34088134765625, 0.3560943603515625, 0.371307373046875, 0.3865203857421875, 0.4017333984375, 0.4169464111328125, 0.432159423828125, 0.4473724365234375, 0.46258544921875, 0.4777984619140625, 0.493011474609375, 0.5082244873046875, 0.5234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 7.0, 19.0, 25.0, 40.0, 51.0, 91.0, 105.0, 168.0, 247.0, 437.0, 761.0, 1315.0, 2167.0, 4218.0, 7880.0, 15904.0, 34397.0, 93727.0, 422143.0, 329675.0, 76391.0, 29011.0, 13827.0, 7158.0, 3748.0, 2086.0, 1196.0, 659.0, 397.0, 243.0, 172.0, 75.0, 73.0, 47.0, 26.0, 16.0, 14.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.11279296875, -0.10936546325683594, -0.10593795776367188, -0.10251045227050781, -0.09908294677734375, -0.09565544128417969, -0.09222793579101562, -0.08880043029785156, -0.0853729248046875, -0.08194541931152344, -0.07851791381835938, -0.07509040832519531, -0.07166290283203125, -0.06823539733886719, -0.06480789184570312, -0.06138038635253906, -0.057952880859375, -0.05452537536621094, -0.051097869873046875, -0.04767036437988281, -0.04424285888671875, -0.04081535339355469, -0.037387847900390625, -0.03396034240722656, -0.0305328369140625, -0.027105331420898438, -0.023677825927734375, -0.020250320434570312, -0.01682281494140625, -0.013395309448242188, -0.009967803955078125, -0.0065402984619140625, -0.00311279296875, 0.0003147125244140625, 0.003742218017578125, 0.0071697235107421875, 0.01059722900390625, 0.014024734497070312, 0.017452239990234375, 0.020879745483398438, 0.0243072509765625, 0.027734756469726562, 0.031162261962890625, 0.03458976745605469, 0.03801727294921875, 0.04144477844238281, 0.044872283935546875, 0.04829978942871094, 0.051727294921875, 0.05515480041503906, 0.058582305908203125, 0.06200981140136719, 0.06543731689453125, 0.06886482238769531, 0.07229232788085938, 0.07571983337402344, 0.0791473388671875, 0.08257484436035156, 0.08600234985351562, 0.08942985534667969, 0.09285736083984375, 0.09628486633300781, 0.09971237182617188, 0.10313987731933594, 0.1065673828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 9.0, 9.0, 13.0, 6.0, 10.0, 14.0, 13.0, 35.0, 59.0, 99.0, 166.0, 169.0, 147.0, 93.0, 40.0, 22.0, 24.0, 11.0, 11.0, 9.0, 3.0, 10.0, 3.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4465065002441406e-05, -4.312396049499512e-05, -4.178285598754883e-05, -4.044175148010254e-05, -3.910064697265625e-05, -3.775954246520996e-05, -3.641843795776367e-05, -3.507733345031738e-05, -3.3736228942871094e-05, -3.2395124435424805e-05, -3.1054019927978516e-05, -2.9712915420532227e-05, -2.8371810913085938e-05, -2.703070640563965e-05, -2.568960189819336e-05, -2.434849739074707e-05, -2.300739288330078e-05, -2.1666288375854492e-05, -2.0325183868408203e-05, -1.8984079360961914e-05, -1.7642974853515625e-05, -1.6301870346069336e-05, -1.4960765838623047e-05, -1.3619661331176758e-05, -1.2278556823730469e-05, -1.093745231628418e-05, -9.59634780883789e-06, -8.255243301391602e-06, -6.9141387939453125e-06, -5.5730342864990234e-06, -4.231929779052734e-06, -2.8908252716064453e-06, -1.5497207641601562e-06, -2.086162567138672e-07, 1.1324882507324219e-06, 2.473592758178711e-06, 3.814697265625e-06, 5.155801773071289e-06, 6.496906280517578e-06, 7.838010787963867e-06, 9.179115295410156e-06, 1.0520219802856445e-05, 1.1861324310302734e-05, 1.3202428817749023e-05, 1.4543533325195312e-05, 1.58846378326416e-05, 1.722574234008789e-05, 1.856684684753418e-05, 1.990795135498047e-05, 2.1249055862426758e-05, 2.2590160369873047e-05, 2.3931264877319336e-05, 2.5272369384765625e-05, 2.6613473892211914e-05, 2.7954578399658203e-05, 2.9295682907104492e-05, 3.063678741455078e-05, 3.197789192199707e-05, 3.331899642944336e-05, 3.466010093688965e-05, 3.600120544433594e-05, 3.7342309951782227e-05, 3.8683414459228516e-05, 4.0024518966674805e-05, 4.1365623474121094e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 4.0, 1.0, 4.0, 11.0, 8.0, 21.0, 32.0, 36.0, 41.0, 75.0, 101.0, 169.0, 292.0, 527.0, 1172.0, 2630.0, 6586.0, 18634.0, 57141.0, 252575.0, 535055.0, 119442.0, 34047.0, 11840.0, 4478.0, 1780.0, 777.0, 416.0, 225.0, 136.0, 85.0, 54.0, 44.0, 21.0, 23.0, 15.0, 12.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11431884765625, -0.1102762222290039, -0.10623359680175781, -0.10219097137451172, -0.09814834594726562, -0.09410572052001953, -0.09006309509277344, -0.08602046966552734, -0.08197784423828125, -0.07793521881103516, -0.07389259338378906, -0.06984996795654297, -0.06580734252929688, -0.06176471710205078, -0.05772209167480469, -0.053679466247558594, -0.0496368408203125, -0.045594215393066406, -0.04155158996582031, -0.03750896453857422, -0.033466339111328125, -0.02942371368408203, -0.025381088256835938, -0.021338462829589844, -0.01729583740234375, -0.013253211975097656, -0.009210586547851562, -0.005167961120605469, -0.001125335693359375, 0.0029172897338867188, 0.0069599151611328125, 0.011002540588378906, 0.015045166015625, 0.019087791442871094, 0.023130416870117188, 0.02717304229736328, 0.031215667724609375, 0.03525829315185547, 0.03930091857910156, 0.043343544006347656, 0.04738616943359375, 0.051428794860839844, 0.05547142028808594, 0.05951404571533203, 0.06355667114257812, 0.06759929656982422, 0.07164192199707031, 0.0756845474243164, 0.0797271728515625, 0.0837697982788086, 0.08781242370605469, 0.09185504913330078, 0.09589767456054688, 0.09994029998779297, 0.10398292541503906, 0.10802555084228516, 0.11206817626953125, 0.11611080169677734, 0.12015342712402344, 0.12419605255126953, 0.12823867797851562, 0.13228130340576172, 0.1363239288330078, 0.1403665542602539, 0.1444091796875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 8.0, 9.0, 10.0, 13.0, 12.0, 14.0, 24.0, 41.0, 35.0, 59.0, 66.0, 117.0, 100.0, 104.0, 75.0, 69.0, 47.0, 33.0, 32.0, 19.0, 19.0, 19.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.12890625, -0.1253948211669922, -0.12188339233398438, -0.11837196350097656, -0.11486053466796875, -0.11134910583496094, -0.10783767700195312, -0.10432624816894531, -0.1008148193359375, -0.09730339050292969, -0.09379196166992188, -0.09028053283691406, -0.08676910400390625, -0.08325767517089844, -0.07974624633789062, -0.07623481750488281, -0.072723388671875, -0.06921195983886719, -0.06570053100585938, -0.06218910217285156, -0.05867767333984375, -0.05516624450683594, -0.051654815673828125, -0.04814338684082031, -0.0446319580078125, -0.04112052917480469, -0.037609100341796875, -0.03409767150878906, -0.03058624267578125, -0.027074813842773438, -0.023563385009765625, -0.020051956176757812, -0.01654052734375, -0.013029098510742188, -0.009517669677734375, -0.0060062408447265625, -0.00249481201171875, 0.0010166168212890625, 0.004528045654296875, 0.008039474487304688, 0.0115509033203125, 0.015062332153320312, 0.018573760986328125, 0.022085189819335938, 0.02559661865234375, 0.029108047485351562, 0.032619476318359375, 0.03613090515136719, 0.039642333984375, 0.04315376281738281, 0.046665191650390625, 0.05017662048339844, 0.05368804931640625, 0.05719947814941406, 0.060710906982421875, 0.06422233581542969, 0.0677337646484375, 0.07124519348144531, 0.07475662231445312, 0.07826805114746094, 0.08177947998046875, 0.08529090881347656, 0.08880233764648438, 0.09231376647949219, 0.0958251953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 10.0, 26.0, 45.0, 156.0, 244.0, 235.0, 165.0, 73.0, 29.0, 17.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6752575635910034, -1.5874508619308472, -1.499644160270691, -1.4118373394012451, -1.3240306377410889, -1.2362239360809326, -1.1484172344207764, -1.0606105327606201, -0.9728037714958191, -0.8849970698356628, -0.7971903085708618, -0.7093836069107056, -0.6215769052505493, -0.5337701439857483, -0.44596344232559204, -0.358156681060791, -0.27034997940063477, -0.18254324793815613, -0.09473653137683868, -0.00692981481552124, 0.0808769166469574, 0.16868364810943604, 0.2564903497695923, 0.3442971110343933, 0.43210381269454956, 0.5199105143547058, 0.6077172756195068, 0.6955239772796631, 0.7833306789398193, 0.8711374402046204, 0.9589441418647766, 1.0467509031295776, 1.1345574855804443, 1.2223641872406006, 1.3101708889007568, 1.397977590560913, 1.4857844114303589, 1.5735911130905151, 1.6613978147506714, 1.7492046356201172, 1.8370113372802734, 1.9248180389404297, 2.012624740600586, 2.100431442260742, 2.1882381439208984, 2.2760448455810547, 2.363851547241211, 2.4516584873199463, 2.5394649505615234, 2.6272716522216797, 2.715078353881836, 2.802885055541992, 2.8906917572021484, 2.9784984588623047, 3.066305160522461, 3.1541121006011963, 3.2419188022613525, 3.329725503921509, 3.417532205581665, 3.5053389072418213, 3.5931456089019775, 3.680952548980713, 3.768759250640869, 3.8565659523010254, 3.9443726539611816]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 4.0, 5.0, 5.0, 11.0, 14.0, 15.0, 11.0, 12.0, 24.0, 23.0, 26.0, 17.0, 20.0, 19.0, 24.0, 25.0, 31.0, 33.0, 36.0, 32.0, 35.0, 32.0, 32.0, 39.0, 36.0, 44.0, 36.0, 33.0, 36.0, 35.0, 35.0, 17.0, 27.0, 26.0, 25.0, 16.0, 12.0, 16.0, 14.0, 7.0, 12.0, 9.0, 5.0, 10.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8007941842079163, -0.7739497423171997, -0.7471053600311279, -0.7202609181404114, -0.6934165358543396, -0.666572093963623, -0.6397277116775513, -0.6128832697868347, -0.5860388278961182, -0.5591943860054016, -0.5323500037193298, -0.5055055618286133, -0.4786611497402191, -0.45181673765182495, -0.4249723255634308, -0.3981279134750366, -0.37128350138664246, -0.3444390892982483, -0.3175946772098541, -0.29075026512145996, -0.2639058232307434, -0.23706141114234924, -0.21021699905395508, -0.18337257206439972, -0.15652815997600555, -0.1296837478876114, -0.10283932089805603, -0.07599490880966187, -0.0491504892706871, -0.02230606973171234, 0.004538342356681824, 0.03138276934623718, 0.05822718143463135, 0.08507160097360611, 0.11191602051258087, 0.13876043260097504, 0.1656048595905304, 0.19244927167892456, 0.21929368376731873, 0.24613811075687408, 0.27298253774642944, 0.2998269498348236, 0.3266713619232178, 0.3535158038139343, 0.3803602159023285, 0.40720462799072266, 0.4340490400791168, 0.460893452167511, 0.48773786425590515, 0.5145822763442993, 0.5414267182350159, 0.5682711005210876, 0.5951155424118042, 0.621959924697876, 0.6488043665885925, 0.6756488084793091, 0.7024931907653809, 0.7293376326560974, 0.7561820149421692, 0.7830264568328857, 0.8098708391189575, 0.8367152810096741, 0.8635597229003906, 0.8904041051864624, 0.917248547077179]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 13.0, 17.0, 43.0, 60.0, 79.0, 128.0, 194.0, 312.0, 485.0, 818.0, 1337.0, 2256.0, 3819.0, 6274.0, 11234.0, 19346.0, 36603.0, 75237.0, 175419.0, 442765.0, 947290.0, 1184147.0, 725107.0, 311648.0, 128693.0, 56204.0, 28167.0, 15239.0, 8610.0, 5017.0, 2988.0, 1845.0, 1085.0, 615.0, 415.0, 244.0, 188.0, 110.0, 74.0, 49.0, 43.0, 15.0, 12.0, 14.0, 9.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.12744140625, -0.12372589111328125, -0.1200103759765625, -0.11629486083984375, -0.112579345703125, -0.10886383056640625, -0.1051483154296875, -0.10143280029296875, -0.09771728515625, -0.09400177001953125, -0.0902862548828125, -0.08657073974609375, -0.082855224609375, -0.07913970947265625, -0.0754241943359375, -0.07170867919921875, -0.0679931640625, -0.06427764892578125, -0.0605621337890625, -0.05684661865234375, -0.053131103515625, -0.04941558837890625, -0.0457000732421875, -0.04198455810546875, -0.03826904296875, -0.03455352783203125, -0.0308380126953125, -0.02712249755859375, -0.023406982421875, -0.01969146728515625, -0.0159759521484375, -0.01226043701171875, -0.008544921875, -0.00482940673828125, -0.0011138916015625, 0.00260162353515625, 0.006317138671875, 0.01003265380859375, 0.0137481689453125, 0.01746368408203125, 0.02117919921875, 0.02489471435546875, 0.0286102294921875, 0.03232574462890625, 0.036041259765625, 0.03975677490234375, 0.0434722900390625, 0.04718780517578125, 0.0509033203125, 0.05461883544921875, 0.0583343505859375, 0.06204986572265625, 0.065765380859375, 0.06948089599609375, 0.0731964111328125, 0.07691192626953125, 0.08062744140625, 0.08434295654296875, 0.0880584716796875, 0.09177398681640625, 0.095489501953125, 0.09920501708984375, 0.1029205322265625, 0.10663604736328125, 0.1103515625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 4.0, 8.0, 4.0, 8.0, 8.0, 8.0, 9.0, 14.0, 18.0, 17.0, 25.0, 22.0, 29.0, 37.0, 37.0, 41.0, 34.0, 47.0, 34.0, 47.0, 35.0, 32.0, 49.0, 45.0, 48.0, 29.0, 41.0, 24.0, 39.0, 30.0, 28.0, 36.0, 19.0, 24.0, 12.0, 15.0, 6.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.1341114044189453, -0.12967300415039062, -0.12523460388183594, -0.12079620361328125, -0.11635780334472656, -0.11191940307617188, -0.10748100280761719, -0.1030426025390625, -0.09860420227050781, -0.09416580200195312, -0.08972740173339844, -0.08528900146484375, -0.08085060119628906, -0.07641220092773438, -0.07197380065917969, -0.067535400390625, -0.06309700012207031, -0.058658599853515625, -0.05422019958496094, -0.04978179931640625, -0.04534339904785156, -0.040904998779296875, -0.03646659851074219, -0.0320281982421875, -0.027589797973632812, -0.023151397705078125, -0.018712997436523438, -0.01427459716796875, -0.009836196899414062, -0.005397796630859375, -0.0009593963623046875, 0.00347900390625, 0.007917404174804688, 0.012355804443359375, 0.016794204711914062, 0.02123260498046875, 0.025671005249023438, 0.030109405517578125, 0.03454780578613281, 0.0389862060546875, 0.04342460632324219, 0.047863006591796875, 0.05230140686035156, 0.05673980712890625, 0.06117820739746094, 0.06561660766601562, 0.07005500793457031, 0.074493408203125, 0.07893180847167969, 0.08337020874023438, 0.08780860900878906, 0.09224700927734375, 0.09668540954589844, 0.10112380981445312, 0.10556221008300781, 0.1100006103515625, 0.11443901062011719, 0.11887741088867188, 0.12331581115722656, 0.12775421142578125, 0.13219261169433594, 0.13663101196289062, 0.1410694122314453, 0.1455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 17.0, 15.0, 21.0, 49.0, 60.0, 86.0, 143.0, 233.0, 409.0, 734.0, 1340.0, 3052.0, 7744.0, 26866.0, 120595.0, 814890.0, 2713610.0, 403236.0, 73303.0, 17461.0, 5562.0, 2269.0, 1037.0, 600.0, 341.0, 173.0, 141.0, 81.0, 56.0, 46.0, 27.0, 21.0, 13.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.347412109375, -0.336669921875, -0.325927734375, -0.315185546875, -0.304443359375, -0.293701171875, -0.282958984375, -0.272216796875, -0.261474609375, -0.250732421875, -0.239990234375, -0.229248046875, -0.218505859375, -0.207763671875, -0.197021484375, -0.186279296875, -0.175537109375, -0.164794921875, -0.154052734375, -0.143310546875, -0.132568359375, -0.121826171875, -0.111083984375, -0.100341796875, -0.089599609375, -0.078857421875, -0.068115234375, -0.057373046875, -0.046630859375, -0.035888671875, -0.025146484375, -0.014404296875, -0.003662109375, 0.007080078125, 0.017822265625, 0.028564453125, 0.039306640625, 0.050048828125, 0.060791015625, 0.071533203125, 0.082275390625, 0.093017578125, 0.103759765625, 0.114501953125, 0.125244140625, 0.135986328125, 0.146728515625, 0.157470703125, 0.168212890625, 0.178955078125, 0.189697265625, 0.200439453125, 0.211181640625, 0.221923828125, 0.232666015625, 0.243408203125, 0.254150390625, 0.264892578125, 0.275634765625, 0.286376953125, 0.297119140625, 0.307861328125, 0.318603515625, 0.329345703125, 0.340087890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 10.0, 9.0, 10.0, 13.0, 26.0, 22.0, 38.0, 54.0, 90.0, 115.0, 177.0, 288.0, 473.0, 605.0, 655.0, 535.0, 325.0, 195.0, 118.0, 80.0, 71.0, 45.0, 31.0, 25.0, 15.0, 7.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34423828125, -0.3331756591796875, -0.322113037109375, -0.3110504150390625, -0.29998779296875, -0.2889251708984375, -0.277862548828125, -0.2667999267578125, -0.2557373046875, -0.2446746826171875, -0.233612060546875, -0.2225494384765625, -0.21148681640625, -0.2004241943359375, -0.189361572265625, -0.1782989501953125, -0.167236328125, -0.1561737060546875, -0.145111083984375, -0.1340484619140625, -0.12298583984375, -0.1119232177734375, -0.100860595703125, -0.0897979736328125, -0.0787353515625, -0.0676727294921875, -0.056610107421875, -0.0455474853515625, -0.03448486328125, -0.0234222412109375, -0.012359619140625, -0.0012969970703125, 0.009765625, 0.0208282470703125, 0.031890869140625, 0.0429534912109375, 0.05401611328125, 0.0650787353515625, 0.076141357421875, 0.0872039794921875, 0.0982666015625, 0.1093292236328125, 0.120391845703125, 0.1314544677734375, 0.14251708984375, 0.1535797119140625, 0.164642333984375, 0.1757049560546875, 0.186767578125, 0.1978302001953125, 0.208892822265625, 0.2199554443359375, 0.23101806640625, 0.2420806884765625, 0.253143310546875, 0.2642059326171875, 0.2752685546875, 0.2863311767578125, 0.297393798828125, 0.3084564208984375, 0.31951904296875, 0.3305816650390625, 0.341644287109375, 0.3527069091796875, 0.36376953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 11.0, 29.0, 60.0, 119.0, 163.0, 193.0, 166.0, 125.0, 66.0, 30.0, 17.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3422539234161377, -2.260669708251953, -2.1790857315063477, -2.097501516342163, -2.0159173011779785, -1.934333086013794, -1.852748990058899, -1.771164894104004, -1.6895806789398193, -1.6079964637756348, -1.5264123678207397, -1.4448282718658447, -1.3632440567016602, -1.2816598415374756, -1.2000757455825806, -1.1184916496276855, -1.036907434463501, -0.9553232789039612, -0.8737391233444214, -0.7921549677848816, -0.7105708122253418, -0.628986656665802, -0.5474025011062622, -0.4658183455467224, -0.3842341899871826, -0.3026500344276428, -0.22106587886810303, -0.13948172330856323, -0.05789756774902344, 0.023686587810516357, 0.10527074337005615, 0.18685489892959595, 0.26843881607055664, 0.35002297163009644, 0.43160712718963623, 0.513191282749176, 0.5947754383087158, 0.6763595938682556, 0.7579437494277954, 0.8395279049873352, 0.921112060546875, 1.0026962757110596, 1.0842803716659546, 1.1658644676208496, 1.2474486827850342, 1.3290328979492188, 1.4106169939041138, 1.4922010898590088, 1.5737853050231934, 1.655369520187378, 1.736953616142273, 1.818537712097168, 1.9001219272613525, 1.981706142425537, 2.0632901191711426, 2.144874334335327, 2.2264585494995117, 2.3080427646636963, 2.389626979827881, 2.4712109565734863, 2.552795171737671, 2.6343793869018555, 2.715963363647461, 2.7975475788116455, 2.87913179397583]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 14.0, 21.0, 23.0, 30.0, 24.0, 35.0, 44.0, 44.0, 37.0, 47.0, 39.0, 38.0, 49.0, 35.0, 49.0, 33.0, 34.0, 40.0, 47.0, 37.0, 30.0, 32.0, 21.0, 17.0, 18.0, 15.0, 18.0, 8.0, 18.0, 8.0, 12.0, 7.0, 5.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0403649806976318, -1.0091209411621094, -0.9778769612312317, -0.9466329216957092, -0.9153889417648315, -0.8841449022293091, -0.8529008626937866, -0.8216568827629089, -0.7904129028320312, -0.7591688632965088, -0.7279248833656311, -0.6966808438301086, -0.665436863899231, -0.6341928243637085, -0.602948784828186, -0.5717048048973083, -0.5404607653617859, -0.5092167258262634, -0.47797274589538574, -0.4467287063598633, -0.4154847264289856, -0.38424068689346313, -0.35299667716026306, -0.321752667427063, -0.2905086576938629, -0.25926464796066284, -0.22802063822746277, -0.1967766135931015, -0.16553260385990143, -0.13428859412670135, -0.10304456949234009, -0.07180055975914001, -0.04055660963058472, -0.009312596172094345, 0.021931417286396027, 0.0531754344701767, 0.08441944420337677, 0.11566345393657684, 0.1469074785709381, 0.17815148830413818, 0.20939549803733826, 0.24063950777053833, 0.2718835175037384, 0.3031275272369385, 0.33437156677246094, 0.3656155467033386, 0.3968595862388611, 0.42810359597206116, 0.45934760570526123, 0.4905916154384613, 0.5218356251716614, 0.5530796647071838, 0.5843236446380615, 0.615567684173584, 0.6468117237091064, 0.6780557036399841, 0.7092996835708618, 0.7405437231063843, 0.771787703037262, 0.8030317425727844, 0.8342757225036621, 0.8655197620391846, 0.896763801574707, 0.9280077815055847, 0.9592518210411072]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 7.0, 14.0, 18.0, 26.0, 43.0, 62.0, 75.0, 105.0, 221.0, 336.0, 574.0, 977.0, 1807.0, 3274.0, 6114.0, 11041.0, 20037.0, 37704.0, 77175.0, 184161.0, 333394.0, 200348.0, 83168.0, 40160.0, 21270.0, 11903.0, 6564.0, 3399.0, 1974.0, 1021.0, 621.0, 336.0, 229.0, 136.0, 86.0, 45.0, 32.0, 26.0, 19.0, 12.0, 12.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.2036285400390625, -0.197174072265625, -0.1907196044921875, -0.18426513671875, -0.1778106689453125, -0.171356201171875, -0.1649017333984375, -0.158447265625, -0.1519927978515625, -0.145538330078125, -0.1390838623046875, -0.13262939453125, -0.1261749267578125, -0.119720458984375, -0.1132659912109375, -0.1068115234375, -0.1003570556640625, -0.093902587890625, -0.0874481201171875, -0.08099365234375, -0.0745391845703125, -0.068084716796875, -0.0616302490234375, -0.05517578125, -0.0487213134765625, -0.042266845703125, -0.0358123779296875, -0.02935791015625, -0.0229034423828125, -0.016448974609375, -0.0099945068359375, -0.0035400390625, 0.0029144287109375, 0.009368896484375, 0.0158233642578125, 0.02227783203125, 0.0287322998046875, 0.035186767578125, 0.0416412353515625, 0.048095703125, 0.0545501708984375, 0.061004638671875, 0.0674591064453125, 0.07391357421875, 0.0803680419921875, 0.086822509765625, 0.0932769775390625, 0.0997314453125, 0.1061859130859375, 0.112640380859375, 0.1190948486328125, 0.12554931640625, 0.1320037841796875, 0.138458251953125, 0.1449127197265625, 0.1513671875, 0.1578216552734375, 0.164276123046875, 0.1707305908203125, 0.17718505859375, 0.1836395263671875, 0.190093994140625, 0.1965484619140625, 0.2030029296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 8.0, 10.0, 7.0, 16.0, 15.0, 20.0, 16.0, 21.0, 23.0, 22.0, 27.0, 45.0, 38.0, 35.0, 42.0, 53.0, 31.0, 43.0, 54.0, 45.0, 30.0, 59.0, 23.0, 42.0, 23.0, 33.0, 25.0, 33.0, 27.0, 27.0, 18.0, 11.0, 22.0, 11.0, 12.0, 7.0, 4.0, 5.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1466064453125, -0.14177894592285156, -0.13695144653320312, -0.1321239471435547, -0.12729644775390625, -0.12246894836425781, -0.11764144897460938, -0.11281394958496094, -0.1079864501953125, -0.10315895080566406, -0.09833145141601562, -0.09350395202636719, -0.08867645263671875, -0.08384895324707031, -0.07902145385742188, -0.07419395446777344, -0.069366455078125, -0.06453895568847656, -0.059711456298828125, -0.05488395690917969, -0.05005645751953125, -0.04522895812988281, -0.040401458740234375, -0.03557395935058594, -0.0307464599609375, -0.025918960571289062, -0.021091461181640625, -0.016263961791992188, -0.01143646240234375, -0.0066089630126953125, -0.001781463623046875, 0.0030460357666015625, 0.00787353515625, 0.012701034545898438, 0.017528533935546875, 0.022356033325195312, 0.02718353271484375, 0.03201103210449219, 0.036838531494140625, 0.04166603088378906, 0.0464935302734375, 0.05132102966308594, 0.056148529052734375, 0.06097602844238281, 0.06580352783203125, 0.07063102722167969, 0.07545852661132812, 0.08028602600097656, 0.085113525390625, 0.08994102478027344, 0.09476852416992188, 0.09959602355957031, 0.10442352294921875, 0.10925102233886719, 0.11407852172851562, 0.11890602111816406, 0.1237335205078125, 0.12856101989746094, 0.13338851928710938, 0.1382160186767578, 0.14304351806640625, 0.1478710174560547, 0.15269851684570312, 0.15752601623535156, 0.162353515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 8.0, 17.0, 27.0, 34.0, 47.0, 83.0, 153.0, 277.0, 597.0, 1437.0, 4431.0, 17406.0, 101722.0, 677563.0, 204695.0, 29857.0, 6522.0, 1992.0, 840.0, 360.0, 172.0, 89.0, 64.0, 37.0, 27.0, 15.0, 14.0, 11.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.61053466796875, -0.5892333984375, -0.56793212890625, -0.546630859375, -0.52532958984375, -0.5040283203125, -0.48272705078125, -0.46142578125, -0.44012451171875, -0.4188232421875, -0.39752197265625, -0.376220703125, -0.35491943359375, -0.3336181640625, -0.31231689453125, -0.291015625, -0.26971435546875, -0.2484130859375, -0.22711181640625, -0.205810546875, -0.18450927734375, -0.1632080078125, -0.14190673828125, -0.12060546875, -0.09930419921875, -0.0780029296875, -0.05670166015625, -0.035400390625, -0.01409912109375, 0.0072021484375, 0.02850341796875, 0.0498046875, 0.07110595703125, 0.0924072265625, 0.11370849609375, 0.135009765625, 0.15631103515625, 0.1776123046875, 0.19891357421875, 0.22021484375, 0.24151611328125, 0.2628173828125, 0.28411865234375, 0.305419921875, 0.32672119140625, 0.3480224609375, 0.36932373046875, 0.390625, 0.41192626953125, 0.4332275390625, 0.45452880859375, 0.475830078125, 0.49713134765625, 0.5184326171875, 0.53973388671875, 0.56103515625, 0.58233642578125, 0.6036376953125, 0.62493896484375, 0.646240234375, 0.66754150390625, 0.6888427734375, 0.71014404296875, 0.7314453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 15.0, 16.0, 15.0, 16.0, 19.0, 33.0, 38.0, 33.0, 44.0, 47.0, 59.0, 58.0, 58.0, 44.0, 54.0, 58.0, 45.0, 54.0, 46.0, 40.0, 36.0, 31.0, 26.0, 21.0, 16.0, 15.0, 17.0, 5.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5361328125, -0.5160064697265625, -0.495880126953125, -0.4757537841796875, -0.45562744140625, -0.4355010986328125, -0.415374755859375, -0.3952484130859375, -0.3751220703125, -0.3549957275390625, -0.334869384765625, -0.3147430419921875, -0.29461669921875, -0.2744903564453125, -0.254364013671875, -0.2342376708984375, -0.214111328125, -0.1939849853515625, -0.173858642578125, -0.1537322998046875, -0.13360595703125, -0.1134796142578125, -0.093353271484375, -0.0732269287109375, -0.0531005859375, -0.0329742431640625, -0.012847900390625, 0.0072784423828125, 0.02740478515625, 0.0475311279296875, 0.067657470703125, 0.0877838134765625, 0.10791015625, 0.1280364990234375, 0.148162841796875, 0.1682891845703125, 0.18841552734375, 0.2085418701171875, 0.228668212890625, 0.2487945556640625, 0.2689208984375, 0.2890472412109375, 0.309173583984375, 0.3292999267578125, 0.34942626953125, 0.3695526123046875, 0.389678955078125, 0.4098052978515625, 0.429931640625, 0.4500579833984375, 0.470184326171875, 0.4903106689453125, 0.51043701171875, 0.5305633544921875, 0.550689697265625, 0.5708160400390625, 0.5909423828125, 0.6110687255859375, 0.631195068359375, 0.6513214111328125, 0.67144775390625, 0.6915740966796875, 0.711700439453125, 0.7318267822265625, 0.751953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 6.0, 6.0, 12.0, 19.0, 29.0, 48.0, 60.0, 110.0, 183.0, 268.0, 403.0, 706.0, 1165.0, 2083.0, 3352.0, 5864.0, 10451.0, 19718.0, 40255.0, 96768.0, 246247.0, 332070.0, 163093.0, 63164.0, 28482.0, 14680.0, 8068.0, 4492.0, 2675.0, 1596.0, 986.0, 544.0, 363.0, 196.0, 129.0, 88.0, 59.0, 38.0, 28.0, 22.0, 11.0, 6.0, 5.0, 4.0, 2.0, 6.0, 1.0, 4.0], "bins": [-0.093017578125, -0.09052181243896484, -0.08802604675292969, -0.08553028106689453, -0.08303451538085938, -0.08053874969482422, -0.07804298400878906, -0.0755472183227539, -0.07305145263671875, -0.0705556869506836, -0.06805992126464844, -0.06556415557861328, -0.06306838989257812, -0.06057262420654297, -0.05807685852050781, -0.055581092834472656, -0.0530853271484375, -0.050589561462402344, -0.04809379577636719, -0.04559803009033203, -0.043102264404296875, -0.04060649871826172, -0.03811073303222656, -0.035614967346191406, -0.03311920166015625, -0.030623435974121094, -0.028127670288085938, -0.02563190460205078, -0.023136138916015625, -0.02064037322998047, -0.018144607543945312, -0.015648841857910156, -0.013153076171875, -0.010657310485839844, -0.008161544799804688, -0.005665779113769531, -0.003170013427734375, -0.0006742477416992188, 0.0018215179443359375, 0.004317283630371094, 0.00681304931640625, 0.009308815002441406, 0.011804580688476562, 0.014300346374511719, 0.016796112060546875, 0.01929187774658203, 0.021787643432617188, 0.024283409118652344, 0.0267791748046875, 0.029274940490722656, 0.03177070617675781, 0.03426647186279297, 0.036762237548828125, 0.03925800323486328, 0.04175376892089844, 0.044249534606933594, 0.04674530029296875, 0.049241065979003906, 0.05173683166503906, 0.05423259735107422, 0.056728363037109375, 0.05922412872314453, 0.06171989440917969, 0.06421566009521484, 0.06671142578125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 6.0, 5.0, 11.0, 11.0, 9.0, 21.0, 12.0, 31.0, 27.0, 38.0, 66.0, 93.0, 96.0, 111.0, 87.0, 93.0, 69.0, 49.0, 39.0, 30.0, 23.0, 7.0, 9.0, 13.0, 5.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.8683414459228516e-05, -3.763008862733841e-05, -3.65767627954483e-05, -3.55234369635582e-05, -3.447011113166809e-05, -3.3416785299777985e-05, -3.236345946788788e-05, -3.131013363599777e-05, -3.0256807804107666e-05, -2.920348197221756e-05, -2.8150156140327454e-05, -2.7096830308437347e-05, -2.604350447654724e-05, -2.4990178644657135e-05, -2.393685281276703e-05, -2.2883526980876923e-05, -2.1830201148986816e-05, -2.077687531709671e-05, -1.9723549485206604e-05, -1.8670223653316498e-05, -1.761689782142639e-05, -1.6563571989536285e-05, -1.551024615764618e-05, -1.4456920325756073e-05, -1.3403594493865967e-05, -1.235026866197586e-05, -1.1296942830085754e-05, -1.0243616998195648e-05, -9.190291166305542e-06, -8.136965334415436e-06, -7.08363950252533e-06, -6.030313670635223e-06, -4.976987838745117e-06, -3.923662006855011e-06, -2.8703361749649048e-06, -1.8170103430747986e-06, -7.636845111846924e-07, 2.896413207054138e-07, 1.34296715259552e-06, 2.3962929844856262e-06, 3.4496188163757324e-06, 4.502944648265839e-06, 5.556270480155945e-06, 6.609596312046051e-06, 7.662922143936157e-06, 8.716247975826263e-06, 9.76957380771637e-06, 1.0822899639606476e-05, 1.1876225471496582e-05, 1.2929551303386688e-05, 1.3982877135276794e-05, 1.50362029671669e-05, 1.6089528799057007e-05, 1.7142854630947113e-05, 1.819618046283722e-05, 1.9249506294727325e-05, 2.030283212661743e-05, 2.1356157958507538e-05, 2.2409483790397644e-05, 2.346280962228775e-05, 2.4516135454177856e-05, 2.5569461286067963e-05, 2.662278711795807e-05, 2.7676112949848175e-05, 2.872943878173828e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 8.0, 9.0, 8.0, 11.0, 19.0, 32.0, 39.0, 48.0, 88.0, 133.0, 214.0, 370.0, 720.0, 1569.0, 3794.0, 10187.0, 29642.0, 99862.0, 334171.0, 384195.0, 126545.0, 36392.0, 12238.0, 4485.0, 1855.0, 811.0, 433.0, 246.0, 143.0, 86.0, 63.0, 43.0, 19.0, 22.0, 17.0, 13.0, 6.0, 9.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12224864959716797, -0.11876487731933594, -0.1152811050415039, -0.11179733276367188, -0.10831356048583984, -0.10482978820800781, -0.10134601593017578, -0.09786224365234375, -0.09437847137451172, -0.09089469909667969, -0.08741092681884766, -0.08392715454101562, -0.0804433822631836, -0.07695960998535156, -0.07347583770751953, -0.0699920654296875, -0.06650829315185547, -0.06302452087402344, -0.059540748596191406, -0.056056976318359375, -0.052573204040527344, -0.04908943176269531, -0.04560565948486328, -0.04212188720703125, -0.03863811492919922, -0.03515434265136719, -0.031670570373535156, -0.028186798095703125, -0.024703025817871094, -0.021219253540039062, -0.01773548126220703, -0.014251708984375, -0.010767936706542969, -0.0072841644287109375, -0.0038003921508789062, -0.000316619873046875, 0.0031671524047851562, 0.0066509246826171875, 0.010134696960449219, 0.01361846923828125, 0.01710224151611328, 0.020586013793945312, 0.024069786071777344, 0.027553558349609375, 0.031037330627441406, 0.03452110290527344, 0.03800487518310547, 0.0414886474609375, 0.04497241973876953, 0.04845619201660156, 0.051939964294433594, 0.055423736572265625, 0.058907508850097656, 0.06239128112792969, 0.06587505340576172, 0.06935882568359375, 0.07284259796142578, 0.07632637023925781, 0.07981014251708984, 0.08329391479492188, 0.0867776870727539, 0.09026145935058594, 0.09374523162841797, 0.09722900390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 9.0, 5.0, 9.0, 7.0, 12.0, 14.0, 24.0, 23.0, 24.0, 30.0, 45.0, 46.0, 52.0, 75.0, 73.0, 74.0, 69.0, 62.0, 67.0, 70.0, 43.0, 46.0, 28.0, 18.0, 15.0, 15.0, 11.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1114501953125, -0.10842418670654297, -0.10539817810058594, -0.1023721694946289, -0.09934616088867188, -0.09632015228271484, -0.09329414367675781, -0.09026813507080078, -0.08724212646484375, -0.08421611785888672, -0.08119010925292969, -0.07816410064697266, -0.07513809204101562, -0.0721120834350586, -0.06908607482910156, -0.06606006622314453, -0.0630340576171875, -0.06000804901123047, -0.05698204040527344, -0.053956031799316406, -0.050930023193359375, -0.047904014587402344, -0.04487800598144531, -0.04185199737548828, -0.03882598876953125, -0.03579998016357422, -0.03277397155761719, -0.029747962951660156, -0.026721954345703125, -0.023695945739746094, -0.020669937133789062, -0.01764392852783203, -0.014617919921875, -0.011591911315917969, -0.008565902709960938, -0.005539894104003906, -0.002513885498046875, 0.0005121231079101562, 0.0035381317138671875, 0.006564140319824219, 0.00959014892578125, 0.012616157531738281, 0.015642166137695312, 0.018668174743652344, 0.021694183349609375, 0.024720191955566406, 0.027746200561523438, 0.03077220916748047, 0.0337982177734375, 0.03682422637939453, 0.03985023498535156, 0.042876243591308594, 0.045902252197265625, 0.048928260803222656, 0.05195426940917969, 0.05498027801513672, 0.05800628662109375, 0.06103229522705078, 0.06405830383300781, 0.06708431243896484, 0.07011032104492188, 0.0731363296508789, 0.07616233825683594, 0.07918834686279297, 0.08221435546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 32.0, 50.0, 79.0, 128.0, 150.0, 172.0, 139.0, 94.0, 64.0, 33.0, 13.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.387167453765869, -2.326336622238159, -2.265505790710449, -2.2046751976013184, -2.1438443660736084, -2.0830135345458984, -2.0221829414367676, -1.9613521099090576, -1.9005212783813477, -1.8396904468536377, -1.7788597345352173, -1.7180290222167969, -1.657198190689087, -1.596367359161377, -1.5355366468429565, -1.4747059345245361, -1.4138751029968262, -1.3530442714691162, -1.2922135591506958, -1.2313828468322754, -1.1705520153045654, -1.1097211837768555, -1.048890471458435, -0.9880596995353699, -0.9272289276123047, -0.8663981556892395, -0.8055673837661743, -0.7447366118431091, -0.683905839920044, -0.6230750679969788, -0.5622442960739136, -0.5014135241508484, -0.4405827522277832, -0.379751980304718, -0.31892120838165283, -0.25809043645858765, -0.19725966453552246, -0.13642889261245728, -0.07559812068939209, -0.014767348766326904, 0.04606342315673828, 0.10689419507980347, 0.16772496700286865, 0.22855573892593384, 0.289386510848999, 0.3502172827720642, 0.4110480546951294, 0.4718788266181946, 0.5327095985412598, 0.593540370464325, 0.6543711423873901, 0.7152019143104553, 0.7760326862335205, 0.8368634581565857, 0.8976942300796509, 0.9585250020027161, 1.0193557739257812, 1.0801866054534912, 1.1410173177719116, 1.201848030090332, 1.262678861618042, 1.323509693145752, 1.3843404054641724, 1.4451711177825928, 1.5060019493103027]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 14.0, 9.0, 23.0, 19.0, 23.0, 24.0, 20.0, 22.0, 34.0, 29.0, 35.0, 50.0, 45.0, 29.0, 54.0, 40.0, 51.0, 49.0, 44.0, 38.0, 34.0, 32.0, 32.0, 40.0, 21.0, 28.0, 27.0, 18.0, 7.0, 14.0, 13.0, 12.0, 11.0, 6.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.183851718902588, -1.1449288129806519, -1.1060057878494263, -1.0670828819274902, -1.0281598567962646, -0.9892369508743286, -0.9503139853477478, -0.911391019821167, -0.8724680542945862, -0.8335450887680054, -0.7946221232414246, -0.7556991577148438, -0.7167762517929077, -0.6778532266616821, -0.6389303207397461, -0.6000073552131653, -0.5610843896865845, -0.5221614241600037, -0.48323845863342285, -0.44431552290916443, -0.4053925573825836, -0.3664695918560028, -0.3275466561317444, -0.2886236906051636, -0.24970072507858276, -0.21077775955200195, -0.17185480892658234, -0.13293185830116272, -0.09400889277458191, -0.0550859272480011, -0.016162976622581482, 0.022759974002838135, 0.061682939529418945, 0.10060589760541916, 0.13952885568141937, 0.178451806306839, 0.2173747718334198, 0.2562977373600006, 0.29522067308425903, 0.33414363861083984, 0.37306660413742065, 0.41198956966400146, 0.4509125351905823, 0.4898354709148407, 0.5287584066390991, 0.5676814317703247, 0.6066043376922607, 0.6455273032188416, 0.6844502687454224, 0.7233732342720032, 0.762296199798584, 0.8012191653251648, 0.8401421308517456, 0.8790650367736816, 0.9179880023002625, 0.9569109678268433, 0.9958339333534241, 1.0347568988800049, 1.073679804801941, 1.1126028299331665, 1.1515257358551025, 1.1904487609863281, 1.2293716669082642, 1.2682945728302002, 1.3072175979614258]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 8.0, 7.0, 8.0, 12.0, 21.0, 29.0, 45.0, 40.0, 90.0, 126.0, 227.0, 376.0, 537.0, 829.0, 1352.0, 2214.0, 3763.0, 6522.0, 11185.0, 20374.0, 40826.0, 93350.0, 230617.0, 538221.0, 1020952.0, 1086602.0, 633345.0, 282375.0, 113949.0, 49369.0, 24175.0, 13142.0, 7620.0, 4511.0, 2775.0, 1764.0, 1032.0, 702.0, 412.0, 256.0, 163.0, 113.0, 76.0, 62.0, 38.0, 24.0, 15.0, 9.0, 10.0, 8.0, 7.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12169265747070312, -0.11765289306640625, -0.11361312866210938, -0.1095733642578125, -0.10553359985351562, -0.10149383544921875, -0.09745407104492188, -0.093414306640625, -0.08937454223632812, -0.08533477783203125, -0.08129501342773438, -0.0772552490234375, -0.07321548461914062, -0.06917572021484375, -0.06513595581054688, -0.06109619140625, -0.057056427001953125, -0.05301666259765625, -0.048976898193359375, -0.0449371337890625, -0.040897369384765625, -0.03685760498046875, -0.032817840576171875, -0.028778076171875, -0.024738311767578125, -0.02069854736328125, -0.016658782958984375, -0.0126190185546875, -0.008579254150390625, -0.00453948974609375, -0.000499725341796875, 0.0035400390625, 0.007579803466796875, 0.01161956787109375, 0.015659332275390625, 0.0196990966796875, 0.023738861083984375, 0.02777862548828125, 0.031818389892578125, 0.035858154296875, 0.039897918701171875, 0.04393768310546875, 0.047977447509765625, 0.0520172119140625, 0.056056976318359375, 0.06009674072265625, 0.06413650512695312, 0.06817626953125, 0.07221603393554688, 0.07625579833984375, 0.08029556274414062, 0.0843353271484375, 0.08837509155273438, 0.09241485595703125, 0.09645462036132812, 0.100494384765625, 0.10453414916992188, 0.10857391357421875, 0.11261367797851562, 0.1166534423828125, 0.12069320678710938, 0.12473297119140625, 0.12877273559570312, 0.1328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 11.0, 6.0, 6.0, 8.0, 12.0, 18.0, 16.0, 20.0, 17.0, 19.0, 30.0, 31.0, 38.0, 27.0, 27.0, 37.0, 34.0, 39.0, 58.0, 45.0, 37.0, 43.0, 52.0, 43.0, 36.0, 37.0, 34.0, 31.0, 28.0, 21.0, 25.0, 19.0, 15.0, 19.0, 12.0, 5.0, 11.0, 8.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1676025390625, -0.16231536865234375, -0.1570281982421875, -0.15174102783203125, -0.146453857421875, -0.14116668701171875, -0.1358795166015625, -0.13059234619140625, -0.12530517578125, -0.12001800537109375, -0.1147308349609375, -0.10944366455078125, -0.104156494140625, -0.09886932373046875, -0.0935821533203125, -0.08829498291015625, -0.0830078125, -0.07772064208984375, -0.0724334716796875, -0.06714630126953125, -0.061859130859375, -0.05657196044921875, -0.0512847900390625, -0.04599761962890625, -0.04071044921875, -0.03542327880859375, -0.0301361083984375, -0.02484893798828125, -0.019561767578125, -0.01427459716796875, -0.0089874267578125, -0.00370025634765625, 0.0015869140625, 0.00687408447265625, 0.0121612548828125, 0.01744842529296875, 0.022735595703125, 0.02802276611328125, 0.0333099365234375, 0.03859710693359375, 0.04388427734375, 0.04917144775390625, 0.0544586181640625, 0.05974578857421875, 0.065032958984375, 0.07032012939453125, 0.0756072998046875, 0.08089447021484375, 0.086181640625, 0.09146881103515625, 0.0967559814453125, 0.10204315185546875, 0.107330322265625, 0.11261749267578125, 0.1179046630859375, 0.12319183349609375, 0.12847900390625, 0.13376617431640625, 0.1390533447265625, 0.14434051513671875, 0.149627685546875, 0.15491485595703125, 0.1602020263671875, 0.16548919677734375, 0.1707763671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 7.0, 16.0, 12.0, 23.0, 55.0, 75.0, 104.0, 217.0, 394.0, 747.0, 1608.0, 4259.0, 14809.0, 78936.0, 698497.0, 3026051.0, 309516.0, 43958.0, 9539.0, 2948.0, 1207.0, 571.0, 303.0, 160.0, 99.0, 54.0, 46.0, 13.0, 20.0, 14.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43896484375, -0.4244956970214844, -0.41002655029296875, -0.3955574035644531, -0.3810882568359375, -0.3666191101074219, -0.35214996337890625, -0.3376808166503906, -0.323211669921875, -0.3087425231933594, -0.29427337646484375, -0.2798042297363281, -0.2653350830078125, -0.2508659362792969, -0.23639678955078125, -0.22192764282226562, -0.20745849609375, -0.19298934936523438, -0.17852020263671875, -0.16405105590820312, -0.1495819091796875, -0.13511276245117188, -0.12064361572265625, -0.10617446899414062, -0.091705322265625, -0.07723617553710938, -0.06276702880859375, -0.048297882080078125, -0.0338287353515625, -0.019359588623046875, -0.00489044189453125, 0.009578704833984375, 0.0240478515625, 0.038516998291015625, 0.05298614501953125, 0.06745529174804688, 0.0819244384765625, 0.09639358520507812, 0.11086273193359375, 0.12533187866210938, 0.139801025390625, 0.15427017211914062, 0.16873931884765625, 0.18320846557617188, 0.1976776123046875, 0.21214675903320312, 0.22661590576171875, 0.24108505249023438, 0.25555419921875, 0.2700233459472656, 0.28449249267578125, 0.2989616394042969, 0.3134307861328125, 0.3278999328613281, 0.34236907958984375, 0.3568382263183594, 0.371307373046875, 0.3857765197753906, 0.40024566650390625, 0.4147148132324219, 0.4291839599609375, 0.4436531066894531, 0.45812225341796875, 0.4725914001464844, 0.487060546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 14.0, 21.0, 28.0, 43.0, 54.0, 86.0, 164.0, 245.0, 428.0, 811.0, 875.0, 542.0, 271.0, 173.0, 102.0, 67.0, 39.0, 16.0, 21.0, 20.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.411865234375, -0.3966941833496094, -0.38152313232421875, -0.3663520812988281, -0.3511810302734375, -0.3360099792480469, -0.32083892822265625, -0.3056678771972656, -0.290496826171875, -0.2753257751464844, -0.26015472412109375, -0.24498367309570312, -0.2298126220703125, -0.21464157104492188, -0.19947052001953125, -0.18429946899414062, -0.16912841796875, -0.15395736694335938, -0.13878631591796875, -0.12361526489257812, -0.1084442138671875, -0.09327316284179688, -0.07810211181640625, -0.06293106079101562, -0.047760009765625, -0.032588958740234375, -0.01741790771484375, -0.002246856689453125, 0.0129241943359375, 0.028095245361328125, 0.04326629638671875, 0.058437347412109375, 0.0736083984375, 0.08877944946289062, 0.10395050048828125, 0.11912155151367188, 0.1342926025390625, 0.14946365356445312, 0.16463470458984375, 0.17980575561523438, 0.194976806640625, 0.21014785766601562, 0.22531890869140625, 0.24048995971679688, 0.2556610107421875, 0.2708320617675781, 0.28600311279296875, 0.3011741638183594, 0.31634521484375, 0.3315162658691406, 0.34668731689453125, 0.3618583679199219, 0.3770294189453125, 0.3922004699707031, 0.40737152099609375, 0.4225425720214844, 0.437713623046875, 0.4528846740722656, 0.46805572509765625, 0.4832267761230469, 0.4983978271484375, 0.5135688781738281, 0.5287399291992188, 0.5439109802246094, 0.55908203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 18.0, 32.0, 78.0, 182.0, 250.0, 217.0, 132.0, 53.0, 22.0, 8.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.557363510131836, -3.442140817642212, -3.326917886734009, -3.2116951942443848, -3.0964722633361816, -2.9812495708465576, -2.8660268783569336, -2.7508039474487305, -2.6355810165405273, -2.5203583240509033, -2.4051353931427, -2.289912700653076, -2.174689769744873, -2.059467077255249, -1.9442442655563354, -1.8290214538574219, -1.7137987613677979, -1.5985759496688843, -1.4833531379699707, -1.3681304454803467, -1.2529075145721436, -1.1376848220825195, -1.022462010383606, -0.9072391986846924, -0.7920163869857788, -0.6767935752868652, -0.5615707635879517, -0.44634801149368286, -0.3311251997947693, -0.2159023880958557, -0.10067963600158691, 0.01454317569732666, 0.12976598739624023, 0.24498878419399261, 0.360211580991745, 0.4754343628883362, 0.5906571745872498, 0.7058799862861633, 0.8211027383804321, 0.9363255500793457, 1.0515483617782593, 1.1667711734771729, 1.2819939851760864, 1.397216796875, 1.512439489364624, 1.6276624202728271, 1.7428851127624512, 1.8581079244613647, 1.9733307361602783, 2.0885534286499023, 2.2037763595581055, 2.3189990520477295, 2.4342219829559326, 2.5494446754455566, 2.6646676063537598, 2.779890298843384, 2.895112991333008, 3.010335683822632, 3.125558614730835, 3.240781307220459, 3.356004238128662, 3.471226930618286, 3.58644962310791, 3.7016725540161133, 3.8168954849243164]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 7.0, 4.0, 13.0, 13.0, 17.0, 27.0, 24.0, 27.0, 32.0, 30.0, 32.0, 37.0, 49.0, 42.0, 48.0, 36.0, 36.0, 54.0, 36.0, 42.0, 47.0, 34.0, 45.0, 26.0, 30.0, 25.0, 26.0, 14.0, 24.0, 14.0, 15.0, 18.0, 9.0, 8.0, 12.0, 4.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1459629535675049, -1.1114869117736816, -1.077010989189148, -1.0425349473953247, -1.0080589056015015, -0.973582923412323, -0.9391069412231445, -0.9046308994293213, -0.870154857635498, -0.8356788754463196, -0.8012028336524963, -0.7667268514633179, -0.7322508096694946, -0.6977748274803162, -0.6632988452911377, -0.6288228034973145, -0.594346821308136, -0.5598708391189575, -0.5253947973251343, -0.4909188151359558, -0.45644277334213257, -0.4219667911529541, -0.38749077916145325, -0.3530147671699524, -0.31853875517845154, -0.2840627431869507, -0.24958673119544983, -0.21511073410511017, -0.18063472211360931, -0.14615871012210846, -0.1116827130317688, -0.07720670104026794, -0.04273068904876709, -0.008254680782556534, 0.026221327483654022, 0.06069733202457428, 0.09517334401607513, 0.129649356007576, 0.16412535309791565, 0.1986013650894165, 0.23307737708091736, 0.2675533890724182, 0.30202940106391907, 0.3365054130554199, 0.3709813952445984, 0.40545743703842163, 0.4399334192276001, 0.47440943121910095, 0.5088854432106018, 0.5433614253997803, 0.5778374671936035, 0.612313449382782, 0.6467894911766052, 0.6812654733657837, 0.7157415151596069, 0.7502174973487854, 0.7846934795379639, 0.8191694617271423, 0.8536455035209656, 0.888121485710144, 0.9225975275039673, 0.9570735096931458, 0.9915494918823242, 1.0260255336761475, 1.0605015754699707]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 12.0, 15.0, 21.0, 38.0, 55.0, 82.0, 118.0, 224.0, 377.0, 599.0, 1084.0, 1883.0, 3817.0, 7474.0, 15336.0, 32583.0, 72011.0, 151362.0, 246217.0, 241482.0, 144947.0, 68120.0, 31204.0, 14539.0, 7028.0, 3503.0, 1864.0, 1015.0, 558.0, 319.0, 209.0, 144.0, 89.0, 52.0, 41.0, 36.0, 23.0, 15.0, 13.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.1411285400390625, -0.135894775390625, -0.1306610107421875, -0.12542724609375, -0.1201934814453125, -0.114959716796875, -0.1097259521484375, -0.1044921875, -0.0992584228515625, -0.094024658203125, -0.0887908935546875, -0.08355712890625, -0.0783233642578125, -0.073089599609375, -0.0678558349609375, -0.0626220703125, -0.0573883056640625, -0.052154541015625, -0.0469207763671875, -0.04168701171875, -0.0364532470703125, -0.031219482421875, -0.0259857177734375, -0.020751953125, -0.0155181884765625, -0.010284423828125, -0.0050506591796875, 0.00018310546875, 0.0054168701171875, 0.010650634765625, 0.0158843994140625, 0.0211181640625, 0.0263519287109375, 0.031585693359375, 0.0368194580078125, 0.04205322265625, 0.0472869873046875, 0.052520751953125, 0.0577545166015625, 0.06298828125, 0.0682220458984375, 0.073455810546875, 0.0786895751953125, 0.08392333984375, 0.0891571044921875, 0.094390869140625, 0.0996246337890625, 0.1048583984375, 0.1100921630859375, 0.115325927734375, 0.1205596923828125, 0.12579345703125, 0.1310272216796875, 0.136260986328125, 0.1414947509765625, 0.146728515625, 0.1519622802734375, 0.157196044921875, 0.1624298095703125, 0.16766357421875, 0.1728973388671875, 0.178131103515625, 0.1833648681640625, 0.1885986328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 6.0, 8.0, 11.0, 9.0, 13.0, 16.0, 8.0, 22.0, 15.0, 24.0, 33.0, 31.0, 35.0, 31.0, 43.0, 36.0, 43.0, 36.0, 46.0, 45.0, 41.0, 41.0, 39.0, 45.0, 40.0, 45.0, 31.0, 16.0, 16.0, 24.0, 23.0, 24.0, 15.0, 17.0, 8.0, 2.0, 14.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13397979736328125, -0.1294097900390625, -0.12483978271484375, -0.120269775390625, -0.11569976806640625, -0.1111297607421875, -0.10655975341796875, -0.10198974609375, -0.09741973876953125, -0.0928497314453125, -0.08827972412109375, -0.083709716796875, -0.07913970947265625, -0.0745697021484375, -0.06999969482421875, -0.0654296875, -0.06085968017578125, -0.0562896728515625, -0.05171966552734375, -0.047149658203125, -0.04257965087890625, -0.0380096435546875, -0.03343963623046875, -0.02886962890625, -0.02429962158203125, -0.0197296142578125, -0.01515960693359375, -0.010589599609375, -0.00601959228515625, -0.0014495849609375, 0.00312042236328125, 0.0076904296875, 0.01226043701171875, 0.0168304443359375, 0.02140045166015625, 0.025970458984375, 0.03054046630859375, 0.0351104736328125, 0.03968048095703125, 0.04425048828125, 0.04882049560546875, 0.0533905029296875, 0.05796051025390625, 0.062530517578125, 0.06710052490234375, 0.0716705322265625, 0.07624053955078125, 0.080810546875, 0.08538055419921875, 0.0899505615234375, 0.09452056884765625, 0.099090576171875, 0.10366058349609375, 0.1082305908203125, 0.11280059814453125, 0.11737060546875, 0.12194061279296875, 0.1265106201171875, 0.13108062744140625, 0.135650634765625, 0.14022064208984375, 0.1447906494140625, 0.14936065673828125, 0.1539306640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 14.0, 23.0, 22.0, 50.0, 56.0, 83.0, 169.0, 272.0, 505.0, 1192.0, 2914.0, 8110.0, 27133.0, 110068.0, 450810.0, 342312.0, 75069.0, 19373.0, 6124.0, 2294.0, 918.0, 451.0, 211.0, 131.0, 79.0, 41.0, 37.0, 29.0, 15.0, 14.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.4658203125, -0.45318603515625, -0.4405517578125, -0.42791748046875, -0.415283203125, -0.40264892578125, -0.3900146484375, -0.37738037109375, -0.36474609375, -0.35211181640625, -0.3394775390625, -0.32684326171875, -0.314208984375, -0.30157470703125, -0.2889404296875, -0.27630615234375, -0.263671875, -0.25103759765625, -0.2384033203125, -0.22576904296875, -0.213134765625, -0.20050048828125, -0.1878662109375, -0.17523193359375, -0.16259765625, -0.14996337890625, -0.1373291015625, -0.12469482421875, -0.112060546875, -0.09942626953125, -0.0867919921875, -0.07415771484375, -0.0615234375, -0.04888916015625, -0.0362548828125, -0.02362060546875, -0.010986328125, 0.00164794921875, 0.0142822265625, 0.02691650390625, 0.03955078125, 0.05218505859375, 0.0648193359375, 0.07745361328125, 0.090087890625, 0.10272216796875, 0.1153564453125, 0.12799072265625, 0.140625, 0.15325927734375, 0.1658935546875, 0.17852783203125, 0.191162109375, 0.20379638671875, 0.2164306640625, 0.22906494140625, 0.24169921875, 0.25433349609375, 0.2669677734375, 0.27960205078125, 0.292236328125, 0.30487060546875, 0.3175048828125, 0.33013916015625, 0.3427734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 14.0, 15.0, 24.0, 36.0, 32.0, 50.0, 72.0, 67.0, 84.0, 82.0, 95.0, 95.0, 58.0, 59.0, 48.0, 38.0, 40.0, 20.0, 17.0, 17.0, 5.0, 4.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.04437255859375, -1.0155029296875, -0.98663330078125, -0.957763671875, -0.92889404296875, -0.9000244140625, -0.87115478515625, -0.84228515625, -0.81341552734375, -0.7845458984375, -0.75567626953125, -0.726806640625, -0.69793701171875, -0.6690673828125, -0.64019775390625, -0.611328125, -0.58245849609375, -0.5535888671875, -0.52471923828125, -0.495849609375, -0.46697998046875, -0.4381103515625, -0.40924072265625, -0.38037109375, -0.35150146484375, -0.3226318359375, -0.29376220703125, -0.264892578125, -0.23602294921875, -0.2071533203125, -0.17828369140625, -0.1494140625, -0.12054443359375, -0.0916748046875, -0.06280517578125, -0.033935546875, -0.00506591796875, 0.0238037109375, 0.05267333984375, 0.08154296875, 0.11041259765625, 0.1392822265625, 0.16815185546875, 0.197021484375, 0.22589111328125, 0.2547607421875, 0.28363037109375, 0.3125, 0.34136962890625, 0.3702392578125, 0.39910888671875, 0.427978515625, 0.45684814453125, 0.4857177734375, 0.51458740234375, 0.54345703125, 0.57232666015625, 0.6011962890625, 0.63006591796875, 0.658935546875, 0.68780517578125, 0.7166748046875, 0.74554443359375, 0.7744140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 12.0, 21.0, 19.0, 31.0, 63.0, 90.0, 144.0, 244.0, 488.0, 941.0, 1875.0, 3905.0, 8967.0, 22400.0, 62333.0, 192222.0, 389748.0, 237914.0, 79617.0, 27701.0, 10726.0, 4496.0, 2175.0, 1032.0, 555.0, 362.0, 188.0, 100.0, 56.0, 44.0, 19.0, 14.0, 10.0, 12.0, 5.0, 9.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1207275390625, -0.11713504791259766, -0.11354255676269531, -0.10995006561279297, -0.10635757446289062, -0.10276508331298828, -0.09917259216308594, -0.0955801010131836, -0.09198760986328125, -0.0883951187133789, -0.08480262756347656, -0.08121013641357422, -0.07761764526367188, -0.07402515411376953, -0.07043266296386719, -0.06684017181396484, -0.0632476806640625, -0.059655189514160156, -0.05606269836425781, -0.05247020721435547, -0.048877716064453125, -0.04528522491455078, -0.04169273376464844, -0.038100242614746094, -0.03450775146484375, -0.030915260314941406, -0.027322769165039062, -0.02373027801513672, -0.020137786865234375, -0.01654529571533203, -0.012952804565429688, -0.009360313415527344, -0.005767822265625, -0.0021753311157226562, 0.0014171600341796875, 0.005009651184082031, 0.008602142333984375, 0.012194633483886719, 0.015787124633789062, 0.019379615783691406, 0.02297210693359375, 0.026564598083496094, 0.030157089233398438, 0.03374958038330078, 0.037342071533203125, 0.04093456268310547, 0.04452705383300781, 0.048119544982910156, 0.0517120361328125, 0.055304527282714844, 0.05889701843261719, 0.06248950958251953, 0.06608200073242188, 0.06967449188232422, 0.07326698303222656, 0.0768594741821289, 0.08045196533203125, 0.0840444564819336, 0.08763694763183594, 0.09122943878173828, 0.09482192993164062, 0.09841442108154297, 0.10200691223144531, 0.10559940338134766, 0.10919189453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 7.0, 13.0, 14.0, 17.0, 19.0, 28.0, 33.0, 32.0, 39.0, 45.0, 62.0, 71.0, 71.0, 53.0, 57.0, 63.0, 60.0, 43.0, 53.0, 53.0, 29.0, 33.0, 27.0, 16.0, 16.0, 6.0, 7.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.772213727235794e-05, -1.7026439309120178e-05, -1.6330741345882416e-05, -1.5635043382644653e-05, -1.4939345419406891e-05, -1.4243647456169128e-05, -1.3547949492931366e-05, -1.2852251529693604e-05, -1.2156553566455841e-05, -1.1460855603218079e-05, -1.0765157639980316e-05, -1.0069459676742554e-05, -9.373761713504791e-06, -8.678063750267029e-06, -7.982365787029266e-06, -7.286667823791504e-06, -6.5909698605537415e-06, -5.895271897315979e-06, -5.1995739340782166e-06, -4.503875970840454e-06, -3.8081780076026917e-06, -3.112480044364929e-06, -2.4167820811271667e-06, -1.7210841178894043e-06, -1.0253861546516418e-06, -3.296881914138794e-07, 3.6600977182388306e-07, 1.0617077350616455e-06, 1.757405698299408e-06, 2.4531036615371704e-06, 3.148801624774933e-06, 3.844499588012695e-06, 4.540197551250458e-06, 5.23589551448822e-06, 5.931593477725983e-06, 6.627291440963745e-06, 7.3229894042015076e-06, 8.01868736743927e-06, 8.714385330677032e-06, 9.410083293914795e-06, 1.0105781257152557e-05, 1.080147922039032e-05, 1.1497177183628082e-05, 1.2192875146865845e-05, 1.2888573110103607e-05, 1.358427107334137e-05, 1.4279969036579132e-05, 1.4975666999816895e-05, 1.5671364963054657e-05, 1.636706292629242e-05, 1.7062760889530182e-05, 1.7758458852767944e-05, 1.8454156816005707e-05, 1.914985477924347e-05, 1.984555274248123e-05, 2.0541250705718994e-05, 2.1236948668956757e-05, 2.193264663219452e-05, 2.262834459543228e-05, 2.3324042558670044e-05, 2.4019740521907806e-05, 2.471543848514557e-05, 2.541113644838333e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 5.0, 14.0, 13.0, 16.0, 26.0, 58.0, 57.0, 94.0, 183.0, 289.0, 485.0, 931.0, 1986.0, 4569.0, 11205.0, 31078.0, 90337.0, 249379.0, 365059.0, 189130.0, 65364.0, 22926.0, 8622.0, 3422.0, 1500.0, 733.0, 407.0, 214.0, 146.0, 86.0, 60.0, 36.0, 32.0, 19.0, 17.0, 14.0, 5.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.11883544921875, -0.11547374725341797, -0.11211204528808594, -0.1087503433227539, -0.10538864135742188, -0.10202693939208984, -0.09866523742675781, -0.09530353546142578, -0.09194183349609375, -0.08858013153076172, -0.08521842956542969, -0.08185672760009766, -0.07849502563476562, -0.0751333236694336, -0.07177162170410156, -0.06840991973876953, -0.0650482177734375, -0.06168651580810547, -0.05832481384277344, -0.054963111877441406, -0.051601409912109375, -0.048239707946777344, -0.04487800598144531, -0.04151630401611328, -0.03815460205078125, -0.03479290008544922, -0.03143119812011719, -0.028069496154785156, -0.024707794189453125, -0.021346092224121094, -0.017984390258789062, -0.014622688293457031, -0.011260986328125, -0.007899284362792969, -0.0045375823974609375, -0.0011758804321289062, 0.002185821533203125, 0.005547523498535156, 0.008909225463867188, 0.012270927429199219, 0.01563262939453125, 0.01899433135986328, 0.022356033325195312, 0.025717735290527344, 0.029079437255859375, 0.032441139221191406, 0.03580284118652344, 0.03916454315185547, 0.0425262451171875, 0.04588794708251953, 0.04924964904785156, 0.052611351013183594, 0.055973052978515625, 0.059334754943847656, 0.06269645690917969, 0.06605815887451172, 0.06941986083984375, 0.07278156280517578, 0.07614326477050781, 0.07950496673583984, 0.08286666870117188, 0.0862283706665039, 0.08959007263183594, 0.09295177459716797, 0.0963134765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 9.0, 13.0, 6.0, 13.0, 12.0, 25.0, 25.0, 31.0, 29.0, 38.0, 58.0, 72.0, 72.0, 84.0, 86.0, 78.0, 74.0, 49.0, 49.0, 38.0, 29.0, 21.0, 20.0, 17.0, 10.0, 3.0, 6.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1478271484375, -0.14421463012695312, -0.14060211181640625, -0.13698959350585938, -0.1333770751953125, -0.12976455688476562, -0.12615203857421875, -0.12253952026367188, -0.118927001953125, -0.11531448364257812, -0.11170196533203125, -0.10808944702148438, -0.1044769287109375, -0.10086441040039062, -0.09725189208984375, -0.09363937377929688, -0.09002685546875, -0.08641433715820312, -0.08280181884765625, -0.07918930053710938, -0.0755767822265625, -0.07196426391601562, -0.06835174560546875, -0.06473922729492188, -0.061126708984375, -0.057514190673828125, -0.05390167236328125, -0.050289154052734375, -0.0466766357421875, -0.043064117431640625, -0.03945159912109375, -0.035839080810546875, -0.0322265625, -0.028614044189453125, -0.02500152587890625, -0.021389007568359375, -0.0177764892578125, -0.014163970947265625, -0.01055145263671875, -0.006938934326171875, -0.003326416015625, 0.000286102294921875, 0.00389862060546875, 0.007511138916015625, 0.0111236572265625, 0.014736175537109375, 0.01834869384765625, 0.021961212158203125, 0.02557373046875, 0.029186248779296875, 0.03279876708984375, 0.036411285400390625, 0.0400238037109375, 0.043636322021484375, 0.04724884033203125, 0.050861358642578125, 0.054473876953125, 0.058086395263671875, 0.06169891357421875, 0.06531143188476562, 0.0689239501953125, 0.07253646850585938, 0.07614898681640625, 0.07976150512695312, 0.0833740234375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 30.0, 64.0, 123.0, 186.0, 231.0, 169.0, 98.0, 47.0, 16.0, 7.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0367140769958496, -1.9678680896759033, -1.8990222215652466, -1.8301763534545898, -1.7613303661346436, -1.6924843788146973, -1.6236385107040405, -1.5547926425933838, -1.4859466552734375, -1.4171006679534912, -1.3482547998428345, -1.2794089317321777, -1.2105629444122314, -1.1417169570922852, -1.0728710889816284, -1.0040252208709717, -0.9351792335510254, -0.8663333058357239, -0.7974873781204224, -0.7286414504051208, -0.6597955226898193, -0.5909495949745178, -0.5221036672592163, -0.4532577395439148, -0.3844118118286133, -0.31556588411331177, -0.24671995639801025, -0.17787402868270874, -0.10902810096740723, -0.04018217325210571, 0.0286637544631958, 0.09750968217849731, 0.16635560989379883, 0.23520153760910034, 0.30404746532440186, 0.37289339303970337, 0.4417393207550049, 0.5105852484703064, 0.5794311761856079, 0.6482771039009094, 0.7171230316162109, 0.7859689593315125, 0.854814887046814, 0.9236608147621155, 0.992506742477417, 1.0613527297973633, 1.13019859790802, 1.1990444660186768, 1.267890453338623, 1.3367364406585693, 1.405582308769226, 1.4744281768798828, 1.543274164199829, 1.6121201515197754, 1.6809660196304321, 1.7498118877410889, 1.8186578750610352, 1.8875038623809814, 1.9563497304916382, 2.025195598602295, 2.094041585922241, 2.1628875732421875, 2.2317333221435547, 2.300579309463501, 2.3694252967834473]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 12.0, 11.0, 16.0, 17.0, 18.0, 29.0, 27.0, 35.0, 22.0, 31.0, 37.0, 32.0, 36.0, 43.0, 30.0, 40.0, 31.0, 42.0, 48.0, 42.0, 47.0, 35.0, 36.0, 40.0, 31.0, 32.0, 32.0, 22.0, 15.0, 9.0, 18.0, 15.0, 7.0, 4.0, 4.0, 8.0, 4.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0450348854064941, -1.010515809059143, -0.9759967923164368, -0.9414777159690857, -0.9069586396217346, -0.8724396228790283, -0.8379205465316772, -0.8034014701843262, -0.7688823938369751, -0.734363317489624, -0.6998443007469177, -0.6653252243995667, -0.6308061480522156, -0.5962871313095093, -0.5617680549621582, -0.5272489786148071, -0.49272996187210083, -0.45821091532707214, -0.42369183897972107, -0.3891727924346924, -0.3546537160873413, -0.3201346695423126, -0.28561562299728394, -0.25109654664993286, -0.21657750010490417, -0.1820584386587143, -0.14753937721252441, -0.11302033066749573, -0.07850126922130585, -0.04398220777511597, -0.00946316123008728, 0.0250559002161026, 0.05957496166229248, 0.09409402310848236, 0.12861308455467224, 0.16313213109970093, 0.1976511925458908, 0.2321702539920807, 0.2666893005371094, 0.30120837688446045, 0.33572742342948914, 0.3702464699745178, 0.4047655463218689, 0.4392845928668976, 0.47380363941192627, 0.5083227157592773, 0.5428417921066284, 0.5773608088493347, 0.6118798851966858, 0.6463989615440369, 0.6809179782867432, 0.7154370546340942, 0.7499561309814453, 0.7844752073287964, 0.8189942240715027, 0.8535133004188538, 0.8880323171615601, 0.9225513935089111, 0.9570704102516174, 0.9915894865989685, 1.0261085033416748, 1.0606275796890259, 1.095146656036377, 1.129665732383728, 1.164184808731079]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 19.0, 26.0, 28.0, 52.0, 75.0, 113.0, 173.0, 251.0, 427.0, 654.0, 1190.0, 2037.0, 3814.0, 7604.0, 16788.0, 43259.0, 125284.0, 366558.0, 899034.0, 1321572.0, 860287.0, 349970.0, 119665.0, 41672.0, 16613.0, 7835.0, 4053.0, 2178.0, 1156.0, 686.0, 438.0, 283.0, 169.0, 99.0, 60.0, 53.0, 29.0, 19.0, 17.0, 7.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.158935546875, -0.1541900634765625, -0.149444580078125, -0.1446990966796875, -0.13995361328125, -0.1352081298828125, -0.130462646484375, -0.1257171630859375, -0.1209716796875, -0.1162261962890625, -0.111480712890625, -0.1067352294921875, -0.10198974609375, -0.0972442626953125, -0.092498779296875, -0.0877532958984375, -0.0830078125, -0.0782623291015625, -0.073516845703125, -0.0687713623046875, -0.06402587890625, -0.0592803955078125, -0.054534912109375, -0.0497894287109375, -0.0450439453125, -0.0402984619140625, -0.035552978515625, -0.0308074951171875, -0.02606201171875, -0.0213165283203125, -0.016571044921875, -0.0118255615234375, -0.007080078125, -0.0023345947265625, 0.002410888671875, 0.0071563720703125, 0.01190185546875, 0.0166473388671875, 0.021392822265625, 0.0261383056640625, 0.0308837890625, 0.0356292724609375, 0.040374755859375, 0.0451202392578125, 0.04986572265625, 0.0546112060546875, 0.059356689453125, 0.0641021728515625, 0.06884765625, 0.0735931396484375, 0.078338623046875, 0.0830841064453125, 0.08782958984375, 0.0925750732421875, 0.097320556640625, 0.1020660400390625, 0.1068115234375, 0.1115570068359375, 0.116302490234375, 0.1210479736328125, 0.12579345703125, 0.1305389404296875, 0.135284423828125, 0.1400299072265625, 0.144775390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 1.0, 5.0, 4.0, 5.0, 11.0, 9.0, 8.0, 17.0, 23.0, 13.0, 20.0, 24.0, 24.0, 25.0, 34.0, 34.0, 36.0, 32.0, 38.0, 46.0, 31.0, 44.0, 34.0, 43.0, 26.0, 30.0, 38.0, 38.0, 38.0, 33.0, 38.0, 29.0, 22.0, 24.0, 15.0, 13.0, 24.0, 13.0, 9.0, 16.0, 5.0, 8.0, 5.0, 7.0, 0.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1632080078125, -0.15781211853027344, -0.15241622924804688, -0.1470203399658203, -0.14162445068359375, -0.1362285614013672, -0.13083267211914062, -0.12543678283691406, -0.1200408935546875, -0.11464500427246094, -0.10924911499023438, -0.10385322570800781, -0.09845733642578125, -0.09306144714355469, -0.08766555786132812, -0.08226966857910156, -0.076873779296875, -0.07147789001464844, -0.06608200073242188, -0.06068611145019531, -0.05529022216796875, -0.04989433288574219, -0.044498443603515625, -0.03910255432128906, -0.0337066650390625, -0.028310775756835938, -0.022914886474609375, -0.017518997192382812, -0.01212310791015625, -0.0067272186279296875, -0.001331329345703125, 0.0040645599365234375, 0.00946044921875, 0.014856338500976562, 0.020252227783203125, 0.025648117065429688, 0.03104400634765625, 0.03643989562988281, 0.041835784912109375, 0.04723167419433594, 0.0526275634765625, 0.05802345275878906, 0.06341934204101562, 0.06881523132324219, 0.07421112060546875, 0.07960700988769531, 0.08500289916992188, 0.09039878845214844, 0.095794677734375, 0.10119056701660156, 0.10658645629882812, 0.11198234558105469, 0.11737823486328125, 0.12277412414550781, 0.12817001342773438, 0.13356590270996094, 0.1389617919921875, 0.14435768127441406, 0.14975357055664062, 0.1551494598388672, 0.16054534912109375, 0.1659412384033203, 0.17133712768554688, 0.17673301696777344, 0.18212890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 5.0, 8.0, 21.0, 23.0, 38.0, 49.0, 125.0, 238.0, 452.0, 918.0, 2276.0, 7592.0, 41469.0, 524515.0, 3377718.0, 207209.0, 23266.0, 5167.0, 1704.0, 718.0, 361.0, 174.0, 99.0, 44.0, 32.0, 16.0, 16.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6328125, -0.6154022216796875, -0.597991943359375, -0.5805816650390625, -0.56317138671875, -0.5457611083984375, -0.528350830078125, -0.5109405517578125, -0.4935302734375, -0.4761199951171875, -0.458709716796875, -0.4412994384765625, -0.42388916015625, -0.4064788818359375, -0.389068603515625, -0.3716583251953125, -0.354248046875, -0.3368377685546875, -0.319427490234375, -0.3020172119140625, -0.28460693359375, -0.2671966552734375, -0.249786376953125, -0.2323760986328125, -0.2149658203125, -0.1975555419921875, -0.180145263671875, -0.1627349853515625, -0.14532470703125, -0.1279144287109375, -0.110504150390625, -0.0930938720703125, -0.07568359375, -0.0582733154296875, -0.040863037109375, -0.0234527587890625, -0.00604248046875, 0.0113677978515625, 0.028778076171875, 0.0461883544921875, 0.0635986328125, 0.0810089111328125, 0.098419189453125, 0.1158294677734375, 0.13323974609375, 0.1506500244140625, 0.168060302734375, 0.1854705810546875, 0.202880859375, 0.2202911376953125, 0.237701416015625, 0.2551116943359375, 0.27252197265625, 0.2899322509765625, 0.307342529296875, 0.3247528076171875, 0.3421630859375, 0.3595733642578125, 0.376983642578125, 0.3943939208984375, 0.41180419921875, 0.4292144775390625, 0.446624755859375, 0.4640350341796875, 0.4814453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 21.0, 22.0, 32.0, 38.0, 80.0, 122.0, 266.0, 576.0, 1002.0, 889.0, 445.0, 220.0, 132.0, 75.0, 43.0, 26.0, 19.0, 17.0, 16.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.64990234375, -0.6335945129394531, -0.6172866821289062, -0.6009788513183594, -0.5846710205078125, -0.5683631896972656, -0.5520553588867188, -0.5357475280761719, -0.519439697265625, -0.5031318664550781, -0.48682403564453125, -0.4705162048339844, -0.4542083740234375, -0.4379005432128906, -0.42159271240234375, -0.4052848815917969, -0.38897705078125, -0.3726692199707031, -0.35636138916015625, -0.3400535583496094, -0.3237457275390625, -0.3074378967285156, -0.29113006591796875, -0.2748222351074219, -0.258514404296875, -0.24220657348632812, -0.22589874267578125, -0.20959091186523438, -0.1932830810546875, -0.17697525024414062, -0.16066741943359375, -0.14435958862304688, -0.1280517578125, -0.11174392700195312, -0.09543609619140625, -0.07912826538085938, -0.0628204345703125, -0.046512603759765625, -0.03020477294921875, -0.013896942138671875, 0.002410888671875, 0.018718719482421875, 0.03502655029296875, 0.051334381103515625, 0.0676422119140625, 0.08395004272460938, 0.10025787353515625, 0.11656570434570312, 0.13287353515625, 0.14918136596679688, 0.16548919677734375, 0.18179702758789062, 0.1981048583984375, 0.21441268920898438, 0.23072052001953125, 0.24702835083007812, 0.263336181640625, 0.2796440124511719, 0.29595184326171875, 0.3122596740722656, 0.3285675048828125, 0.3448753356933594, 0.36118316650390625, 0.3774909973144531, 0.393798828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 8.0, 9.0, 26.0, 39.0, 52.0, 104.0, 113.0, 152.0, 124.0, 104.0, 100.0, 64.0, 34.0, 22.0, 18.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4177896976470947, -1.3625602722167969, -1.307330846786499, -1.2521015405654907, -1.1968721151351929, -1.141642689704895, -1.0864132642745972, -1.0311839580535889, -0.975954532623291, -0.9207251071929932, -0.8654957413673401, -0.8102663159370422, -0.7550369501113892, -0.6998075246810913, -0.6445780992507935, -0.5893487334251404, -0.5341193079948425, -0.47888991236686707, -0.4236605167388916, -0.36843109130859375, -0.3132017254829407, -0.2579723000526428, -0.20274290442466736, -0.1475135087966919, -0.09228411316871643, -0.03705471381545067, 0.018174685537815094, 0.07340408861637115, 0.12863348424434662, 0.18386289477348328, 0.23909229040145874, 0.2943216860294342, 0.34955108165740967, 0.40478047728538513, 0.4600098729133606, 0.5152392983436584, 0.5704686641693115, 0.6256980895996094, 0.6809275150299072, 0.7361568808555603, 0.7913862466812134, 0.8466156721115112, 0.9018450379371643, 0.9570744633674622, 1.0123038291931152, 1.067533254623413, 1.122762680053711, 1.1779921054840088, 1.2332215309143066, 1.2884509563446045, 1.3436803817749023, 1.3989096879959106, 1.4541391134262085, 1.5093685388565063, 1.5645979642868042, 1.6198272705078125, 1.6750566959381104, 1.7302861213684082, 1.785515546798706, 1.8407448530197144, 1.8959742784500122, 1.95120370388031, 2.0064330101013184, 2.061662435531616, 2.116891860961914]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 7.0, 6.0, 9.0, 7.0, 9.0, 15.0, 15.0, 13.0, 18.0, 28.0, 25.0, 23.0, 26.0, 30.0, 27.0, 37.0, 40.0, 50.0, 42.0, 30.0, 43.0, 32.0, 36.0, 26.0, 32.0, 26.0, 40.0, 37.0, 24.0, 29.0, 31.0, 22.0, 19.0, 22.0, 16.0, 10.0, 18.0, 14.0, 10.0, 12.0, 9.0, 9.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.96055006980896, -0.9320085644721985, -0.903467059135437, -0.8749254941940308, -0.8463839888572693, -0.8178424835205078, -0.7893009781837463, -0.7607594728469849, -0.7322179079055786, -0.7036764025688171, -0.6751348972320557, -0.6465933322906494, -0.6180518269538879, -0.5895103216171265, -0.560968816280365, -0.5324273109436035, -0.503885805606842, -0.47534430027008057, -0.4468027651309967, -0.41826125979423523, -0.38971972465515137, -0.3611782193183899, -0.3326367139816284, -0.30409520864486694, -0.2755536735057831, -0.2470121532678604, -0.21847063302993774, -0.18992912769317627, -0.1613876074552536, -0.13284608721733093, -0.10430458188056946, -0.07576306164264679, -0.047221601009368896, -0.018680084496736526, 0.009861432015895844, 0.038402944803237915, 0.06694446504116058, 0.09548598527908325, 0.12402749061584473, 0.1525690108537674, 0.18111053109169006, 0.20965205132961273, 0.2381935715675354, 0.2667350769042969, 0.29527658224105835, 0.3238181173801422, 0.3523596227169037, 0.38090115785598755, 0.409442663192749, 0.4379841685295105, 0.46652570366859436, 0.49506720900535583, 0.5236087441444397, 0.5521502494812012, 0.5806917548179626, 0.6092332601547241, 0.6377748250961304, 0.6663163304328918, 0.6948578357696533, 0.7233994007110596, 0.751940906047821, 0.7804824113845825, 0.809023916721344, 0.8375654220581055, 0.8661069273948669]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 4.0, 7.0, 10.0, 14.0, 10.0, 18.0, 17.0, 34.0, 49.0, 49.0, 80.0, 116.0, 205.0, 352.0, 644.0, 1111.0, 2133.0, 4414.0, 8930.0, 19463.0, 47067.0, 130341.0, 338778.0, 308020.0, 112157.0, 40913.0, 17118.0, 7902.0, 4068.0, 1982.0, 1004.0, 549.0, 360.0, 207.0, 133.0, 77.0, 56.0, 37.0, 27.0, 27.0, 12.0, 15.0, 10.0, 11.0, 8.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.292724609375, -0.2843437194824219, -0.27596282958984375, -0.2675819396972656, -0.2592010498046875, -0.2508201599121094, -0.24243927001953125, -0.23405838012695312, -0.225677490234375, -0.21729660034179688, -0.20891571044921875, -0.20053482055664062, -0.1921539306640625, -0.18377304077148438, -0.17539215087890625, -0.16701126098632812, -0.15863037109375, -0.15024948120117188, -0.14186859130859375, -0.13348770141601562, -0.1251068115234375, -0.11672592163085938, -0.10834503173828125, -0.09996414184570312, -0.091583251953125, -0.08320236206054688, -0.07482147216796875, -0.06644058227539062, -0.0580596923828125, -0.049678802490234375, -0.04129791259765625, -0.032917022705078125, -0.0245361328125, -0.016155242919921875, -0.00777435302734375, 0.000606536865234375, 0.0089874267578125, 0.017368316650390625, 0.02574920654296875, 0.034130096435546875, 0.042510986328125, 0.050891876220703125, 0.05927276611328125, 0.06765365600585938, 0.0760345458984375, 0.08441543579101562, 0.09279632568359375, 0.10117721557617188, 0.10955810546875, 0.11793899536132812, 0.12631988525390625, 0.13470077514648438, 0.1430816650390625, 0.15146255493164062, 0.15984344482421875, 0.16822433471679688, 0.176605224609375, 0.18498611450195312, 0.19336700439453125, 0.20174789428710938, 0.2101287841796875, 0.21850967407226562, 0.22689056396484375, 0.23527145385742188, 0.24365234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 10.0, 13.0, 7.0, 9.0, 12.0, 18.0, 21.0, 32.0, 23.0, 33.0, 23.0, 31.0, 32.0, 30.0, 38.0, 30.0, 40.0, 33.0, 47.0, 36.0, 34.0, 54.0, 29.0, 31.0, 36.0, 33.0, 31.0, 42.0, 28.0, 27.0, 20.0, 15.0, 15.0, 10.0, 18.0, 14.0, 9.0, 9.0, 0.0, 1.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17490577697753906, -0.16963577270507812, -0.1643657684326172, -0.15909576416015625, -0.1538257598876953, -0.14855575561523438, -0.14328575134277344, -0.1380157470703125, -0.13274574279785156, -0.12747573852539062, -0.12220573425292969, -0.11693572998046875, -0.11166572570800781, -0.10639572143554688, -0.10112571716308594, -0.095855712890625, -0.09058570861816406, -0.08531570434570312, -0.08004570007324219, -0.07477569580078125, -0.06950569152832031, -0.06423568725585938, -0.05896568298339844, -0.0536956787109375, -0.04842567443847656, -0.043155670166015625, -0.03788566589355469, -0.03261566162109375, -0.027345657348632812, -0.022075653076171875, -0.016805648803710938, -0.01153564453125, -0.0062656402587890625, -0.000995635986328125, 0.0042743682861328125, 0.00954437255859375, 0.014814376831054688, 0.020084381103515625, 0.025354385375976562, 0.0306243896484375, 0.03589439392089844, 0.041164398193359375, 0.04643440246582031, 0.05170440673828125, 0.05697441101074219, 0.062244415283203125, 0.06751441955566406, 0.072784423828125, 0.07805442810058594, 0.08332443237304688, 0.08859443664550781, 0.09386444091796875, 0.09913444519042969, 0.10440444946289062, 0.10967445373535156, 0.1149444580078125, 0.12021446228027344, 0.12548446655273438, 0.1307544708251953, 0.13602447509765625, 0.1412944793701172, 0.14656448364257812, 0.15183448791503906, 0.1571044921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 21.0, 40.0, 50.0, 71.0, 122.0, 194.0, 432.0, 772.0, 1623.0, 3546.0, 8865.0, 23669.0, 85265.0, 463893.0, 360159.0, 66505.0, 19905.0, 7375.0, 3122.0, 1362.0, 678.0, 373.0, 169.0, 123.0, 59.0, 49.0, 22.0, 17.0, 9.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.544921875, -0.5283660888671875, -0.511810302734375, -0.4952545166015625, -0.47869873046875, -0.4621429443359375, -0.445587158203125, -0.4290313720703125, -0.4124755859375, -0.3959197998046875, -0.379364013671875, -0.3628082275390625, -0.34625244140625, -0.3296966552734375, -0.313140869140625, -0.2965850830078125, -0.280029296875, -0.2634735107421875, -0.246917724609375, -0.2303619384765625, -0.21380615234375, -0.1972503662109375, -0.180694580078125, -0.1641387939453125, -0.1475830078125, -0.1310272216796875, -0.114471435546875, -0.0979156494140625, -0.08135986328125, -0.0648040771484375, -0.048248291015625, -0.0316925048828125, -0.01513671875, 0.0014190673828125, 0.017974853515625, 0.0345306396484375, 0.05108642578125, 0.0676422119140625, 0.084197998046875, 0.1007537841796875, 0.1173095703125, 0.1338653564453125, 0.150421142578125, 0.1669769287109375, 0.18353271484375, 0.2000885009765625, 0.216644287109375, 0.2332000732421875, 0.249755859375, 0.2663116455078125, 0.282867431640625, 0.2994232177734375, 0.31597900390625, 0.3325347900390625, 0.349090576171875, 0.3656463623046875, 0.3822021484375, 0.3987579345703125, 0.415313720703125, 0.4318695068359375, 0.44842529296875, 0.4649810791015625, 0.481536865234375, 0.4980926513671875, 0.5146484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 7.0, 12.0, 6.0, 9.0, 10.0, 14.0, 19.0, 23.0, 25.0, 41.0, 33.0, 34.0, 43.0, 40.0, 60.0, 50.0, 56.0, 48.0, 59.0, 49.0, 39.0, 47.0, 43.0, 30.0, 34.0, 33.0, 20.0, 17.0, 14.0, 7.0, 8.0, 12.0, 10.0, 16.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71630859375, -0.6935348510742188, -0.6707611083984375, -0.6479873657226562, -0.625213623046875, -0.6024398803710938, -0.5796661376953125, -0.5568923950195312, -0.53411865234375, -0.5113449096679688, -0.4885711669921875, -0.46579742431640625, -0.443023681640625, -0.42024993896484375, -0.3974761962890625, -0.37470245361328125, -0.3519287109375, -0.32915496826171875, -0.3063812255859375, -0.28360748291015625, -0.260833740234375, -0.23805999755859375, -0.2152862548828125, -0.19251251220703125, -0.16973876953125, -0.14696502685546875, -0.1241912841796875, -0.10141754150390625, -0.078643798828125, -0.05587005615234375, -0.0330963134765625, -0.01032257080078125, 0.012451171875, 0.03522491455078125, 0.0579986572265625, 0.08077239990234375, 0.103546142578125, 0.12631988525390625, 0.1490936279296875, 0.17186737060546875, 0.19464111328125, 0.21741485595703125, 0.2401885986328125, 0.26296234130859375, 0.285736083984375, 0.30850982666015625, 0.3312835693359375, 0.35405731201171875, 0.3768310546875, 0.39960479736328125, 0.4223785400390625, 0.44515228271484375, 0.467926025390625, 0.49069976806640625, 0.5134735107421875, 0.5362472534179688, 0.55902099609375, 0.5817947387695312, 0.6045684814453125, 0.6273422241210938, 0.650115966796875, 0.6728897094726562, 0.6956634521484375, 0.7184371948242188, 0.7412109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 16.0, 32.0, 53.0, 69.0, 78.0, 146.0, 227.0, 347.0, 581.0, 1002.0, 1741.0, 3063.0, 5015.0, 9196.0, 17105.0, 35927.0, 91086.0, 254509.0, 358869.0, 158273.0, 57070.0, 24746.0, 12575.0, 7045.0, 4015.0, 2243.0, 1339.0, 808.0, 498.0, 307.0, 188.0, 128.0, 77.0, 49.0, 35.0, 14.0, 17.0, 15.0, 7.0, 3.0, 9.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.0973501205444336, -0.09423637390136719, -0.09112262725830078, -0.08800888061523438, -0.08489513397216797, -0.08178138732910156, -0.07866764068603516, -0.07555389404296875, -0.07244014739990234, -0.06932640075683594, -0.06621265411376953, -0.06309890747070312, -0.05998516082763672, -0.05687141418457031, -0.053757667541503906, -0.0506439208984375, -0.047530174255371094, -0.04441642761230469, -0.04130268096923828, -0.038188934326171875, -0.03507518768310547, -0.03196144104003906, -0.028847694396972656, -0.02573394775390625, -0.022620201110839844, -0.019506454467773438, -0.01639270782470703, -0.013278961181640625, -0.010165214538574219, -0.0070514678955078125, -0.003937721252441406, -0.000823974609375, 0.0022897720336914062, 0.0054035186767578125, 0.008517265319824219, 0.011631011962890625, 0.014744758605957031, 0.017858505249023438, 0.020972251892089844, 0.02408599853515625, 0.027199745178222656, 0.030313491821289062, 0.03342723846435547, 0.036540985107421875, 0.03965473175048828, 0.04276847839355469, 0.045882225036621094, 0.0489959716796875, 0.052109718322753906, 0.05522346496582031, 0.05833721160888672, 0.061450958251953125, 0.06456470489501953, 0.06767845153808594, 0.07079219818115234, 0.07390594482421875, 0.07701969146728516, 0.08013343811035156, 0.08324718475341797, 0.08636093139648438, 0.08947467803955078, 0.09258842468261719, 0.0957021713256836, 0.09881591796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 9.0, 3.0, 6.0, 10.0, 15.0, 29.0, 62.0, 97.0, 164.0, 163.0, 165.0, 109.0, 58.0, 32.0, 20.0, 13.0, 2.0, 5.0, 10.0, 8.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.16312026977539e-05, -5.9985555708408356e-05, -5.8339908719062805e-05, -5.6694261729717255e-05, -5.5048614740371704e-05, -5.3402967751026154e-05, -5.17573207616806e-05, -5.011167377233505e-05, -4.84660267829895e-05, -4.682037979364395e-05, -4.51747328042984e-05, -4.352908581495285e-05, -4.18834388256073e-05, -4.023779183626175e-05, -3.85921448469162e-05, -3.694649785757065e-05, -3.53008508682251e-05, -3.365520387887955e-05, -3.2009556889533997e-05, -3.0363909900188446e-05, -2.8718262910842896e-05, -2.7072615921497345e-05, -2.5426968932151794e-05, -2.3781321942806244e-05, -2.2135674953460693e-05, -2.0490027964115143e-05, -1.8844380974769592e-05, -1.7198733985424042e-05, -1.555308699607849e-05, -1.390744000673294e-05, -1.226179301738739e-05, -1.061614602804184e-05, -8.970499038696289e-06, -7.3248520493507385e-06, -5.679205060005188e-06, -4.0335580706596375e-06, -2.387911081314087e-06, -7.422640919685364e-07, 9.033828973770142e-07, 2.5490298867225647e-06, 4.194676876068115e-06, 5.840323865413666e-06, 7.485970854759216e-06, 9.131617844104767e-06, 1.0777264833450317e-05, 1.2422911822795868e-05, 1.4068558812141418e-05, 1.571420580148697e-05, 1.735985279083252e-05, 1.900549978017807e-05, 2.065114676952362e-05, 2.229679375886917e-05, 2.394244074821472e-05, 2.5588087737560272e-05, 2.7233734726905823e-05, 2.8879381716251373e-05, 3.0525028705596924e-05, 3.2170675694942474e-05, 3.3816322684288025e-05, 3.5461969673633575e-05, 3.7107616662979126e-05, 3.8753263652324677e-05, 4.039891064167023e-05, 4.204455763101578e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 8.0, 10.0, 10.0, 15.0, 20.0, 36.0, 53.0, 88.0, 115.0, 222.0, 398.0, 757.0, 1485.0, 3151.0, 6940.0, 15849.0, 38254.0, 102893.0, 268560.0, 345716.0, 163171.0, 58837.0, 23061.0, 10004.0, 4555.0, 2032.0, 1021.0, 507.0, 293.0, 196.0, 97.0, 65.0, 48.0, 23.0, 18.0, 10.0, 11.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.103515625, -0.10039997100830078, -0.09728431701660156, -0.09416866302490234, -0.09105300903320312, -0.0879373550415039, -0.08482170104980469, -0.08170604705810547, -0.07859039306640625, -0.07547473907470703, -0.07235908508300781, -0.0692434310913086, -0.06612777709960938, -0.06301212310791016, -0.05989646911621094, -0.05678081512451172, -0.0536651611328125, -0.05054950714111328, -0.04743385314941406, -0.044318199157714844, -0.041202545166015625, -0.038086891174316406, -0.03497123718261719, -0.03185558319091797, -0.02873992919921875, -0.02562427520751953, -0.022508621215820312, -0.019392967224121094, -0.016277313232421875, -0.013161659240722656, -0.010046005249023438, -0.006930351257324219, -0.003814697265625, -0.0006990432739257812, 0.0024166107177734375, 0.005532264709472656, 0.008647918701171875, 0.011763572692871094, 0.014879226684570312, 0.01799488067626953, 0.02111053466796875, 0.02422618865966797, 0.027341842651367188, 0.030457496643066406, 0.033573150634765625, 0.036688804626464844, 0.03980445861816406, 0.04292011260986328, 0.0460357666015625, 0.04915142059326172, 0.05226707458496094, 0.055382728576660156, 0.058498382568359375, 0.061614036560058594, 0.06472969055175781, 0.06784534454345703, 0.07096099853515625, 0.07407665252685547, 0.07719230651855469, 0.0803079605102539, 0.08342361450195312, 0.08653926849365234, 0.08965492248535156, 0.09277057647705078, 0.09588623046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 13.0, 5.0, 15.0, 10.0, 22.0, 26.0, 31.0, 42.0, 48.0, 68.0, 81.0, 79.0, 82.0, 93.0, 83.0, 66.0, 67.0, 30.0, 26.0, 21.0, 21.0, 13.0, 6.0, 6.0, 6.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.142822265625, -0.13868427276611328, -0.13454627990722656, -0.13040828704833984, -0.12627029418945312, -0.1221323013305664, -0.11799430847167969, -0.11385631561279297, -0.10971832275390625, -0.10558032989501953, -0.10144233703613281, -0.0973043441772461, -0.09316635131835938, -0.08902835845947266, -0.08489036560058594, -0.08075237274169922, -0.0766143798828125, -0.07247638702392578, -0.06833839416503906, -0.06420040130615234, -0.060062408447265625, -0.055924415588378906, -0.05178642272949219, -0.04764842987060547, -0.04351043701171875, -0.03937244415283203, -0.03523445129394531, -0.031096458435058594, -0.026958465576171875, -0.022820472717285156, -0.018682479858398438, -0.014544486999511719, -0.010406494140625, -0.006268501281738281, -0.0021305084228515625, 0.0020074844360351562, 0.006145477294921875, 0.010283470153808594, 0.014421463012695312, 0.01855945587158203, 0.02269744873046875, 0.02683544158935547, 0.030973434448242188, 0.035111427307128906, 0.039249420166015625, 0.043387413024902344, 0.04752540588378906, 0.05166339874267578, 0.0558013916015625, 0.05993938446044922, 0.06407737731933594, 0.06821537017822266, 0.07235336303710938, 0.0764913558959961, 0.08062934875488281, 0.08476734161376953, 0.08890533447265625, 0.09304332733154297, 0.09718132019042969, 0.1013193130493164, 0.10545730590820312, 0.10959529876708984, 0.11373329162597656, 0.11787128448486328, 0.12200927734375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 9.0, 14.0, 15.0, 42.0, 50.0, 98.0, 111.0, 164.0, 133.0, 125.0, 80.0, 56.0, 39.0, 20.0, 12.0, 10.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2149240970611572, -2.153782844543457, -2.092641830444336, -2.0315005779266357, -1.9703595638275146, -1.909218430519104, -1.8480772972106934, -1.7869360446929932, -1.725795030593872, -1.6646538972854614, -1.6035127639770508, -1.5423716306686401, -1.4812304973602295, -1.4200893640518188, -1.3589482307434082, -1.297806978225708, -1.2366658449172974, -1.1755247116088867, -1.114383578300476, -1.0532424449920654, -0.9921013116836548, -0.9309601783752441, -0.8698189854621887, -0.8086778521537781, -0.7475367188453674, -0.6863955855369568, -0.6252544522285461, -0.5641132593154907, -0.5029721260070801, -0.4418310225009918, -0.3806898593902588, -0.31954872608184814, -0.25840747356414795, -0.1972663402557373, -0.13612519204616547, -0.07498404383659363, -0.013842910528182983, 0.04729822278022766, 0.1084393858909607, 0.16958051919937134, 0.23072165250778198, 0.2918627858161926, 0.35300391912460327, 0.4141450822353363, 0.47528621554374695, 0.53642737865448, 0.5975685119628906, 0.6587096452713013, 0.7198507785797119, 0.7809919118881226, 0.8421330451965332, 0.9032741785049438, 0.9644153118133545, 1.0255564451217651, 1.0866975784301758, 1.147838830947876, 1.208979845046997, 1.2701209783554077, 1.3312621116638184, 1.392403244972229, 1.4535443782806396, 1.5146855115890503, 1.575826644897461, 1.6369678974151611, 1.6981090307235718]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 8.0, 6.0, 9.0, 7.0, 8.0, 10.0, 10.0, 18.0, 20.0, 32.0, 23.0, 33.0, 28.0, 27.0, 35.0, 46.0, 33.0, 32.0, 38.0, 40.0, 37.0, 36.0, 36.0, 46.0, 45.0, 34.0, 31.0, 44.0, 30.0, 28.0, 25.0, 27.0, 14.0, 16.0, 14.0, 12.0, 6.0, 13.0, 6.0, 11.0, 3.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.407486915588379, -1.361666202545166, -1.3158454895019531, -1.2700247764587402, -1.2242040634155273, -1.1783833503723145, -1.1325626373291016, -1.0867419242858887, -1.0409212112426758, -0.9951004981994629, -0.94927978515625, -0.9034590721130371, -0.8576383590698242, -0.8118176460266113, -0.7659968733787537, -0.7201761603355408, -0.6743553876876831, -0.6285346746444702, -0.5827139616012573, -0.5368932485580444, -0.49107250571250916, -0.44525179266929626, -0.399431049823761, -0.3536103367805481, -0.3077896237373352, -0.2619689106941223, -0.21614818274974823, -0.17032745480537415, -0.12450674176216125, -0.07868602871894836, -0.032865285873413086, 0.012955427169799805, 0.058776140213012695, 0.10459686070680618, 0.15041758120059967, 0.19623830914497375, 0.24205902218818665, 0.28787973523139954, 0.3337004780769348, 0.3795211911201477, 0.4253419041633606, 0.4711626172065735, 0.5169833302497864, 0.562804102897644, 0.6086248159408569, 0.6544455289840698, 0.7002662420272827, 0.7460869550704956, 0.7919076681137085, 0.8377283811569214, 0.8835490942001343, 0.9293698072433472, 0.9751905202865601, 1.021011233329773, 1.0668320655822754, 1.1126527786254883, 1.1584734916687012, 1.204294204711914, 1.250114917755127, 1.2959356307983398, 1.3417563438415527, 1.3875770568847656, 1.4333977699279785, 1.4792184829711914, 1.5250391960144043]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 14.0, 20.0, 24.0, 44.0, 45.0, 65.0, 118.0, 182.0, 244.0, 395.0, 665.0, 973.0, 1684.0, 2975.0, 5592.0, 11630.0, 24756.0, 55884.0, 119571.0, 247880.0, 488376.0, 790214.0, 906262.0, 698090.0, 428786.0, 223436.0, 101641.0, 43735.0, 19654.0, 9757.0, 4921.0, 2583.0, 1517.0, 860.0, 594.0, 356.0, 249.0, 178.0, 106.0, 69.0, 46.0, 37.0, 19.0, 10.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1162109375, -0.11225700378417969, -0.10830307006835938, -0.10434913635253906, -0.10039520263671875, -0.09644126892089844, -0.09248733520507812, -0.08853340148925781, -0.0845794677734375, -0.08062553405761719, -0.07667160034179688, -0.07271766662597656, -0.06876373291015625, -0.06480979919433594, -0.060855865478515625, -0.05690193176269531, -0.052947998046875, -0.04899406433105469, -0.045040130615234375, -0.04108619689941406, -0.03713226318359375, -0.03317832946777344, -0.029224395751953125, -0.025270462036132812, -0.0213165283203125, -0.017362594604492188, -0.013408660888671875, -0.009454727172851562, -0.00550079345703125, -0.0015468597412109375, 0.002407073974609375, 0.0063610076904296875, 0.01031494140625, 0.014268875122070312, 0.018222808837890625, 0.022176742553710938, 0.02613067626953125, 0.030084609985351562, 0.034038543701171875, 0.03799247741699219, 0.0419464111328125, 0.04590034484863281, 0.049854278564453125, 0.05380821228027344, 0.05776214599609375, 0.06171607971191406, 0.06567001342773438, 0.06962394714355469, 0.073577880859375, 0.07753181457519531, 0.08148574829101562, 0.08543968200683594, 0.08939361572265625, 0.09334754943847656, 0.09730148315429688, 0.10125541687011719, 0.1052093505859375, 0.10916328430175781, 0.11311721801757812, 0.11707115173339844, 0.12102508544921875, 0.12497901916503906, 0.12893295288085938, 0.1328868865966797, 0.1368408203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 4.0, 9.0, 9.0, 11.0, 17.0, 16.0, 31.0, 15.0, 32.0, 19.0, 28.0, 39.0, 27.0, 32.0, 37.0, 48.0, 44.0, 49.0, 35.0, 50.0, 43.0, 47.0, 48.0, 47.0, 39.0, 30.0, 29.0, 29.0, 23.0, 26.0, 13.0, 12.0, 6.0, 7.0, 6.0, 5.0, 8.0, 5.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.251708984375, -0.24436187744140625, -0.2370147705078125, -0.22966766357421875, -0.222320556640625, -0.21497344970703125, -0.2076263427734375, -0.20027923583984375, -0.19293212890625, -0.18558502197265625, -0.1782379150390625, -0.17089080810546875, -0.163543701171875, -0.15619659423828125, -0.1488494873046875, -0.14150238037109375, -0.1341552734375, -0.12680816650390625, -0.1194610595703125, -0.11211395263671875, -0.104766845703125, -0.09741973876953125, -0.0900726318359375, -0.08272552490234375, -0.07537841796875, -0.06803131103515625, -0.0606842041015625, -0.05333709716796875, -0.045989990234375, -0.03864288330078125, -0.0312957763671875, -0.02394866943359375, -0.0166015625, -0.00925445556640625, -0.0019073486328125, 0.00543975830078125, 0.012786865234375, 0.02013397216796875, 0.0274810791015625, 0.03482818603515625, 0.04217529296875, 0.04952239990234375, 0.0568695068359375, 0.06421661376953125, 0.071563720703125, 0.07891082763671875, 0.0862579345703125, 0.09360504150390625, 0.1009521484375, 0.10829925537109375, 0.1156463623046875, 0.12299346923828125, 0.130340576171875, 0.13768768310546875, 0.1450347900390625, 0.15238189697265625, 0.15972900390625, 0.16707611083984375, 0.1744232177734375, 0.18177032470703125, 0.189117431640625, 0.19646453857421875, 0.2038116455078125, 0.21115875244140625, 0.218505859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 14.0, 31.0, 44.0, 66.0, 146.0, 295.0, 642.0, 1797.0, 7409.0, 58673.0, 1559643.0, 2466889.0, 85574.0, 9513.0, 2112.0, 763.0, 295.0, 168.0, 93.0, 43.0, 18.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7692031860351562, -0.7478790283203125, -0.7265548706054688, -0.705230712890625, -0.6839065551757812, -0.6625823974609375, -0.6412582397460938, -0.61993408203125, -0.5986099243164062, -0.5772857666015625, -0.5559616088867188, -0.534637451171875, -0.5133132934570312, -0.4919891357421875, -0.47066497802734375, -0.4493408203125, -0.42801666259765625, -0.4066925048828125, -0.38536834716796875, -0.364044189453125, -0.34272003173828125, -0.3213958740234375, -0.30007171630859375, -0.27874755859375, -0.25742340087890625, -0.2360992431640625, -0.21477508544921875, -0.193450927734375, -0.17212677001953125, -0.1508026123046875, -0.12947845458984375, -0.108154296875, -0.08683013916015625, -0.0655059814453125, -0.04418182373046875, -0.022857666015625, -0.00153350830078125, 0.0197906494140625, 0.04111480712890625, 0.06243896484375, 0.08376312255859375, 0.1050872802734375, 0.12641143798828125, 0.147735595703125, 0.16905975341796875, 0.1903839111328125, 0.21170806884765625, 0.2330322265625, 0.25435638427734375, 0.2756805419921875, 0.29700469970703125, 0.318328857421875, 0.33965301513671875, 0.3609771728515625, 0.38230133056640625, 0.40362548828125, 0.42494964599609375, 0.4462738037109375, 0.46759796142578125, 0.488922119140625, 0.5102462768554688, 0.5315704345703125, 0.5528945922851562, 0.57421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 21.0, 31.0, 41.0, 52.0, 113.0, 207.0, 413.0, 650.0, 894.0, 710.0, 384.0, 210.0, 116.0, 64.0, 49.0, 36.0, 20.0, 13.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.6905746459960938, -0.6726531982421875, -0.6547317504882812, -0.636810302734375, -0.6188888549804688, -0.6009674072265625, -0.5830459594726562, -0.56512451171875, -0.5472030639648438, -0.5292816162109375, -0.5113601684570312, -0.493438720703125, -0.47551727294921875, -0.4575958251953125, -0.43967437744140625, -0.4217529296875, -0.40383148193359375, -0.3859100341796875, -0.36798858642578125, -0.350067138671875, -0.33214569091796875, -0.3142242431640625, -0.29630279541015625, -0.27838134765625, -0.26045989990234375, -0.2425384521484375, -0.22461700439453125, -0.206695556640625, -0.18877410888671875, -0.1708526611328125, -0.15293121337890625, -0.135009765625, -0.11708831787109375, -0.0991668701171875, -0.08124542236328125, -0.063323974609375, -0.04540252685546875, -0.0274810791015625, -0.00955963134765625, 0.00836181640625, 0.02628326416015625, 0.0442047119140625, 0.06212615966796875, 0.080047607421875, 0.09796905517578125, 0.1158905029296875, 0.13381195068359375, 0.1517333984375, 0.16965484619140625, 0.1875762939453125, 0.20549774169921875, 0.223419189453125, 0.24134063720703125, 0.2592620849609375, 0.27718353271484375, 0.29510498046875, 0.31302642822265625, 0.3309478759765625, 0.34886932373046875, 0.366790771484375, 0.38471221923828125, 0.4026336669921875, 0.42055511474609375, 0.4384765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 3.0, 14.0, 28.0, 31.0, 45.0, 77.0, 76.0, 67.0, 96.0, 100.0, 96.0, 86.0, 71.0, 57.0, 48.0, 29.0, 17.0, 13.0, 9.0, 5.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.312841534614563, -1.265079140663147, -1.2173168659210205, -1.1695544719696045, -1.1217920780181885, -1.0740296840667725, -1.026267409324646, -0.97850501537323, -0.9307426810264587, -0.8829803466796875, -0.8352179527282715, -0.7874556183815002, -0.739693284034729, -0.691930890083313, -0.6441685557365417, -0.5964062213897705, -0.5486438274383545, -0.5008814930915833, -0.45311909914016724, -0.405356764793396, -0.35759440064430237, -0.30983203649520874, -0.2620697021484375, -0.21430733799934387, -0.16654497385025024, -0.11878261715173721, -0.07102026045322418, -0.023257911205291748, 0.02450445294380188, 0.07226681709289551, 0.12002915143966675, 0.16779151558876038, 0.21555376052856445, 0.2633161246776581, 0.3110784888267517, 0.35884082317352295, 0.4066031873226166, 0.4543655514717102, 0.5021278858184814, 0.5498902797698975, 0.5976526141166687, 0.6454149484634399, 0.693177342414856, 0.7409396767616272, 0.7887020111083984, 0.8364644050598145, 0.8842267394065857, 0.9319890737533569, 0.979751467704773, 1.027513861656189, 1.0752761363983154, 1.1230385303497314, 1.1708009243011475, 1.2185633182525635, 1.26632559299469, 1.314087986946106, 1.3618502616882324, 1.4096126556396484, 1.457374930381775, 1.505137324333191, 1.552899718284607, 1.6006619930267334, 1.6484243869781494, 1.6961867809295654, 1.7439491748809814]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 8.0, 9.0, 6.0, 12.0, 5.0, 7.0, 12.0, 18.0, 15.0, 17.0, 22.0, 31.0, 31.0, 30.0, 39.0, 37.0, 33.0, 36.0, 35.0, 51.0, 46.0, 48.0, 40.0, 38.0, 48.0, 41.0, 37.0, 25.0, 29.0, 33.0, 13.0, 20.0, 22.0, 19.0, 19.0, 16.0, 11.0, 4.0, 10.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.2578117847442627, -1.2224985361099243, -1.187185287475586, -1.151872158050537, -1.1165589094161987, -1.0812456607818604, -1.0459325313568115, -1.0106192827224731, -0.9753060340881348, -0.9399927854537964, -0.9046795964241028, -0.8693664073944092, -0.8340531587600708, -0.7987399101257324, -0.7634267210960388, -0.7281135320663452, -0.6928002834320068, -0.6574870347976685, -0.6221738457679749, -0.5868606567382812, -0.5515474081039429, -0.5162341594696045, -0.4809209704399109, -0.4456077516078949, -0.4102945327758789, -0.3749813139438629, -0.3396680951118469, -0.30435487627983093, -0.26904165744781494, -0.23372843861579895, -0.19841521978378296, -0.16310200095176697, -0.12778878211975098, -0.09247556328773499, -0.057162344455718994, -0.021849125623703003, 0.013464093208312988, 0.04877731204032898, 0.08409053087234497, 0.11940374970436096, 0.15471696853637695, 0.19003018736839294, 0.22534340620040894, 0.2606566250324249, 0.2959698438644409, 0.3312830626964569, 0.3665962815284729, 0.4019095003604889, 0.4372227191925049, 0.4725359380245209, 0.5078491568565369, 0.5431623458862305, 0.5784755945205688, 0.6137888431549072, 0.6491020321846008, 0.6844152212142944, 0.7197284698486328, 0.7550417184829712, 0.7903549075126648, 0.8256680965423584, 0.8609813451766968, 0.8962945938110352, 0.9316077828407288, 0.9669209718704224, 1.0022342205047607]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 2.0, 9.0, 10.0, 13.0, 27.0, 35.0, 36.0, 72.0, 88.0, 155.0, 221.0, 354.0, 574.0, 981.0, 1586.0, 2609.0, 4538.0, 7979.0, 14266.0, 27986.0, 61800.0, 151849.0, 297153.0, 260351.0, 116413.0, 48258.0, 22805.0, 12041.0, 6782.0, 3871.0, 2161.0, 1306.0, 824.0, 492.0, 307.0, 170.0, 135.0, 87.0, 61.0, 40.0, 32.0, 28.0, 17.0, 14.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.23702430725097656, -0.22880935668945312, -0.2205944061279297, -0.21237945556640625, -0.2041645050048828, -0.19594955444335938, -0.18773460388183594, -0.1795196533203125, -0.17130470275878906, -0.16308975219726562, -0.1548748016357422, -0.14665985107421875, -0.1384449005126953, -0.13022994995117188, -0.12201499938964844, -0.113800048828125, -0.10558509826660156, -0.09737014770507812, -0.08915519714355469, -0.08094024658203125, -0.07272529602050781, -0.06451034545898438, -0.05629539489746094, -0.0480804443359375, -0.03986549377441406, -0.031650543212890625, -0.023435592651367188, -0.01522064208984375, -0.0070056915283203125, 0.001209259033203125, 0.009424209594726562, 0.01763916015625, 0.025854110717773438, 0.034069061279296875, 0.04228401184082031, 0.05049896240234375, 0.05871391296386719, 0.06692886352539062, 0.07514381408691406, 0.0833587646484375, 0.09157371520996094, 0.09978866577148438, 0.10800361633300781, 0.11621856689453125, 0.12443351745605469, 0.13264846801757812, 0.14086341857910156, 0.149078369140625, 0.15729331970214844, 0.16550827026367188, 0.1737232208251953, 0.18193817138671875, 0.1901531219482422, 0.19836807250976562, 0.20658302307128906, 0.2147979736328125, 0.22301292419433594, 0.23122787475585938, 0.2394428253173828, 0.24765777587890625, 0.2558727264404297, 0.2640876770019531, 0.27230262756347656, 0.280517578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 9.0, 10.0, 17.0, 19.0, 20.0, 26.0, 27.0, 26.0, 29.0, 37.0, 32.0, 38.0, 46.0, 50.0, 52.0, 40.0, 48.0, 47.0, 54.0, 49.0, 38.0, 30.0, 31.0, 22.0, 23.0, 25.0, 27.0, 21.0, 11.0, 12.0, 10.0, 9.0, 10.0, 10.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.19951629638671875, -0.1924896240234375, -0.18546295166015625, -0.178436279296875, -0.17140960693359375, -0.1643829345703125, -0.15735626220703125, -0.15032958984375, -0.14330291748046875, -0.1362762451171875, -0.12924957275390625, -0.122222900390625, -0.11519622802734375, -0.1081695556640625, -0.10114288330078125, -0.0941162109375, -0.08708953857421875, -0.0800628662109375, -0.07303619384765625, -0.066009521484375, -0.05898284912109375, -0.0519561767578125, -0.04492950439453125, -0.03790283203125, -0.03087615966796875, -0.0238494873046875, -0.01682281494140625, -0.009796142578125, -0.00276947021484375, 0.0042572021484375, 0.01128387451171875, 0.018310546875, 0.02533721923828125, 0.0323638916015625, 0.03939056396484375, 0.046417236328125, 0.05344390869140625, 0.0604705810546875, 0.06749725341796875, 0.07452392578125, 0.08155059814453125, 0.0885772705078125, 0.09560394287109375, 0.102630615234375, 0.10965728759765625, 0.1166839599609375, 0.12371063232421875, 0.1307373046875, 0.13776397705078125, 0.1447906494140625, 0.15181732177734375, 0.158843994140625, 0.16587066650390625, 0.1728973388671875, 0.17992401123046875, 0.18695068359375, 0.19397735595703125, 0.2010040283203125, 0.20803070068359375, 0.215057373046875, 0.22208404541015625, 0.2291107177734375, 0.23613739013671875, 0.2431640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 14.0, 22.0, 21.0, 41.0, 40.0, 69.0, 93.0, 156.0, 332.0, 569.0, 1175.0, 2642.0, 6283.0, 15101.0, 38135.0, 109707.0, 370849.0, 342473.0, 100575.0, 35436.0, 14098.0, 5789.0, 2534.0, 1083.0, 525.0, 303.0, 165.0, 102.0, 79.0, 27.0, 23.0, 19.0, 14.0, 12.0, 9.0, 11.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4091796875, -0.395050048828125, -0.38092041015625, -0.366790771484375, -0.3526611328125, -0.338531494140625, -0.32440185546875, -0.310272216796875, -0.296142578125, -0.282012939453125, -0.26788330078125, -0.253753662109375, -0.2396240234375, -0.225494384765625, -0.21136474609375, -0.197235107421875, -0.18310546875, -0.168975830078125, -0.15484619140625, -0.140716552734375, -0.1265869140625, -0.112457275390625, -0.09832763671875, -0.084197998046875, -0.070068359375, -0.055938720703125, -0.04180908203125, -0.027679443359375, -0.0135498046875, 0.000579833984375, 0.01470947265625, 0.028839111328125, 0.04296875, 0.057098388671875, 0.07122802734375, 0.085357666015625, 0.0994873046875, 0.113616943359375, 0.12774658203125, 0.141876220703125, 0.156005859375, 0.170135498046875, 0.18426513671875, 0.198394775390625, 0.2125244140625, 0.226654052734375, 0.24078369140625, 0.254913330078125, 0.26904296875, 0.283172607421875, 0.29730224609375, 0.311431884765625, 0.3255615234375, 0.339691162109375, 0.35382080078125, 0.367950439453125, 0.382080078125, 0.396209716796875, 0.41033935546875, 0.424468994140625, 0.4385986328125, 0.452728271484375, 0.46685791015625, 0.480987548828125, 0.4951171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 1.0, 9.0, 12.0, 10.0, 16.0, 17.0, 15.0, 31.0, 30.0, 29.0, 28.0, 41.0, 37.0, 56.0, 55.0, 52.0, 60.0, 55.0, 47.0, 61.0, 47.0, 54.0, 30.0, 26.0, 38.0, 27.0, 17.0, 21.0, 9.0, 14.0, 8.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.781097412109375, -0.75408935546875, -0.727081298828125, -0.7000732421875, -0.673065185546875, -0.64605712890625, -0.619049072265625, -0.592041015625, -0.565032958984375, -0.53802490234375, -0.511016845703125, -0.4840087890625, -0.457000732421875, -0.42999267578125, -0.402984619140625, -0.3759765625, -0.348968505859375, -0.32196044921875, -0.294952392578125, -0.2679443359375, -0.240936279296875, -0.21392822265625, -0.186920166015625, -0.159912109375, -0.132904052734375, -0.10589599609375, -0.078887939453125, -0.0518798828125, -0.024871826171875, 0.00213623046875, 0.029144287109375, 0.05615234375, 0.083160400390625, 0.11016845703125, 0.137176513671875, 0.1641845703125, 0.191192626953125, 0.21820068359375, 0.245208740234375, 0.272216796875, 0.299224853515625, 0.32623291015625, 0.353240966796875, 0.3802490234375, 0.407257080078125, 0.43426513671875, 0.461273193359375, 0.48828125, 0.515289306640625, 0.54229736328125, 0.569305419921875, 0.5963134765625, 0.623321533203125, 0.65032958984375, 0.677337646484375, 0.704345703125, 0.731353759765625, 0.75836181640625, 0.785369873046875, 0.8123779296875, 0.839385986328125, 0.86639404296875, 0.893402099609375, 0.92041015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 9.0, 25.0, 30.0, 40.0, 67.0, 89.0, 105.0, 202.0, 309.0, 483.0, 740.0, 1145.0, 1861.0, 2939.0, 4793.0, 7669.0, 13415.0, 24459.0, 48517.0, 109502.0, 238368.0, 289311.0, 159972.0, 68712.0, 32814.0, 17259.0, 9906.0, 5892.0, 3651.0, 2210.0, 1433.0, 938.0, 547.0, 366.0, 260.0, 142.0, 113.0, 74.0, 57.0, 31.0, 19.0, 16.0, 9.0, 9.0, 8.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.09527587890625, -0.0924081802368164, -0.08954048156738281, -0.08667278289794922, -0.08380508422851562, -0.08093738555908203, -0.07806968688964844, -0.07520198822021484, -0.07233428955078125, -0.06946659088134766, -0.06659889221191406, -0.06373119354248047, -0.060863494873046875, -0.05799579620361328, -0.05512809753417969, -0.052260398864746094, -0.0493927001953125, -0.046525001525878906, -0.04365730285644531, -0.04078960418701172, -0.037921905517578125, -0.03505420684814453, -0.03218650817871094, -0.029318809509277344, -0.02645111083984375, -0.023583412170410156, -0.020715713500976562, -0.01784801483154297, -0.014980316162109375, -0.012112617492675781, -0.009244918823242188, -0.006377220153808594, -0.003509521484375, -0.0006418228149414062, 0.0022258758544921875, 0.005093574523925781, 0.007961273193359375, 0.010828971862792969, 0.013696670532226562, 0.016564369201660156, 0.01943206787109375, 0.022299766540527344, 0.025167465209960938, 0.02803516387939453, 0.030902862548828125, 0.03377056121826172, 0.03663825988769531, 0.039505958557128906, 0.0423736572265625, 0.045241355895996094, 0.04810905456542969, 0.05097675323486328, 0.053844451904296875, 0.05671215057373047, 0.05957984924316406, 0.062447547912597656, 0.06531524658203125, 0.06818294525146484, 0.07105064392089844, 0.07391834259033203, 0.07678604125976562, 0.07965373992919922, 0.08252143859863281, 0.0853891372680664, 0.0882568359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 3.0, 10.0, 2.0, 6.0, 13.0, 14.0, 21.0, 30.0, 44.0, 48.0, 80.0, 104.0, 134.0, 130.0, 112.0, 60.0, 48.0, 31.0, 34.0, 21.0, 13.0, 8.0, 9.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4226646423339844e-05, -4.263874143362045e-05, -4.105083644390106e-05, -3.946293145418167e-05, -3.787502646446228e-05, -3.628712147474289e-05, -3.46992164850235e-05, -3.311131149530411e-05, -3.152340650558472e-05, -2.9935501515865326e-05, -2.8347596526145935e-05, -2.6759691536426544e-05, -2.5171786546707153e-05, -2.3583881556987762e-05, -2.199597656726837e-05, -2.040807157754898e-05, -1.882016658782959e-05, -1.72322615981102e-05, -1.5644356608390808e-05, -1.4056451618671417e-05, -1.2468546628952026e-05, -1.0880641639232635e-05, -9.292736649513245e-06, -7.704831659793854e-06, -6.116926670074463e-06, -4.529021680355072e-06, -2.941116690635681e-06, -1.3532117009162903e-06, 2.3469328880310059e-07, 1.8225982785224915e-06, 3.4105032682418823e-06, 4.998408257961273e-06, 6.586313247680664e-06, 8.174218237400055e-06, 9.762123227119446e-06, 1.1350028216838837e-05, 1.2937933206558228e-05, 1.4525838196277618e-05, 1.611374318599701e-05, 1.77016481757164e-05, 1.928955316543579e-05, 2.0877458155155182e-05, 2.2465363144874573e-05, 2.4053268134593964e-05, 2.5641173124313354e-05, 2.7229078114032745e-05, 2.8816983103752136e-05, 3.0404888093471527e-05, 3.199279308319092e-05, 3.358069807291031e-05, 3.51686030626297e-05, 3.675650805234909e-05, 3.834441304206848e-05, 3.993231803178787e-05, 4.152022302150726e-05, 4.3108128011226654e-05, 4.4696033000946045e-05, 4.6283937990665436e-05, 4.787184298038483e-05, 4.945974797010422e-05, 5.104765295982361e-05, 5.2635557949543e-05, 5.422346293926239e-05, 5.581136792898178e-05, 5.739927291870117e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 14.0, 22.0, 33.0, 35.0, 61.0, 72.0, 135.0, 218.0, 332.0, 646.0, 1061.0, 1896.0, 3699.0, 7339.0, 14635.0, 31144.0, 71484.0, 170820.0, 297454.0, 243396.0, 113398.0, 47829.0, 21281.0, 10407.0, 5236.0, 2550.0, 1365.0, 750.0, 456.0, 264.0, 165.0, 106.0, 82.0, 40.0, 35.0, 25.0, 14.0, 8.0, 11.0, 5.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0997314453125, -0.09677696228027344, -0.09382247924804688, -0.09086799621582031, -0.08791351318359375, -0.08495903015136719, -0.08200454711914062, -0.07905006408691406, -0.0760955810546875, -0.07314109802246094, -0.07018661499023438, -0.06723213195800781, -0.06427764892578125, -0.06132316589355469, -0.058368682861328125, -0.05541419982910156, -0.052459716796875, -0.04950523376464844, -0.046550750732421875, -0.04359626770019531, -0.04064178466796875, -0.03768730163574219, -0.034732818603515625, -0.03177833557128906, -0.0288238525390625, -0.025869369506835938, -0.022914886474609375, -0.019960403442382812, -0.01700592041015625, -0.014051437377929688, -0.011096954345703125, -0.008142471313476562, -0.00518798828125, -0.0022335052490234375, 0.000720977783203125, 0.0036754608154296875, 0.00662994384765625, 0.009584426879882812, 0.012538909912109375, 0.015493392944335938, 0.0184478759765625, 0.021402359008789062, 0.024356842041015625, 0.027311325073242188, 0.03026580810546875, 0.03322029113769531, 0.036174774169921875, 0.03912925720214844, 0.042083740234375, 0.04503822326660156, 0.047992706298828125, 0.05094718933105469, 0.05390167236328125, 0.05685615539550781, 0.059810638427734375, 0.06276512145996094, 0.0657196044921875, 0.06867408752441406, 0.07162857055664062, 0.07458305358886719, 0.07753753662109375, 0.08049201965332031, 0.08344650268554688, 0.08640098571777344, 0.08935546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 4.0, 4.0, 7.0, 7.0, 9.0, 9.0, 8.0, 19.0, 8.0, 17.0, 18.0, 34.0, 34.0, 34.0, 51.0, 39.0, 59.0, 59.0, 72.0, 70.0, 57.0, 63.0, 56.0, 50.0, 28.0, 36.0, 18.0, 20.0, 19.0, 19.0, 13.0, 10.0, 5.0, 11.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.109375, -0.10583019256591797, -0.10228538513183594, -0.0987405776977539, -0.09519577026367188, -0.09165096282958984, -0.08810615539550781, -0.08456134796142578, -0.08101654052734375, -0.07747173309326172, -0.07392692565917969, -0.07038211822509766, -0.06683731079101562, -0.0632925033569336, -0.05974769592285156, -0.05620288848876953, -0.0526580810546875, -0.04911327362060547, -0.04556846618652344, -0.042023658752441406, -0.038478851318359375, -0.034934043884277344, -0.03138923645019531, -0.02784442901611328, -0.02429962158203125, -0.02075481414794922, -0.017210006713867188, -0.013665199279785156, -0.010120391845703125, -0.006575584411621094, -0.0030307769775390625, 0.0005140304565429688, 0.004058837890625, 0.007603645324707031, 0.011148452758789062, 0.014693260192871094, 0.018238067626953125, 0.021782875061035156, 0.025327682495117188, 0.02887248992919922, 0.03241729736328125, 0.03596210479736328, 0.03950691223144531, 0.043051719665527344, 0.046596527099609375, 0.050141334533691406, 0.05368614196777344, 0.05723094940185547, 0.0607757568359375, 0.06432056427001953, 0.06786537170410156, 0.0714101791381836, 0.07495498657226562, 0.07849979400634766, 0.08204460144042969, 0.08558940887451172, 0.08913421630859375, 0.09267902374267578, 0.09622383117675781, 0.09976863861083984, 0.10331344604492188, 0.1068582534790039, 0.11040306091308594, 0.11394786834716797, 0.11749267578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 29.0, 48.0, 122.0, 220.0, 261.0, 170.0, 78.0, 32.0, 13.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.883645534515381, -4.770914554595947, -4.658183574676514, -4.54545259475708, -4.4327216148376465, -4.319990634918213, -4.207259654998779, -4.094528675079346, -3.981797695159912, -3.8690667152404785, -3.756335735321045, -3.6436047554016113, -3.5308737754821777, -3.418142795562744, -3.3054118156433105, -3.192680835723877, -3.0799498558044434, -2.9672188758850098, -2.854487895965576, -2.7417569160461426, -2.629025936126709, -2.5162949562072754, -2.403563976287842, -2.290832996368408, -2.1781020164489746, -2.065371036529541, -1.9526400566101074, -1.8399090766906738, -1.7271780967712402, -1.6144471168518066, -1.501716136932373, -1.3889851570129395, -1.2762541770935059, -1.1635231971740723, -1.0507922172546387, -0.9380612373352051, -0.8253302574157715, -0.7125992774963379, -0.5998682975769043, -0.4871373176574707, -0.3744063377380371, -0.2616753578186035, -0.14894437789916992, -0.03621339797973633, 0.07651758193969727, 0.18924856185913086, 0.30197954177856445, 0.41471052169799805, 0.5274415016174316, 0.6401724815368652, 0.7529034614562988, 0.8656344413757324, 0.978365421295166, 1.0910964012145996, 1.2038273811340332, 1.3165583610534668, 1.4292893409729004, 1.542020320892334, 1.6547513008117676, 1.7674822807312012, 1.8802132606506348, 1.9929442405700684, 2.105675220489502, 2.2184062004089355, 2.331137180328369]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 10.0, 10.0, 9.0, 17.0, 16.0, 20.0, 27.0, 22.0, 36.0, 39.0, 29.0, 44.0, 34.0, 60.0, 43.0, 35.0, 29.0, 34.0, 39.0, 40.0, 40.0, 32.0, 44.0, 34.0, 32.0, 36.0, 26.0, 12.0, 20.0, 27.0, 21.0, 16.0, 10.0, 11.0, 11.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.416494607925415, -1.370276927947998, -1.3240591287612915, -1.2778414487838745, -1.231623649597168, -1.185405969619751, -1.139188289642334, -1.0929704904556274, -1.046752691268921, -1.000535011291504, -0.9543172121047974, -0.9080995321273804, -0.8618817329406738, -0.8156640529632568, -0.7694463133811951, -0.7232285737991333, -0.6770108938217163, -0.6307931542396545, -0.5845754146575928, -0.5383577346801758, -0.4921399652957916, -0.44592222571372986, -0.3997045159339905, -0.3534867763519287, -0.30726903676986694, -0.2610512971878052, -0.2148335725069046, -0.16861584782600403, -0.12239810824394226, -0.0761803686618805, -0.029962658882141113, 0.016255080699920654, 0.06247282028198242, 0.10869055241346359, 0.15490828454494476, 0.20112600922584534, 0.2473437488079071, 0.29356148838996887, 0.33977919816970825, 0.38599693775177, 0.4322146773338318, 0.47843241691589355, 0.5246501564979553, 0.5708678960800171, 0.6170855760574341, 0.6633033752441406, 0.7095210552215576, 0.7557387948036194, 0.8019565343856812, 0.8481742739677429, 0.8943920135498047, 0.9406096935272217, 0.9868274927139282, 1.0330451726913452, 1.0792629718780518, 1.1254806518554688, 1.1716983318328857, 1.2179160118103027, 1.2641338109970093, 1.3103514909744263, 1.3565692901611328, 1.4027869701385498, 1.4490046501159668, 1.4952224493026733, 1.5414402484893799]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 14.0, 16.0, 21.0, 39.0, 62.0, 76.0, 124.0, 193.0, 294.0, 450.0, 697.0, 1156.0, 2119.0, 3982.0, 8603.0, 20301.0, 52481.0, 140216.0, 354013.0, 721381.0, 1047183.0, 923575.0, 531214.0, 237594.0, 90102.0, 33160.0, 12804.0, 5482.0, 2843.0, 1570.0, 900.0, 544.0, 357.0, 229.0, 165.0, 93.0, 79.0, 48.0, 35.0, 26.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1375732421875, -0.1324329376220703, -0.12729263305664062, -0.12215232849121094, -0.11701202392578125, -0.11187171936035156, -0.10673141479492188, -0.10159111022949219, -0.0964508056640625, -0.09131050109863281, -0.08617019653320312, -0.08102989196777344, -0.07588958740234375, -0.07074928283691406, -0.06560897827148438, -0.06046867370605469, -0.055328369140625, -0.05018806457519531, -0.045047760009765625, -0.03990745544433594, -0.03476715087890625, -0.029626846313476562, -0.024486541748046875, -0.019346237182617188, -0.0142059326171875, -0.009065628051757812, -0.003925323486328125, 0.0012149810791015625, 0.00635528564453125, 0.011495590209960938, 0.016635894775390625, 0.021776199340820312, 0.02691650390625, 0.03205680847167969, 0.037197113037109375, 0.04233741760253906, 0.04747772216796875, 0.05261802673339844, 0.057758331298828125, 0.06289863586425781, 0.0680389404296875, 0.07317924499511719, 0.07831954956054688, 0.08345985412597656, 0.08860015869140625, 0.09374046325683594, 0.09888076782226562, 0.10402107238769531, 0.109161376953125, 0.11430168151855469, 0.11944198608398438, 0.12458229064941406, 0.12972259521484375, 0.13486289978027344, 0.14000320434570312, 0.1451435089111328, 0.1502838134765625, 0.1554241180419922, 0.16056442260742188, 0.16570472717285156, 0.17084503173828125, 0.17598533630371094, 0.18112564086914062, 0.1862659454345703, 0.19140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 6.0, 14.0, 12.0, 22.0, 17.0, 22.0, 18.0, 17.0, 25.0, 34.0, 30.0, 26.0, 41.0, 38.0, 37.0, 39.0, 48.0, 39.0, 41.0, 24.0, 45.0, 37.0, 38.0, 26.0, 40.0, 30.0, 31.0, 28.0, 28.0, 20.0, 24.0, 17.0, 11.0, 15.0, 8.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2034912109375, -0.19691848754882812, -0.19034576416015625, -0.18377304077148438, -0.1772003173828125, -0.17062759399414062, -0.16405487060546875, -0.15748214721679688, -0.150909423828125, -0.14433670043945312, -0.13776397705078125, -0.13119125366210938, -0.1246185302734375, -0.11804580688476562, -0.11147308349609375, -0.10490036010742188, -0.09832763671875, -0.09175491333007812, -0.08518218994140625, -0.07860946655273438, -0.0720367431640625, -0.06546401977539062, -0.05889129638671875, -0.052318572998046875, -0.045745849609375, -0.039173126220703125, -0.03260040283203125, -0.026027679443359375, -0.0194549560546875, -0.012882232666015625, -0.00630950927734375, 0.000263214111328125, 0.0068359375, 0.013408660888671875, 0.01998138427734375, 0.026554107666015625, 0.0331268310546875, 0.039699554443359375, 0.04627227783203125, 0.052845001220703125, 0.059417724609375, 0.06599044799804688, 0.07256317138671875, 0.07913589477539062, 0.0857086181640625, 0.09228134155273438, 0.09885406494140625, 0.10542678833007812, 0.11199951171875, 0.11857223510742188, 0.12514495849609375, 0.13171768188476562, 0.1382904052734375, 0.14486312866210938, 0.15143585205078125, 0.15800857543945312, 0.164581298828125, 0.17115402221679688, 0.17772674560546875, 0.18429946899414062, 0.1908721923828125, 0.19744491577148438, 0.20401763916015625, 0.21059036254882812, 0.2171630859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 9.0, 16.0, 16.0, 28.0, 43.0, 77.0, 94.0, 197.0, 341.0, 644.0, 1308.0, 2749.0, 6763.0, 17612.0, 52610.0, 185559.0, 911035.0, 2208979.0, 607516.0, 134652.0, 40028.0, 13833.0, 5459.0, 2305.0, 1105.0, 555.0, 282.0, 169.0, 110.0, 74.0, 30.0, 28.0, 15.0, 13.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30078125, -0.29177093505859375, -0.2827606201171875, -0.27375030517578125, -0.264739990234375, -0.25572967529296875, -0.2467193603515625, -0.23770904541015625, -0.22869873046875, -0.21968841552734375, -0.2106781005859375, -0.20166778564453125, -0.192657470703125, -0.18364715576171875, -0.1746368408203125, -0.16562652587890625, -0.1566162109375, -0.14760589599609375, -0.1385955810546875, -0.12958526611328125, -0.120574951171875, -0.11156463623046875, -0.1025543212890625, -0.09354400634765625, -0.08453369140625, -0.07552337646484375, -0.0665130615234375, -0.05750274658203125, -0.048492431640625, -0.03948211669921875, -0.0304718017578125, -0.02146148681640625, -0.012451171875, -0.00344085693359375, 0.0055694580078125, 0.01457977294921875, 0.023590087890625, 0.03260040283203125, 0.0416107177734375, 0.05062103271484375, 0.05963134765625, 0.06864166259765625, 0.0776519775390625, 0.08666229248046875, 0.095672607421875, 0.10468292236328125, 0.1136932373046875, 0.12270355224609375, 0.1317138671875, 0.14072418212890625, 0.1497344970703125, 0.15874481201171875, 0.167755126953125, 0.17676544189453125, 0.1857757568359375, 0.19478607177734375, 0.20379638671875, 0.21280670166015625, 0.2218170166015625, 0.23082733154296875, 0.239837646484375, 0.24884796142578125, 0.2578582763671875, 0.26686859130859375, 0.27587890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 10.0, 14.0, 11.0, 13.0, 30.0, 33.0, 50.0, 65.0, 80.0, 84.0, 125.0, 190.0, 215.0, 327.0, 374.0, 446.0, 406.0, 398.0, 281.0, 218.0, 158.0, 106.0, 87.0, 68.0, 43.0, 60.0, 34.0, 27.0, 20.0, 17.0, 12.0, 10.0, 14.0, 1.0, 4.0, 11.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.313232421875, -0.30426788330078125, -0.2953033447265625, -0.28633880615234375, -0.277374267578125, -0.26840972900390625, -0.2594451904296875, -0.25048065185546875, -0.24151611328125, -0.23255157470703125, -0.2235870361328125, -0.21462249755859375, -0.205657958984375, -0.19669342041015625, -0.1877288818359375, -0.17876434326171875, -0.1697998046875, -0.16083526611328125, -0.1518707275390625, -0.14290618896484375, -0.133941650390625, -0.12497711181640625, -0.1160125732421875, -0.10704803466796875, -0.09808349609375, -0.08911895751953125, -0.0801544189453125, -0.07118988037109375, -0.062225341796875, -0.05326080322265625, -0.0442962646484375, -0.03533172607421875, -0.0263671875, -0.01740264892578125, -0.0084381103515625, 0.00052642822265625, 0.009490966796875, 0.01845550537109375, 0.0274200439453125, 0.03638458251953125, 0.04534912109375, 0.05431365966796875, 0.0632781982421875, 0.07224273681640625, 0.081207275390625, 0.09017181396484375, 0.0991363525390625, 0.10810089111328125, 0.1170654296875, 0.12602996826171875, 0.1349945068359375, 0.14395904541015625, 0.152923583984375, 0.16188812255859375, 0.1708526611328125, 0.17981719970703125, 0.18878173828125, 0.19774627685546875, 0.2067108154296875, 0.21567535400390625, 0.224639892578125, 0.23360443115234375, 0.2425689697265625, 0.25153350830078125, 0.260498046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 26.0, 32.0, 68.0, 111.0, 163.0, 221.0, 162.0, 112.0, 52.0, 25.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4291911125183105, -3.3318543434143066, -3.2345175743103027, -3.137181043624878, -3.039844274520874, -2.94250750541687, -2.845170736312866, -2.7478342056274414, -2.6504974365234375, -2.5531606674194336, -2.4558238983154297, -2.358487367630005, -2.261150598526001, -2.163813829421997, -2.066477060317993, -1.9691404104232788, -1.871803641319275, -1.774466872215271, -1.6771302223205566, -1.5797934532165527, -1.4824568033218384, -1.3851200342178345, -1.2877833843231201, -1.1904466152191162, -1.0931098461151123, -0.9957731366157532, -0.898436427116394, -0.8010996580123901, -0.7037630081176758, -0.6064262390136719, -0.5090895295143127, -0.4117528200149536, -0.31441617012023926, -0.21707946062088013, -0.1197427362203598, -0.022406011819839478, 0.07493069767951965, 0.17226740717887878, 0.2696041464805603, 0.36694085597991943, 0.46427756547927856, 0.5616142749786377, 0.6589509844779968, 0.756287693977356, 0.8536244630813599, 0.9509611129760742, 1.0482978820800781, 1.145634651184082, 1.2429713010787964, 1.3403080701828003, 1.4376447200775146, 1.5349814891815186, 1.632318139076233, 1.7296549081802368, 1.8269915580749512, 1.924328327178955, 2.021665096282959, 2.119001865386963, 2.216338634490967, 2.3136751651763916, 2.4110119342803955, 2.5083487033843994, 2.6056854724884033, 2.703022003173828, 2.800358772277832]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 2.0, 6.0, 5.0, 13.0, 17.0, 14.0, 13.0, 8.0, 14.0, 32.0, 20.0, 30.0, 26.0, 31.0, 36.0, 44.0, 39.0, 44.0, 40.0, 35.0, 44.0, 54.0, 37.0, 49.0, 38.0, 37.0, 40.0, 35.0, 40.0, 25.0, 16.0, 18.0, 18.0, 17.0, 10.0, 18.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0969552993774414, -1.0629867315292358, -1.0290182828903198, -0.9950497150421143, -0.9610812067985535, -0.9271126985549927, -0.8931441903114319, -0.8591756820678711, -0.8252071142196655, -0.7912386059761047, -0.757270097732544, -0.7233015298843384, -0.6893330216407776, -0.6553645133972168, -0.621396005153656, -0.5874274969100952, -0.5534589886665344, -0.5194904804229736, -0.48552194237709045, -0.45155343413352966, -0.4175848960876465, -0.3836163878440857, -0.3496478796005249, -0.3156793713569641, -0.28171083331108093, -0.24774231016635895, -0.21377378702163696, -0.17980527877807617, -0.1458367556333542, -0.1118682324886322, -0.07789972424507141, -0.043931201100349426, -0.009962677955627441, 0.024005841463804245, 0.05797436088323593, 0.09194287657737732, 0.1259113997220993, 0.1598799228668213, 0.19384843111038208, 0.22781695425510406, 0.26178547739982605, 0.29575398564338684, 0.32972252368927, 0.3636910319328308, 0.3976595401763916, 0.4316280782222748, 0.46559658646583557, 0.49956512451171875, 0.5335336327552795, 0.5675021409988403, 0.6014706492424011, 0.6354391574859619, 0.6694077253341675, 0.7033762335777283, 0.7373447418212891, 0.7713132500648499, 0.8052817583084106, 0.8392502665519714, 0.8732187747955322, 0.9071873426437378, 0.9411558508872986, 0.9751243591308594, 1.0090928077697754, 1.043061375617981, 1.0770299434661865]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 6.0, 9.0, 7.0, 25.0, 32.0, 40.0, 63.0, 102.0, 161.0, 248.0, 388.0, 658.0, 1133.0, 2236.0, 4204.0, 9317.0, 22166.0, 59918.0, 179981.0, 369623.0, 254519.0, 88465.0, 30932.0, 12526.0, 5542.0, 2834.0, 1423.0, 780.0, 456.0, 265.0, 134.0, 118.0, 74.0, 47.0, 35.0, 28.0, 13.0, 12.0, 12.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2637519836425781, -0.25455474853515625, -0.24535751342773438, -0.2361602783203125, -0.22696304321289062, -0.21776580810546875, -0.20856857299804688, -0.199371337890625, -0.19017410278320312, -0.18097686767578125, -0.17177963256835938, -0.1625823974609375, -0.15338516235351562, -0.14418792724609375, -0.13499069213867188, -0.12579345703125, -0.11659622192382812, -0.10739898681640625, -0.09820175170898438, -0.0890045166015625, -0.07980728149414062, -0.07061004638671875, -0.061412811279296875, -0.052215576171875, -0.043018341064453125, -0.03382110595703125, -0.024623870849609375, -0.0154266357421875, -0.006229400634765625, 0.00296783447265625, 0.012165069580078125, 0.0213623046875, 0.030559539794921875, 0.03975677490234375, 0.048954010009765625, 0.0581512451171875, 0.06734848022460938, 0.07654571533203125, 0.08574295043945312, 0.094940185546875, 0.10413742065429688, 0.11333465576171875, 0.12253189086914062, 0.1317291259765625, 0.14092636108398438, 0.15012359619140625, 0.15932083129882812, 0.16851806640625, 0.17771530151367188, 0.18691253662109375, 0.19610977172851562, 0.2053070068359375, 0.21450424194335938, 0.22370147705078125, 0.23289871215820312, 0.242095947265625, 0.2512931823730469, 0.26049041748046875, 0.2696876525878906, 0.2788848876953125, 0.2880821228027344, 0.29727935791015625, 0.3064765930175781, 0.315673828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 7.0, 15.0, 18.0, 19.0, 18.0, 24.0, 41.0, 32.0, 24.0, 27.0, 38.0, 47.0, 46.0, 50.0, 42.0, 37.0, 45.0, 32.0, 34.0, 36.0, 43.0, 31.0, 21.0, 36.0, 34.0, 32.0, 10.0, 9.0, 20.0, 10.0, 13.0, 16.0, 10.0, 5.0, 9.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.2210693359375, -0.21441650390625, -0.207763671875, -0.20111083984375, -0.1944580078125, -0.18780517578125, -0.18115234375, -0.17449951171875, -0.1678466796875, -0.16119384765625, -0.154541015625, -0.14788818359375, -0.1412353515625, -0.13458251953125, -0.1279296875, -0.12127685546875, -0.1146240234375, -0.10797119140625, -0.101318359375, -0.09466552734375, -0.0880126953125, -0.08135986328125, -0.07470703125, -0.06805419921875, -0.0614013671875, -0.05474853515625, -0.048095703125, -0.04144287109375, -0.0347900390625, -0.02813720703125, -0.021484375, -0.01483154296875, -0.0081787109375, -0.00152587890625, 0.005126953125, 0.01177978515625, 0.0184326171875, 0.02508544921875, 0.03173828125, 0.03839111328125, 0.0450439453125, 0.05169677734375, 0.058349609375, 0.06500244140625, 0.0716552734375, 0.07830810546875, 0.0849609375, 0.09161376953125, 0.0982666015625, 0.10491943359375, 0.111572265625, 0.11822509765625, 0.1248779296875, 0.13153076171875, 0.13818359375, 0.14483642578125, 0.1514892578125, 0.15814208984375, 0.164794921875, 0.17144775390625, 0.1781005859375, 0.18475341796875, 0.19140625, 0.19805908203125, 0.2047119140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 10.0, 19.0, 22.0, 28.0, 45.0, 64.0, 89.0, 145.0, 271.0, 422.0, 829.0, 1520.0, 3323.0, 6742.0, 13872.0, 30673.0, 76116.0, 206391.0, 359924.0, 210808.0, 77932.0, 31384.0, 14107.0, 6947.0, 3229.0, 1659.0, 824.0, 451.0, 235.0, 166.0, 91.0, 59.0, 40.0, 23.0, 21.0, 16.0, 7.0, 13.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.32373046875, -0.3143501281738281, -0.30496978759765625, -0.2955894470214844, -0.2862091064453125, -0.2768287658691406, -0.26744842529296875, -0.2580680847167969, -0.248687744140625, -0.23930740356445312, -0.22992706298828125, -0.22054672241210938, -0.2111663818359375, -0.20178604125976562, -0.19240570068359375, -0.18302536010742188, -0.17364501953125, -0.16426467895507812, -0.15488433837890625, -0.14550399780273438, -0.1361236572265625, -0.12674331665039062, -0.11736297607421875, -0.10798263549804688, -0.098602294921875, -0.08922195434570312, -0.07984161376953125, -0.07046127319335938, -0.0610809326171875, -0.051700592041015625, -0.04232025146484375, -0.032939910888671875, -0.0235595703125, -0.014179229736328125, -0.00479888916015625, 0.004581451416015625, 0.0139617919921875, 0.023342132568359375, 0.03272247314453125, 0.042102813720703125, 0.051483154296875, 0.060863494873046875, 0.07024383544921875, 0.07962417602539062, 0.0890045166015625, 0.09838485717773438, 0.10776519775390625, 0.11714553833007812, 0.12652587890625, 0.13590621948242188, 0.14528656005859375, 0.15466690063476562, 0.1640472412109375, 0.17342758178710938, 0.18280792236328125, 0.19218826293945312, 0.201568603515625, 0.21094894409179688, 0.22032928466796875, 0.22970962524414062, 0.2390899658203125, 0.24847030639648438, 0.25785064697265625, 0.2672309875488281, 0.276611328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 10.0, 5.0, 8.0, 12.0, 13.0, 11.0, 15.0, 22.0, 24.0, 27.0, 35.0, 38.0, 30.0, 41.0, 39.0, 48.0, 55.0, 50.0, 42.0, 38.0, 28.0, 55.0, 38.0, 37.0, 35.0, 34.0, 37.0, 30.0, 25.0, 22.0, 21.0, 16.0, 12.0, 13.0, 3.0, 11.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.666015625, -0.6449050903320312, -0.6237945556640625, -0.6026840209960938, -0.581573486328125, -0.5604629516601562, -0.5393524169921875, -0.5182418823242188, -0.49713134765625, -0.47602081298828125, -0.4549102783203125, -0.43379974365234375, -0.412689208984375, -0.39157867431640625, -0.3704681396484375, -0.34935760498046875, -0.3282470703125, -0.30713653564453125, -0.2860260009765625, -0.26491546630859375, -0.243804931640625, -0.22269439697265625, -0.2015838623046875, -0.18047332763671875, -0.15936279296875, -0.13825225830078125, -0.1171417236328125, -0.09603118896484375, -0.074920654296875, -0.05381011962890625, -0.0326995849609375, -0.01158905029296875, 0.009521484375, 0.03063201904296875, 0.0517425537109375, 0.07285308837890625, 0.093963623046875, 0.11507415771484375, 0.1361846923828125, 0.15729522705078125, 0.17840576171875, 0.19951629638671875, 0.2206268310546875, 0.24173736572265625, 0.262847900390625, 0.28395843505859375, 0.3050689697265625, 0.32617950439453125, 0.3472900390625, 0.36840057373046875, 0.3895111083984375, 0.41062164306640625, 0.431732177734375, 0.45284271240234375, 0.4739532470703125, 0.49506378173828125, 0.51617431640625, 0.5372848510742188, 0.5583953857421875, 0.5795059204101562, 0.600616455078125, 0.6217269897460938, 0.6428375244140625, 0.6639480590820312, 0.68505859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 5.0, 10.0, 8.0, 14.0, 21.0, 23.0, 26.0, 51.0, 80.0, 124.0, 168.0, 254.0, 376.0, 574.0, 858.0, 1374.0, 2024.0, 3392.0, 5518.0, 9510.0, 16804.0, 30969.0, 60671.0, 121043.0, 214780.0, 244104.0, 160628.0, 82313.0, 40962.0, 21404.0, 11934.0, 6983.0, 4191.0, 2531.0, 1629.0, 1090.0, 679.0, 491.0, 313.0, 205.0, 142.0, 84.0, 52.0, 45.0, 29.0, 12.0, 15.0, 11.0, 10.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.060760498046875, -0.05893135070800781, -0.057102203369140625, -0.05527305603027344, -0.05344390869140625, -0.05161476135253906, -0.049785614013671875, -0.04795646667480469, -0.0461273193359375, -0.04429817199707031, -0.042469024658203125, -0.04063987731933594, -0.03881072998046875, -0.03698158264160156, -0.035152435302734375, -0.03332328796386719, -0.031494140625, -0.029664993286132812, -0.027835845947265625, -0.026006698608398438, -0.02417755126953125, -0.022348403930664062, -0.020519256591796875, -0.018690109252929688, -0.0168609619140625, -0.015031814575195312, -0.013202667236328125, -0.011373519897460938, -0.00954437255859375, -0.0077152252197265625, -0.005886077880859375, -0.0040569305419921875, -0.002227783203125, -0.0003986358642578125, 0.001430511474609375, 0.0032596588134765625, 0.00508880615234375, 0.0069179534912109375, 0.008747100830078125, 0.010576248168945312, 0.0124053955078125, 0.014234542846679688, 0.016063690185546875, 0.017892837524414062, 0.01972198486328125, 0.021551132202148438, 0.023380279541015625, 0.025209426879882812, 0.02703857421875, 0.028867721557617188, 0.030696868896484375, 0.03252601623535156, 0.03435516357421875, 0.03618431091308594, 0.038013458251953125, 0.03984260559082031, 0.0416717529296875, 0.04350090026855469, 0.045330047607421875, 0.04715919494628906, 0.04898834228515625, 0.05081748962402344, 0.052646636962890625, 0.05447578430175781, 0.056304931640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 11.0, 14.0, 19.0, 26.0, 35.0, 52.0, 87.0, 129.0, 142.0, 127.0, 114.0, 79.0, 55.0, 31.0, 27.0, 17.0, 5.0, 5.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.264448165893555e-05, -6.103143095970154e-05, -5.941838026046753e-05, -5.780532956123352e-05, -5.619227886199951e-05, -5.45792281627655e-05, -5.2966177463531494e-05, -5.1353126764297485e-05, -4.9740076065063477e-05, -4.812702536582947e-05, -4.651397466659546e-05, -4.490092396736145e-05, -4.328787326812744e-05, -4.167482256889343e-05, -4.0061771869659424e-05, -3.8448721170425415e-05, -3.6835670471191406e-05, -3.52226197719574e-05, -3.360956907272339e-05, -3.199651837348938e-05, -3.038346767425537e-05, -2.8770416975021362e-05, -2.7157366275787354e-05, -2.5544315576553345e-05, -2.3931264877319336e-05, -2.2318214178085327e-05, -2.070516347885132e-05, -1.909211277961731e-05, -1.74790620803833e-05, -1.5866011381149292e-05, -1.4252960681915283e-05, -1.2639909982681274e-05, -1.1026859283447266e-05, -9.413808584213257e-06, -7.800757884979248e-06, -6.187707185745239e-06, -4.5746564865112305e-06, -2.9616057872772217e-06, -1.3485550880432129e-06, 2.644956111907959e-07, 1.8775463104248047e-06, 3.4905970096588135e-06, 5.103647708892822e-06, 6.716698408126831e-06, 8.32974910736084e-06, 9.942799806594849e-06, 1.1555850505828857e-05, 1.3168901205062866e-05, 1.4781951904296875e-05, 1.6395002603530884e-05, 1.8008053302764893e-05, 1.96211040019989e-05, 2.123415470123291e-05, 2.284720540046692e-05, 2.4460256099700928e-05, 2.6073306798934937e-05, 2.7686357498168945e-05, 2.9299408197402954e-05, 3.091245889663696e-05, 3.252550959587097e-05, 3.413856029510498e-05, 3.575161099433899e-05, 3.7364661693573e-05, 3.897771239280701e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 10.0, 9.0, 13.0, 15.0, 21.0, 27.0, 41.0, 66.0, 83.0, 131.0, 254.0, 359.0, 648.0, 1023.0, 1712.0, 2999.0, 5037.0, 8780.0, 14936.0, 26734.0, 47369.0, 84858.0, 140924.0, 194033.0, 192005.0, 136902.0, 82509.0, 45738.0, 25870.0, 14635.0, 8480.0, 4876.0, 2956.0, 1733.0, 1107.0, 606.0, 342.0, 244.0, 164.0, 90.0, 61.0, 50.0, 31.0, 22.0, 17.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.047393798828125, -0.04586362838745117, -0.044333457946777344, -0.042803287506103516, -0.04127311706542969, -0.03974294662475586, -0.03821277618408203, -0.0366826057434082, -0.035152435302734375, -0.03362226486206055, -0.03209209442138672, -0.03056192398071289, -0.029031753540039062, -0.027501583099365234, -0.025971412658691406, -0.024441242218017578, -0.02291107177734375, -0.021380901336669922, -0.019850730895996094, -0.018320560455322266, -0.016790390014648438, -0.01526021957397461, -0.013730049133300781, -0.012199878692626953, -0.010669708251953125, -0.009139537811279297, -0.007609367370605469, -0.006079196929931641, -0.0045490264892578125, -0.0030188560485839844, -0.0014886856079101562, 4.1484832763671875e-05, 0.0015716552734375, 0.003101825714111328, 0.004631996154785156, 0.006162166595458984, 0.0076923370361328125, 0.00922250747680664, 0.010752677917480469, 0.012282848358154297, 0.013813018798828125, 0.015343189239501953, 0.01687335968017578, 0.01840353012084961, 0.019933700561523438, 0.021463871002197266, 0.022994041442871094, 0.024524211883544922, 0.02605438232421875, 0.027584552764892578, 0.029114723205566406, 0.030644893646240234, 0.03217506408691406, 0.03370523452758789, 0.03523540496826172, 0.03676557540893555, 0.038295745849609375, 0.0398259162902832, 0.04135608673095703, 0.04288625717163086, 0.04441642761230469, 0.045946598052978516, 0.047476768493652344, 0.04900693893432617, 0.050537109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 6.0, 9.0, 10.0, 16.0, 19.0, 22.0, 20.0, 34.0, 24.0, 42.0, 34.0, 47.0, 48.0, 43.0, 51.0, 60.0, 54.0, 61.0, 62.0, 44.0, 44.0, 42.0, 29.0, 27.0, 21.0, 9.0, 11.0, 10.0, 13.0, 15.0, 11.0, 11.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0673828125, -0.06515789031982422, -0.06293296813964844, -0.060708045959472656, -0.058483123779296875, -0.056258201599121094, -0.05403327941894531, -0.05180835723876953, -0.04958343505859375, -0.04735851287841797, -0.04513359069824219, -0.042908668518066406, -0.040683746337890625, -0.038458824157714844, -0.03623390197753906, -0.03400897979736328, -0.0317840576171875, -0.02955913543701172, -0.027334213256835938, -0.025109291076660156, -0.022884368896484375, -0.020659446716308594, -0.018434524536132812, -0.01620960235595703, -0.01398468017578125, -0.011759757995605469, -0.009534835815429688, -0.007309913635253906, -0.005084991455078125, -0.0028600692749023438, -0.0006351470947265625, 0.0015897750854492188, 0.003814697265625, 0.006039619445800781, 0.008264541625976562, 0.010489463806152344, 0.012714385986328125, 0.014939308166503906, 0.017164230346679688, 0.01938915252685547, 0.02161407470703125, 0.02383899688720703, 0.026063919067382812, 0.028288841247558594, 0.030513763427734375, 0.032738685607910156, 0.03496360778808594, 0.03718852996826172, 0.0394134521484375, 0.04163837432861328, 0.04386329650878906, 0.046088218688964844, 0.048313140869140625, 0.050538063049316406, 0.05276298522949219, 0.05498790740966797, 0.05721282958984375, 0.05943775177001953, 0.06166267395019531, 0.0638875961303711, 0.06611251831054688, 0.06833744049072266, 0.07056236267089844, 0.07278728485107422, 0.07501220703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 10.0, 20.0, 27.0, 56.0, 105.0, 158.0, 187.0, 175.0, 106.0, 74.0, 31.0, 15.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1016831398010254, -2.0277719497680664, -1.9538606405258179, -1.8799493312835693, -1.8060381412506104, -1.7321269512176514, -1.6582156419754028, -1.5843043327331543, -1.5103931427001953, -1.4364819526672363, -1.3625706434249878, -1.2886593341827393, -1.2147481441497803, -1.1408369541168213, -1.0669256448745728, -0.993014395236969, -0.9191031455993652, -0.8451918959617615, -0.7712806463241577, -0.697369396686554, -0.6234581470489502, -0.5495468974113464, -0.4756356477737427, -0.4017243981361389, -0.32781314849853516, -0.2539018988609314, -0.17999064922332764, -0.10607939958572388, -0.03216814994812012, 0.04174309968948364, 0.1156543493270874, 0.18956559896469116, 0.2634766101837158, 0.3373878598213196, 0.41129910945892334, 0.4852103590965271, 0.5591216087341309, 0.6330328583717346, 0.7069441080093384, 0.7808553576469421, 0.8547666072845459, 0.9286778569221497, 1.0025891065597534, 1.076500415802002, 1.150411605834961, 1.22432279586792, 1.2982341051101685, 1.372145414352417, 1.446056604385376, 1.519967794418335, 1.5938791036605835, 1.667790412902832, 1.741701602935791, 1.81561279296875, 1.8895241022109985, 1.963435411453247, 2.037346601486206, 2.111257791519165, 2.185169219970703, 2.259080410003662, 2.332991600036621, 2.40690279006958, 2.480813980102539, 2.554725408554077, 2.628636598587036]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 11.0, 9.0, 12.0, 17.0, 9.0, 16.0, 20.0, 13.0, 21.0, 24.0, 34.0, 31.0, 32.0, 36.0, 41.0, 39.0, 43.0, 37.0, 47.0, 42.0, 48.0, 43.0, 36.0, 52.0, 27.0, 37.0, 28.0, 24.0, 28.0, 16.0, 21.0, 17.0, 14.0, 15.0, 14.0, 8.0, 6.0, 9.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.324843168258667, -1.2820192575454712, -1.2391953468322754, -1.1963715553283691, -1.1535476446151733, -1.1107237339019775, -1.0678998231887817, -1.025075912475586, -0.9822520613670349, -0.9394281506538391, -0.8966042995452881, -0.8537803888320923, -0.8109564781188965, -0.7681326270103455, -0.7253087162971497, -0.6824848651885986, -0.6396609544754028, -0.596837043762207, -0.554013192653656, -0.5111892819404602, -0.4683654010295868, -0.4255415201187134, -0.3827176094055176, -0.33989372849464417, -0.29706984758377075, -0.25424596667289734, -0.21142207086086273, -0.16859817504882812, -0.1257742941379547, -0.0829504132270813, -0.0401265025138855, 0.002697378396987915, 0.04552114009857178, 0.08834502846002579, 0.1311689168214798, 0.1739928126335144, 0.21681669354438782, 0.25964057445526123, 0.30246448516845703, 0.34528836607933044, 0.38811224699020386, 0.43093612790107727, 0.4737600088119507, 0.5165839195251465, 0.5594078302383423, 0.6022316813468933, 0.6450555920600891, 0.6878794431686401, 0.7307033538818359, 0.7735272645950317, 0.8163511157035828, 0.8591750264167786, 0.9019988775253296, 0.9448227882385254, 0.9876466989517212, 1.030470609664917, 1.0732944011688232, 1.116118311882019, 1.1589422225952148, 1.201766014099121, 1.244589924812317, 1.2874138355255127, 1.3302377462387085, 1.3730616569519043, 1.4158855676651]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 7.0, 14.0, 24.0, 45.0, 52.0, 77.0, 109.0, 153.0, 213.0, 309.0, 442.0, 751.0, 1187.0, 2171.0, 4088.0, 9051.0, 23961.0, 76814.0, 268615.0, 818838.0, 1494199.0, 1000387.0, 343085.0, 96592.0, 29713.0, 11601.0, 5272.0, 2672.0, 1439.0, 849.0, 485.0, 347.0, 217.0, 142.0, 101.0, 79.0, 51.0, 35.0, 33.0, 12.0, 12.0, 16.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.20192527770996094, -0.19486618041992188, -0.1878070831298828, -0.18074798583984375, -0.1736888885498047, -0.16662979125976562, -0.15957069396972656, -0.1525115966796875, -0.14545249938964844, -0.13839340209960938, -0.1313343048095703, -0.12427520751953125, -0.11721611022949219, -0.11015701293945312, -0.10309791564941406, -0.096038818359375, -0.08897972106933594, -0.08192062377929688, -0.07486152648925781, -0.06780242919921875, -0.06074333190917969, -0.053684234619140625, -0.04662513732910156, -0.0395660400390625, -0.03250694274902344, -0.025447845458984375, -0.018388748168945312, -0.01132965087890625, -0.0042705535888671875, 0.002788543701171875, 0.009847640991210938, 0.01690673828125, 0.023965835571289062, 0.031024932861328125, 0.03808403015136719, 0.04514312744140625, 0.05220222473144531, 0.059261322021484375, 0.06632041931152344, 0.0733795166015625, 0.08043861389160156, 0.08749771118164062, 0.09455680847167969, 0.10161590576171875, 0.10867500305175781, 0.11573410034179688, 0.12279319763183594, 0.129852294921875, 0.13691139221191406, 0.14397048950195312, 0.1510295867919922, 0.15808868408203125, 0.1651477813720703, 0.17220687866210938, 0.17926597595214844, 0.1863250732421875, 0.19338417053222656, 0.20044326782226562, 0.2075023651123047, 0.21456146240234375, 0.2216205596923828, 0.22867965698242188, 0.23573875427246094, 0.2427978515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 11.0, 11.0, 11.0, 15.0, 20.0, 25.0, 36.0, 38.0, 35.0, 39.0, 52.0, 33.0, 43.0, 46.0, 56.0, 57.0, 51.0, 61.0, 53.0, 35.0, 47.0, 30.0, 23.0, 29.0, 27.0, 16.0, 15.0, 16.0, 9.0, 8.0, 15.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.274658203125, -0.2674236297607422, -0.2601890563964844, -0.25295448303222656, -0.24571990966796875, -0.23848533630371094, -0.23125076293945312, -0.2240161895751953, -0.2167816162109375, -0.2095470428466797, -0.20231246948242188, -0.19507789611816406, -0.18784332275390625, -0.18060874938964844, -0.17337417602539062, -0.1661396026611328, -0.158905029296875, -0.1516704559326172, -0.14443588256835938, -0.13720130920410156, -0.12996673583984375, -0.12273216247558594, -0.11549758911132812, -0.10826301574707031, -0.1010284423828125, -0.09379386901855469, -0.08655929565429688, -0.07932472229003906, -0.07209014892578125, -0.06485557556152344, -0.057621002197265625, -0.05038642883300781, -0.04315185546875, -0.03591728210449219, -0.028682708740234375, -0.021448135375976562, -0.01421356201171875, -0.0069789886474609375, 0.000255584716796875, 0.0074901580810546875, 0.0147247314453125, 0.021959304809570312, 0.029193878173828125, 0.03642845153808594, 0.04366302490234375, 0.05089759826660156, 0.058132171630859375, 0.06536674499511719, 0.072601318359375, 0.07983589172363281, 0.08707046508789062, 0.09430503845214844, 0.10153961181640625, 0.10877418518066406, 0.11600875854492188, 0.12324333190917969, 0.1304779052734375, 0.1377124786376953, 0.14494705200195312, 0.15218162536621094, 0.15941619873046875, 0.16665077209472656, 0.17388534545898438, 0.1811199188232422, 0.1883544921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 15.0, 20.0, 28.0, 44.0, 75.0, 93.0, 231.0, 380.0, 749.0, 1331.0, 2824.0, 7030.0, 18878.0, 64240.0, 316711.0, 2310612.0, 1241772.0, 166544.0, 40365.0, 12823.0, 5013.0, 2177.0, 1036.0, 541.0, 307.0, 169.0, 102.0, 58.0, 40.0, 16.0, 18.0, 6.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.365478515625, -0.3546714782714844, -0.34386444091796875, -0.3330574035644531, -0.3222503662109375, -0.3114433288574219, -0.30063629150390625, -0.2898292541503906, -0.279022216796875, -0.2682151794433594, -0.25740814208984375, -0.24660110473632812, -0.2357940673828125, -0.22498703002929688, -0.21417999267578125, -0.20337295532226562, -0.19256591796875, -0.18175888061523438, -0.17095184326171875, -0.16014480590820312, -0.1493377685546875, -0.13853073120117188, -0.12772369384765625, -0.11691665649414062, -0.106109619140625, -0.09530258178710938, -0.08449554443359375, -0.07368850708007812, -0.0628814697265625, -0.052074432373046875, -0.04126739501953125, -0.030460357666015625, -0.0196533203125, -0.008846282958984375, 0.00196075439453125, 0.012767791748046875, 0.0235748291015625, 0.034381866455078125, 0.04518890380859375, 0.055995941162109375, 0.066802978515625, 0.07761001586914062, 0.08841705322265625, 0.09922409057617188, 0.1100311279296875, 0.12083816528320312, 0.13164520263671875, 0.14245223999023438, 0.15325927734375, 0.16406631469726562, 0.17487335205078125, 0.18568038940429688, 0.1964874267578125, 0.20729446411132812, 0.21810150146484375, 0.22890853881835938, 0.239715576171875, 0.2505226135253906, 0.26132965087890625, 0.2721366882324219, 0.2829437255859375, 0.2937507629394531, 0.30455780029296875, 0.3153648376464844, 0.326171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 6.0, 15.0, 13.0, 9.0, 23.0, 29.0, 50.0, 58.0, 96.0, 135.0, 220.0, 385.0, 581.0, 764.0, 624.0, 389.0, 230.0, 161.0, 99.0, 58.0, 35.0, 25.0, 20.0, 17.0, 11.0, 6.0, 3.0, 2.0, 0.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3698577880859375, -0.355926513671875, -0.3419952392578125, -0.32806396484375, -0.3141326904296875, -0.300201416015625, -0.2862701416015625, -0.2723388671875, -0.2584075927734375, -0.244476318359375, -0.2305450439453125, -0.21661376953125, -0.2026824951171875, -0.188751220703125, -0.1748199462890625, -0.160888671875, -0.1469573974609375, -0.133026123046875, -0.1190948486328125, -0.10516357421875, -0.0912322998046875, -0.077301025390625, -0.0633697509765625, -0.0494384765625, -0.0355072021484375, -0.021575927734375, -0.0076446533203125, 0.00628662109375, 0.0202178955078125, 0.034149169921875, 0.0480804443359375, 0.06201171875, 0.0759429931640625, 0.089874267578125, 0.1038055419921875, 0.11773681640625, 0.1316680908203125, 0.145599365234375, 0.1595306396484375, 0.1734619140625, 0.1873931884765625, 0.201324462890625, 0.2152557373046875, 0.22918701171875, 0.2431182861328125, 0.257049560546875, 0.2709808349609375, 0.284912109375, 0.2988433837890625, 0.312774658203125, 0.3267059326171875, 0.34063720703125, 0.3545684814453125, 0.368499755859375, 0.3824310302734375, 0.3963623046875, 0.4102935791015625, 0.424224853515625, 0.4381561279296875, 0.45208740234375, 0.4660186767578125, 0.479949951171875, 0.4938812255859375, 0.5078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 11.0, 35.0, 78.0, 139.0, 202.0, 215.0, 155.0, 84.0, 31.0, 15.0, 14.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4793975353240967, -3.3675782680511475, -3.2557590007781982, -3.143939971923828, -3.032120704650879, -2.9203014373779297, -2.8084821701049805, -2.6966629028320312, -2.584843635559082, -2.473024368286133, -2.3612051010131836, -2.2493858337402344, -2.1375668048858643, -2.025747537612915, -1.9139282703399658, -1.8021090030670166, -1.6902899742126465, -1.5784707069396973, -1.4666515588760376, -1.3548322916030884, -1.2430131435394287, -1.1311938762664795, -1.0193746089935303, -0.9075554013252258, -0.7957361936569214, -0.6839169859886169, -0.5720977783203125, -0.4602785110473633, -0.34845930337905884, -0.2366400957107544, -0.12482082843780518, -0.013001620769500732, 0.09881734848022461, 0.21063657104969025, 0.3224557936191559, 0.4342750310897827, 0.5460942387580872, 0.6579134464263916, 0.7697327136993408, 0.8815519213676453, 0.9933711290359497, 1.105190396308899, 1.2170095443725586, 1.3288288116455078, 1.440648078918457, 1.5524672269821167, 1.664286494255066, 1.7761056423187256, 1.8879249095916748, 1.999744176864624, 2.1115634441375732, 2.2233824729919434, 2.3352017402648926, 2.447021007537842, 2.558840274810791, 2.6706595420837402, 2.7824788093566895, 2.8942980766296387, 3.006117343902588, 3.117936611175537, 3.2297556400299072, 3.3415749073028564, 3.4533941745758057, 3.565213441848755, 3.677032470703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 7.0, 9.0, 8.0, 5.0, 8.0, 14.0, 14.0, 16.0, 23.0, 20.0, 25.0, 33.0, 28.0, 36.0, 33.0, 34.0, 31.0, 38.0, 35.0, 50.0, 32.0, 36.0, 52.0, 59.0, 40.0, 36.0, 39.0, 32.0, 24.0, 26.0, 21.0, 20.0, 22.0, 13.0, 17.0, 10.0, 9.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.927424967288971, -0.894102931022644, -0.8607808351516724, -0.8274587988853455, -0.7941367626190186, -0.7608146667480469, -0.72749263048172, -0.6941705942153931, -0.6608484983444214, -0.6275264620780945, -0.5942043662071228, -0.5608823299407959, -0.5275602340698242, -0.4942381978034973, -0.4609161615371704, -0.4275940954685211, -0.3942720293998718, -0.36094996333122253, -0.32762789726257324, -0.29430586099624634, -0.26098379492759705, -0.22766172885894775, -0.19433967769145966, -0.16101762652397156, -0.12769556045532227, -0.09437350183725357, -0.061051443219184875, -0.02772938460111618, 0.005592674016952515, 0.03891474008560181, 0.0722367912530899, 0.105558842420578, 0.13888096809387207, 0.17220303416252136, 0.20552508533000946, 0.23884713649749756, 0.27216920256614685, 0.30549126863479614, 0.33881330490112305, 0.37213537096977234, 0.40545743703842163, 0.4387795031070709, 0.4721015691757202, 0.5054236054420471, 0.538745641708374, 0.5720677375793457, 0.6053897738456726, 0.6387118101119995, 0.6720339059829712, 0.7053559422492981, 0.7386780381202698, 0.7720000743865967, 0.8053221702575684, 0.8386442065238953, 0.8719662427902222, 0.9052883386611938, 0.9386103749275208, 0.9719324111938477, 1.0052545070648193, 1.038576602935791, 1.0718985795974731, 1.1052206754684448, 1.1385427713394165, 1.1718647480010986, 1.2051868438720703]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 7.0, 7.0, 10.0, 8.0, 14.0, 24.0, 30.0, 43.0, 59.0, 86.0, 85.0, 156.0, 234.0, 329.0, 491.0, 809.0, 1262.0, 1971.0, 3379.0, 5952.0, 10628.0, 19603.0, 35464.0, 65454.0, 115436.0, 182613.0, 212320.0, 165464.0, 100762.0, 56174.0, 30607.0, 16784.0, 9157.0, 5121.0, 3057.0, 1731.0, 1110.0, 672.0, 431.0, 318.0, 194.0, 131.0, 89.0, 63.0, 69.0, 34.0, 24.0, 38.0, 15.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.175048828125, -0.16964149475097656, -0.16423416137695312, -0.1588268280029297, -0.15341949462890625, -0.1480121612548828, -0.14260482788085938, -0.13719749450683594, -0.1317901611328125, -0.12638282775878906, -0.12097549438476562, -0.11556816101074219, -0.11016082763671875, -0.10475349426269531, -0.09934616088867188, -0.09393882751464844, -0.088531494140625, -0.08312416076660156, -0.07771682739257812, -0.07230949401855469, -0.06690216064453125, -0.06149482727050781, -0.056087493896484375, -0.05068016052246094, -0.0452728271484375, -0.03986549377441406, -0.034458160400390625, -0.029050827026367188, -0.02364349365234375, -0.018236160278320312, -0.012828826904296875, -0.0074214935302734375, -0.00201416015625, 0.0033931732177734375, 0.008800506591796875, 0.014207839965820312, 0.01961517333984375, 0.025022506713867188, 0.030429840087890625, 0.03583717346191406, 0.0412445068359375, 0.04665184020996094, 0.052059173583984375, 0.05746650695800781, 0.06287384033203125, 0.06828117370605469, 0.07368850708007812, 0.07909584045410156, 0.084503173828125, 0.08991050720214844, 0.09531784057617188, 0.10072517395019531, 0.10613250732421875, 0.11153984069824219, 0.11694717407226562, 0.12235450744628906, 0.1277618408203125, 0.13316917419433594, 0.13857650756835938, 0.1439838409423828, 0.14939117431640625, 0.1547985076904297, 0.16020584106445312, 0.16561317443847656, 0.1710205078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 5.0, 7.0, 18.0, 11.0, 11.0, 20.0, 17.0, 17.0, 27.0, 24.0, 44.0, 31.0, 29.0, 34.0, 51.0, 38.0, 42.0, 48.0, 45.0, 42.0, 34.0, 41.0, 34.0, 37.0, 27.0, 39.0, 25.0, 31.0, 23.0, 21.0, 20.0, 17.0, 11.0, 16.0, 6.0, 9.0, 9.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.20916175842285156, -0.20250320434570312, -0.1958446502685547, -0.18918609619140625, -0.1825275421142578, -0.17586898803710938, -0.16921043395996094, -0.1625518798828125, -0.15589332580566406, -0.14923477172851562, -0.1425762176513672, -0.13591766357421875, -0.1292591094970703, -0.12260055541992188, -0.11594200134277344, -0.109283447265625, -0.10262489318847656, -0.09596633911132812, -0.08930778503417969, -0.08264923095703125, -0.07599067687988281, -0.06933212280273438, -0.06267356872558594, -0.0560150146484375, -0.04935646057128906, -0.042697906494140625, -0.03603935241699219, -0.02938079833984375, -0.022722244262695312, -0.016063690185546875, -0.009405136108398438, -0.00274658203125, 0.0039119720458984375, 0.010570526123046875, 0.017229080200195312, 0.02388763427734375, 0.030546188354492188, 0.037204742431640625, 0.04386329650878906, 0.0505218505859375, 0.05718040466308594, 0.06383895874023438, 0.07049751281738281, 0.07715606689453125, 0.08381462097167969, 0.09047317504882812, 0.09713172912597656, 0.103790283203125, 0.11044883728027344, 0.11710739135742188, 0.12376594543457031, 0.13042449951171875, 0.1370830535888672, 0.14374160766601562, 0.15040016174316406, 0.1570587158203125, 0.16371726989746094, 0.17037582397460938, 0.1770343780517578, 0.18369293212890625, 0.1903514862060547, 0.19701004028320312, 0.20366859436035156, 0.2103271484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 5.0, 7.0, 9.0, 15.0, 26.0, 60.0, 86.0, 132.0, 213.0, 370.0, 726.0, 1335.0, 2641.0, 5571.0, 12686.0, 31026.0, 78758.0, 200159.0, 365791.0, 208674.0, 82605.0, 32613.0, 13292.0, 5876.0, 2792.0, 1397.0, 723.0, 391.0, 233.0, 126.0, 69.0, 49.0, 44.0, 31.0, 6.0, 4.0, 2.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2519111633300781, -0.24308013916015625, -0.23424911499023438, -0.2254180908203125, -0.21658706665039062, -0.20775604248046875, -0.19892501831054688, -0.190093994140625, -0.18126296997070312, -0.17243194580078125, -0.16360092163085938, -0.1547698974609375, -0.14593887329101562, -0.13710784912109375, -0.12827682495117188, -0.11944580078125, -0.11061477661132812, -0.10178375244140625, -0.09295272827148438, -0.0841217041015625, -0.07529067993164062, -0.06645965576171875, -0.057628631591796875, -0.048797607421875, -0.039966583251953125, -0.03113555908203125, -0.022304534912109375, -0.0134735107421875, -0.004642486572265625, 0.00418853759765625, 0.013019561767578125, 0.0218505859375, 0.030681610107421875, 0.03951263427734375, 0.048343658447265625, 0.0571746826171875, 0.06600570678710938, 0.07483673095703125, 0.08366775512695312, 0.092498779296875, 0.10132980346679688, 0.11016082763671875, 0.11899185180664062, 0.1278228759765625, 0.13665390014648438, 0.14548492431640625, 0.15431594848632812, 0.16314697265625, 0.17197799682617188, 0.18080902099609375, 0.18964004516601562, 0.1984710693359375, 0.20730209350585938, 0.21613311767578125, 0.22496414184570312, 0.233795166015625, 0.24262619018554688, 0.25145721435546875, 0.2602882385253906, 0.2691192626953125, 0.2779502868652344, 0.28678131103515625, 0.2956123352050781, 0.304443359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 8.0, 9.0, 22.0, 13.0, 19.0, 16.0, 22.0, 32.0, 32.0, 45.0, 37.0, 47.0, 47.0, 52.0, 31.0, 43.0, 47.0, 43.0, 43.0, 51.0, 49.0, 39.0, 31.0, 29.0, 26.0, 22.0, 26.0, 13.0, 14.0, 15.0, 20.0, 6.0, 12.0, 2.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.599609375, -0.57977294921875, -0.5599365234375, -0.54010009765625, -0.520263671875, -0.50042724609375, -0.4805908203125, -0.46075439453125, -0.44091796875, -0.42108154296875, -0.4012451171875, -0.38140869140625, -0.361572265625, -0.34173583984375, -0.3218994140625, -0.30206298828125, -0.2822265625, -0.26239013671875, -0.2425537109375, -0.22271728515625, -0.202880859375, -0.18304443359375, -0.1632080078125, -0.14337158203125, -0.12353515625, -0.10369873046875, -0.0838623046875, -0.06402587890625, -0.044189453125, -0.02435302734375, -0.0045166015625, 0.01531982421875, 0.03515625, 0.05499267578125, 0.0748291015625, 0.09466552734375, 0.114501953125, 0.13433837890625, 0.1541748046875, 0.17401123046875, 0.19384765625, 0.21368408203125, 0.2335205078125, 0.25335693359375, 0.273193359375, 0.29302978515625, 0.3128662109375, 0.33270263671875, 0.3525390625, 0.37237548828125, 0.3922119140625, 0.41204833984375, 0.431884765625, 0.45172119140625, 0.4715576171875, 0.49139404296875, 0.51123046875, 0.53106689453125, 0.5509033203125, 0.57073974609375, 0.590576171875, 0.61041259765625, 0.6302490234375, 0.65008544921875, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 3.0, 8.0, 18.0, 23.0, 29.0, 50.0, 53.0, 116.0, 172.0, 245.0, 441.0, 682.0, 1149.0, 1852.0, 3226.0, 5656.0, 9975.0, 18171.0, 33815.0, 64261.0, 119233.0, 201441.0, 252353.0, 152097.0, 84459.0, 44821.0, 23882.0, 13004.0, 7160.0, 4086.0, 2373.0, 1377.0, 882.0, 530.0, 316.0, 217.0, 128.0, 86.0, 48.0, 31.0, 21.0, 22.0, 10.0, 3.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.0422968864440918, -0.040984153747558594, -0.03967142105102539, -0.03835868835449219, -0.037045955657958984, -0.03573322296142578, -0.03442049026489258, -0.033107757568359375, -0.03179502487182617, -0.03048229217529297, -0.029169559478759766, -0.027856826782226562, -0.02654409408569336, -0.025231361389160156, -0.023918628692626953, -0.02260589599609375, -0.021293163299560547, -0.019980430603027344, -0.01866769790649414, -0.017354965209960938, -0.016042232513427734, -0.014729499816894531, -0.013416767120361328, -0.012104034423828125, -0.010791301727294922, -0.009478569030761719, -0.008165836334228516, -0.0068531036376953125, -0.005540370941162109, -0.004227638244628906, -0.002914905548095703, -0.0016021728515625, -0.0002894401550292969, 0.0010232925415039062, 0.0023360252380371094, 0.0036487579345703125, 0.004961490631103516, 0.006274223327636719, 0.007586956024169922, 0.008899688720703125, 0.010212421417236328, 0.011525154113769531, 0.012837886810302734, 0.014150619506835938, 0.01546335220336914, 0.016776084899902344, 0.018088817596435547, 0.01940155029296875, 0.020714282989501953, 0.022027015686035156, 0.02333974838256836, 0.024652481079101562, 0.025965213775634766, 0.02727794647216797, 0.028590679168701172, 0.029903411865234375, 0.031216144561767578, 0.03252887725830078, 0.033841609954833984, 0.03515434265136719, 0.03646707534790039, 0.037779808044433594, 0.0390925407409668, 0.0404052734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 14.0, 21.0, 9.0, 20.0, 21.0, 39.0, 38.0, 49.0, 67.0, 57.0, 94.0, 84.0, 75.0, 76.0, 58.0, 65.0, 45.0, 37.0, 27.0, 16.0, 12.0, 11.0, 10.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.7000904083251953e-05, -2.6241876184940338e-05, -2.5482848286628723e-05, -2.4723820388317108e-05, -2.3964792490005493e-05, -2.3205764591693878e-05, -2.2446736693382263e-05, -2.1687708795070648e-05, -2.0928680896759033e-05, -2.0169652998447418e-05, -1.9410625100135803e-05, -1.8651597201824188e-05, -1.7892569303512573e-05, -1.7133541405200958e-05, -1.6374513506889343e-05, -1.5615485608577728e-05, -1.4856457710266113e-05, -1.4097429811954498e-05, -1.3338401913642883e-05, -1.2579374015331268e-05, -1.1820346117019653e-05, -1.1061318218708038e-05, -1.0302290320396423e-05, -9.543262422084808e-06, -8.784234523773193e-06, -8.025206625461578e-06, -7.266178727149963e-06, -6.507150828838348e-06, -5.748122930526733e-06, -4.989095032215118e-06, -4.230067133903503e-06, -3.4710392355918884e-06, -2.7120113372802734e-06, -1.9529834389686584e-06, -1.1939555406570435e-06, -4.3492764234542847e-07, 3.241002559661865e-07, 1.0831281542778015e-06, 1.8421560525894165e-06, 2.6011839509010315e-06, 3.3602118492126465e-06, 4.1192397475242615e-06, 4.8782676458358765e-06, 5.6372955441474915e-06, 6.3963234424591064e-06, 7.1553513407707214e-06, 7.914379239082336e-06, 8.673407137393951e-06, 9.432435035705566e-06, 1.0191462934017181e-05, 1.0950490832328796e-05, 1.1709518730640411e-05, 1.2468546628952026e-05, 1.3227574527263641e-05, 1.3986602425575256e-05, 1.4745630323886871e-05, 1.5504658222198486e-05, 1.62636861205101e-05, 1.7022714018821716e-05, 1.778174191713333e-05, 1.8540769815444946e-05, 1.929979771375656e-05, 2.0058825612068176e-05, 2.081785351037979e-05, 2.1576881408691406e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 5.0, 12.0, 15.0, 24.0, 29.0, 47.0, 68.0, 97.0, 117.0, 224.0, 383.0, 615.0, 1077.0, 1878.0, 3621.0, 7437.0, 15533.0, 33750.0, 74043.0, 150591.0, 267364.0, 236307.0, 133555.0, 64971.0, 29237.0, 13552.0, 6422.0, 3300.0, 1757.0, 952.0, 566.0, 338.0, 208.0, 136.0, 82.0, 58.0, 48.0, 35.0, 28.0, 13.0, 11.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.052764892578125, -0.051161766052246094, -0.04955863952636719, -0.04795551300048828, -0.046352386474609375, -0.04474925994873047, -0.04314613342285156, -0.041543006896972656, -0.03993988037109375, -0.038336753845214844, -0.03673362731933594, -0.03513050079345703, -0.033527374267578125, -0.03192424774169922, -0.030321121215820312, -0.028717994689941406, -0.0271148681640625, -0.025511741638183594, -0.023908615112304688, -0.02230548858642578, -0.020702362060546875, -0.01909923553466797, -0.017496109008789062, -0.015892982482910156, -0.01428985595703125, -0.012686729431152344, -0.011083602905273438, -0.009480476379394531, -0.007877349853515625, -0.006274223327636719, -0.0046710968017578125, -0.0030679702758789062, -0.00146484375, 0.00013828277587890625, 0.0017414093017578125, 0.0033445358276367188, 0.004947662353515625, 0.006550788879394531, 0.008153915405273438, 0.009757041931152344, 0.01136016845703125, 0.012963294982910156, 0.014566421508789062, 0.01616954803466797, 0.017772674560546875, 0.01937580108642578, 0.020978927612304688, 0.022582054138183594, 0.0241851806640625, 0.025788307189941406, 0.027391433715820312, 0.02899456024169922, 0.030597686767578125, 0.03220081329345703, 0.03380393981933594, 0.035407066345214844, 0.03701019287109375, 0.038613319396972656, 0.04021644592285156, 0.04181957244873047, 0.043422698974609375, 0.04502582550048828, 0.04662895202636719, 0.048232078552246094, 0.049835205078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 11.0, 9.0, 11.0, 13.0, 18.0, 25.0, 24.0, 31.0, 39.0, 45.0, 47.0, 67.0, 60.0, 67.0, 78.0, 47.0, 55.0, 52.0, 44.0, 45.0, 38.0, 23.0, 21.0, 19.0, 22.0, 13.0, 15.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07366943359375, -0.07128429412841797, -0.06889915466308594, -0.0665140151977539, -0.06412887573242188, -0.061743736267089844, -0.05935859680175781, -0.05697345733642578, -0.05458831787109375, -0.05220317840576172, -0.04981803894042969, -0.047432899475097656, -0.045047760009765625, -0.042662620544433594, -0.04027748107910156, -0.03789234161376953, -0.0355072021484375, -0.03312206268310547, -0.030736923217773438, -0.028351783752441406, -0.025966644287109375, -0.023581504821777344, -0.021196365356445312, -0.01881122589111328, -0.01642608642578125, -0.014040946960449219, -0.011655807495117188, -0.009270668029785156, -0.006885528564453125, -0.004500389099121094, -0.0021152496337890625, 0.00026988983154296875, 0.002655029296875, 0.005040168762207031, 0.0074253082275390625, 0.009810447692871094, 0.012195587158203125, 0.014580726623535156, 0.016965866088867188, 0.01935100555419922, 0.02173614501953125, 0.02412128448486328, 0.026506423950195312, 0.028891563415527344, 0.031276702880859375, 0.033661842346191406, 0.03604698181152344, 0.03843212127685547, 0.0408172607421875, 0.04320240020751953, 0.04558753967285156, 0.047972679138183594, 0.050357818603515625, 0.052742958068847656, 0.05512809753417969, 0.05751323699951172, 0.05989837646484375, 0.06228351593017578, 0.06466865539550781, 0.06705379486083984, 0.06943893432617188, 0.0718240737915039, 0.07420921325683594, 0.07659435272216797, 0.0789794921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 13.0, 3.0, 12.0, 28.0, 43.0, 65.0, 103.0, 122.0, 126.0, 138.0, 108.0, 85.0, 51.0, 33.0, 36.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8664002418518066, -1.8145580291748047, -1.7627158164978027, -1.7108734846115112, -1.6590312719345093, -1.6071890592575073, -1.5553468465805054, -1.5035045146942139, -1.451662302017212, -1.39982008934021, -1.347977876663208, -1.2961355447769165, -1.2442933320999146, -1.1924511194229126, -1.1406089067459106, -1.0887665748596191, -1.0369243621826172, -0.9850821495056152, -0.9332398772239685, -0.8813976645469666, -0.8295553922653198, -0.7777131795883179, -0.7258709669113159, -0.6740286946296692, -0.622186541557312, -0.5703443288803101, -0.5185020565986633, -0.4666598439216614, -0.41481757164001465, -0.3629753589630127, -0.31113311648368835, -0.259290874004364, -0.20744860172271729, -0.15560635924339294, -0.1037641242146492, -0.05192188918590546, -7.964670658111572e-05, 0.05176258087158203, 0.10360482335090637, 0.1554470658302307, 0.20728930830955505, 0.2591315507888794, 0.31097379326820374, 0.3628160357475281, 0.41465824842453003, 0.46650049090385437, 0.5183427333831787, 0.5701849460601807, 0.6220272183418274, 0.6738694310188293, 0.7257117033004761, 0.777553915977478, 0.8293961882591248, 0.8812384009361267, 0.9330806732177734, 0.9849228858947754, 1.0367650985717773, 1.0886073112487793, 1.1404495239257812, 1.1922918558120728, 1.2441340684890747, 1.2959762811660767, 1.3478184938430786, 1.3996608257293701, 1.451503038406372]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 4.0, 8.0, 8.0, 14.0, 15.0, 14.0, 18.0, 16.0, 20.0, 10.0, 24.0, 28.0, 24.0, 30.0, 25.0, 32.0, 41.0, 42.0, 43.0, 42.0, 46.0, 43.0, 43.0, 27.0, 37.0, 41.0, 36.0, 33.0, 32.0, 23.0, 33.0, 27.0, 17.0, 18.0, 8.0, 15.0, 6.0, 9.0, 11.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.0778909921646118, -1.0413627624511719, -1.004834532737732, -0.968306303024292, -0.9317781329154968, -0.8952499032020569, -0.8587216734886169, -0.8221935033798218, -0.7856652736663818, -0.7491370439529419, -0.712608814239502, -0.676080584526062, -0.6395524144172668, -0.6030241847038269, -0.566495954990387, -0.5299677848815918, -0.4934394955635071, -0.45691126585006714, -0.4203830659389496, -0.38385483622550964, -0.3473266363143921, -0.31079840660095215, -0.2742701768875122, -0.23774197697639465, -0.2012137472629547, -0.16468553245067596, -0.12815731763839722, -0.09162908792495728, -0.05510087311267853, -0.01857265830039978, 0.01795557141304016, 0.054483771324157715, 0.09101200103759766, 0.1275402158498764, 0.16406843066215515, 0.2005966603755951, 0.23712487518787384, 0.2736530900001526, 0.31018131971359253, 0.3467095196247101, 0.38323774933815, 0.41976597905158997, 0.4562941789627075, 0.49282240867614746, 0.5293506383895874, 0.5658788681030273, 0.6024070978164673, 0.6389352679252625, 0.6754634976387024, 0.7119917273521423, 0.7485199570655823, 0.7850481271743774, 0.8215763568878174, 0.8581045866012573, 0.8946328163146973, 0.9311610460281372, 0.9676892757415771, 1.004217505455017, 1.040745735168457, 1.077273964881897, 1.113802194595337, 1.1503303050994873, 1.1868586540222168, 1.2233867645263672, 1.2599149942398071]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 14.0, 11.0, 23.0, 42.0, 58.0, 85.0, 131.0, 200.0, 239.0, 467.0, 802.0, 1419.0, 2734.0, 5946.0, 15256.0, 46333.0, 174970.0, 551975.0, 1147247.0, 1246209.0, 684248.0, 223563.0, 59751.0, 18193.0, 7015.0, 3201.0, 1657.0, 1000.0, 550.0, 324.0, 225.0, 133.0, 90.0, 45.0, 33.0, 26.0, 26.0, 14.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2149658203125, -0.20805740356445312, -0.20114898681640625, -0.19424057006835938, -0.1873321533203125, -0.18042373657226562, -0.17351531982421875, -0.16660690307617188, -0.159698486328125, -0.15279006958007812, -0.14588165283203125, -0.13897323608398438, -0.1320648193359375, -0.12515640258789062, -0.11824798583984375, -0.11133956909179688, -0.10443115234375, -0.09752273559570312, -0.09061431884765625, -0.08370590209960938, -0.0767974853515625, -0.06988906860351562, -0.06298065185546875, -0.056072235107421875, -0.049163818359375, -0.042255401611328125, -0.03534698486328125, -0.028438568115234375, -0.0215301513671875, -0.014621734619140625, -0.00771331787109375, -0.000804901123046875, 0.006103515625, 0.013011932373046875, 0.01992034912109375, 0.026828765869140625, 0.0337371826171875, 0.040645599365234375, 0.04755401611328125, 0.054462432861328125, 0.061370849609375, 0.06827926635742188, 0.07518768310546875, 0.08209609985351562, 0.0890045166015625, 0.09591293334960938, 0.10282135009765625, 0.10972976684570312, 0.11663818359375, 0.12354660034179688, 0.13045501708984375, 0.13736343383789062, 0.1442718505859375, 0.15118026733398438, 0.15808868408203125, 0.16499710083007812, 0.171905517578125, 0.17881393432617188, 0.18572235107421875, 0.19263076782226562, 0.1995391845703125, 0.20644760131835938, 0.21335601806640625, 0.22026443481445312, 0.2271728515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 6.0, 4.0, 6.0, 11.0, 10.0, 10.0, 15.0, 18.0, 21.0, 20.0, 20.0, 30.0, 34.0, 23.0, 35.0, 47.0, 41.0, 43.0, 39.0, 45.0, 43.0, 34.0, 51.0, 49.0, 38.0, 29.0, 42.0, 36.0, 27.0, 28.0, 21.0, 18.0, 9.0, 17.0, 18.0, 14.0, 14.0, 4.0, 9.0, 7.0, 6.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15888214111328125, -0.1530914306640625, -0.14730072021484375, -0.141510009765625, -0.13571929931640625, -0.1299285888671875, -0.12413787841796875, -0.11834716796875, -0.11255645751953125, -0.1067657470703125, -0.10097503662109375, -0.095184326171875, -0.08939361572265625, -0.0836029052734375, -0.07781219482421875, -0.072021484375, -0.06623077392578125, -0.0604400634765625, -0.05464935302734375, -0.048858642578125, -0.04306793212890625, -0.0372772216796875, -0.03148651123046875, -0.02569580078125, -0.01990509033203125, -0.0141143798828125, -0.00832366943359375, -0.002532958984375, 0.00325775146484375, 0.0090484619140625, 0.01483917236328125, 0.0206298828125, 0.02642059326171875, 0.0322113037109375, 0.03800201416015625, 0.043792724609375, 0.04958343505859375, 0.0553741455078125, 0.06116485595703125, 0.06695556640625, 0.07274627685546875, 0.0785369873046875, 0.08432769775390625, 0.090118408203125, 0.09590911865234375, 0.1016998291015625, 0.10749053955078125, 0.11328125, 0.11907196044921875, 0.1248626708984375, 0.13065338134765625, 0.136444091796875, 0.14223480224609375, 0.1480255126953125, 0.15381622314453125, 0.15960693359375, 0.16539764404296875, 0.1711883544921875, 0.17697906494140625, 0.182769775390625, 0.18856048583984375, 0.1943511962890625, 0.20014190673828125, 0.2059326171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 10.0, 9.0, 20.0, 19.0, 35.0, 46.0, 60.0, 109.0, 192.0, 315.0, 586.0, 1286.0, 3776.0, 19069.0, 230659.0, 3528489.0, 376332.0, 25909.0, 4672.0, 1376.0, 570.0, 298.0, 170.0, 94.0, 61.0, 40.0, 30.0, 19.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71435546875, -0.695343017578125, -0.67633056640625, -0.657318115234375, -0.6383056640625, -0.619293212890625, -0.60028076171875, -0.581268310546875, -0.562255859375, -0.543243408203125, -0.52423095703125, -0.505218505859375, -0.4862060546875, -0.467193603515625, -0.44818115234375, -0.429168701171875, -0.41015625, -0.391143798828125, -0.37213134765625, -0.353118896484375, -0.3341064453125, -0.315093994140625, -0.29608154296875, -0.277069091796875, -0.258056640625, -0.239044189453125, -0.22003173828125, -0.201019287109375, -0.1820068359375, -0.162994384765625, -0.14398193359375, -0.124969482421875, -0.10595703125, -0.086944580078125, -0.06793212890625, -0.048919677734375, -0.0299072265625, -0.010894775390625, 0.00811767578125, 0.027130126953125, 0.046142578125, 0.065155029296875, 0.08416748046875, 0.103179931640625, 0.1221923828125, 0.141204833984375, 0.16021728515625, 0.179229736328125, 0.1982421875, 0.217254638671875, 0.23626708984375, 0.255279541015625, 0.2742919921875, 0.293304443359375, 0.31231689453125, 0.331329345703125, 0.350341796875, 0.369354248046875, 0.38836669921875, 0.407379150390625, 0.4263916015625, 0.445404052734375, 0.46441650390625, 0.483428955078125, 0.50244140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 4.0, 11.0, 16.0, 38.0, 20.0, 45.0, 78.0, 129.0, 179.0, 252.0, 380.0, 463.0, 556.0, 494.0, 434.0, 252.0, 227.0, 156.0, 102.0, 65.0, 47.0, 39.0, 23.0, 19.0, 11.0, 6.0, 4.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358642578125, -0.3441352844238281, -0.32962799072265625, -0.3151206970214844, -0.3006134033203125, -0.2861061096191406, -0.27159881591796875, -0.2570915222167969, -0.242584228515625, -0.22807693481445312, -0.21356964111328125, -0.19906234741210938, -0.1845550537109375, -0.17004776000976562, -0.15554046630859375, -0.14103317260742188, -0.12652587890625, -0.11201858520507812, -0.09751129150390625, -0.08300399780273438, -0.0684967041015625, -0.053989410400390625, -0.03948211669921875, -0.024974822998046875, -0.010467529296875, 0.004039764404296875, 0.01854705810546875, 0.033054351806640625, 0.0475616455078125, 0.062068939208984375, 0.07657623291015625, 0.09108352661132812, 0.1055908203125, 0.12009811401367188, 0.13460540771484375, 0.14911270141601562, 0.1636199951171875, 0.17812728881835938, 0.19263458251953125, 0.20714187622070312, 0.221649169921875, 0.23615646362304688, 0.25066375732421875, 0.2651710510253906, 0.2796783447265625, 0.2941856384277344, 0.30869293212890625, 0.3232002258300781, 0.33770751953125, 0.3522148132324219, 0.36672210693359375, 0.3812294006347656, 0.3957366943359375, 0.4102439880371094, 0.42475128173828125, 0.4392585754394531, 0.453765869140625, 0.4682731628417969, 0.48278045654296875, 0.4972877502441406, 0.5117950439453125, 0.5263023376464844, 0.5408096313476562, 0.5553169250488281, 0.56982421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 7.0, 11.0, 10.0, 20.0, 41.0, 63.0, 61.0, 108.0, 121.0, 121.0, 100.0, 84.0, 74.0, 46.0, 33.0, 30.0, 17.0, 13.0, 2.0, 9.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.110228061676025, -4.000336647033691, -3.8904457092285156, -3.7805545330047607, -3.670663356781006, -3.560771942138672, -3.450881004333496, -3.340989589691162, -3.2310984134674072, -3.1212072372436523, -3.0113160610198975, -2.9014248847961426, -2.7915337085723877, -2.681642532348633, -2.571751117706299, -2.461859941482544, -2.351968765258789, -2.242077589035034, -2.1321864128112793, -2.0222952365875244, -1.91240394115448, -1.802512764930725, -1.6926215887069702, -1.5827302932739258, -1.47283935546875, -1.3629481792449951, -1.2530570030212402, -1.1431658267974854, -1.033274531364441, -0.923383355140686, -0.8134921789169312, -0.7036009430885315, -0.5937097072601318, -0.48381850123405457, -0.3739272952079773, -0.2640361189842224, -0.15414491295814514, -0.04425370693206787, 0.06563746929168701, 0.17552870512008667, 0.28541988134384155, 0.3953110873699188, 0.5052022933959961, 0.615093469619751, 0.7249846458435059, 0.8348758816719055, 0.9447670578956604, 1.05465829372406, 1.164549469947815, 1.2744406461715698, 1.3843318223953247, 1.4942231178283691, 1.604114294052124, 1.714005470275879, 1.8238966464996338, 1.9337878227233887, 2.0436789989471436, 2.1535701751708984, 2.2634613513946533, 2.373352527618408, 2.483243703842163, 2.593134880065918, 2.703026294708252, 2.812917470932007, 2.9228086471557617]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 6.0, 19.0, 21.0, 22.0, 21.0, 24.0, 20.0, 40.0, 39.0, 33.0, 48.0, 44.0, 71.0, 47.0, 58.0, 49.0, 49.0, 42.0, 42.0, 26.0, 41.0, 34.0, 35.0, 32.0, 22.0, 25.0, 13.0, 12.0, 5.0, 12.0, 6.0, 3.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8879380226135254, -1.82570481300354, -1.7634716033935547, -1.7012385129928589, -1.6390053033828735, -1.5767720937728882, -1.5145388841629028, -1.452305793762207, -1.3900725841522217, -1.3278393745422363, -1.265606164932251, -1.2033730745315552, -1.1411398649215698, -1.0789066553115845, -1.0166734457015991, -0.9544402956962585, -0.8922070860862732, -0.8299738764762878, -0.7677407264709473, -0.7055075168609619, -0.6432743668556213, -0.581041157245636, -0.5188080072402954, -0.45657479763031006, -0.3943416178226471, -0.33210843801498413, -0.26987525820732117, -0.207642063498497, -0.14540888369083405, -0.08317568898200989, -0.020942509174346924, 0.04129067063331604, 0.103523850440979, 0.16575703024864197, 0.22799021005630493, 0.2902234196662903, 0.35245656967163086, 0.4146897792816162, 0.4769229590892792, 0.5391561388969421, 0.6013892889022827, 0.6636224985122681, 0.7258556485176086, 0.788088858127594, 0.8503220081329346, 0.9125552177429199, 0.9747884273529053, 1.0370216369628906, 1.099254846572876, 1.1614880561828613, 1.2237212657928467, 1.2859543561935425, 1.3481875658035278, 1.4104207754135132, 1.4726539850234985, 1.5348870754241943, 1.5971202850341797, 1.659353494644165, 1.7215867042541504, 1.7838197946548462, 1.8460530042648315, 1.908286213874817, 1.9705194234848022, 2.032752513885498, 2.0949857234954834]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 13.0, 22.0, 33.0, 41.0, 59.0, 76.0, 109.0, 149.0, 201.0, 323.0, 464.0, 753.0, 1086.0, 1861.0, 3331.0, 6332.0, 12900.0, 31557.0, 95498.0, 351501.0, 375202.0, 104040.0, 33803.0, 13903.0, 6413.0, 3432.0, 1899.0, 1199.0, 752.0, 492.0, 318.0, 228.0, 175.0, 113.0, 76.0, 49.0, 39.0, 30.0, 17.0, 19.0, 1.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.26513671875, -0.257568359375, -0.25, -0.242431640625, -0.23486328125, -0.227294921875, -0.2197265625, -0.212158203125, -0.20458984375, -0.197021484375, -0.189453125, -0.181884765625, -0.17431640625, -0.166748046875, -0.1591796875, -0.151611328125, -0.14404296875, -0.136474609375, -0.12890625, -0.121337890625, -0.11376953125, -0.106201171875, -0.0986328125, -0.091064453125, -0.08349609375, -0.075927734375, -0.068359375, -0.060791015625, -0.05322265625, -0.045654296875, -0.0380859375, -0.030517578125, -0.02294921875, -0.015380859375, -0.0078125, -0.000244140625, 0.00732421875, 0.014892578125, 0.0224609375, 0.030029296875, 0.03759765625, 0.045166015625, 0.052734375, 0.060302734375, 0.06787109375, 0.075439453125, 0.0830078125, 0.090576171875, 0.09814453125, 0.105712890625, 0.11328125, 0.120849609375, 0.12841796875, 0.135986328125, 0.1435546875, 0.151123046875, 0.15869140625, 0.166259765625, 0.173828125, 0.181396484375, 0.18896484375, 0.196533203125, 0.2041015625, 0.211669921875, 0.21923828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 15.0, 11.0, 12.0, 12.0, 14.0, 24.0, 16.0, 28.0, 27.0, 32.0, 27.0, 45.0, 38.0, 36.0, 60.0, 53.0, 46.0, 56.0, 52.0, 42.0, 58.0, 50.0, 39.0, 32.0, 22.0, 19.0, 22.0, 16.0, 17.0, 20.0, 11.0, 8.0, 8.0, 2.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25439453125, -0.24651336669921875, -0.2386322021484375, -0.23075103759765625, -0.222869873046875, -0.21498870849609375, -0.2071075439453125, -0.19922637939453125, -0.19134521484375, -0.18346405029296875, -0.1755828857421875, -0.16770172119140625, -0.159820556640625, -0.15193939208984375, -0.1440582275390625, -0.13617706298828125, -0.1282958984375, -0.12041473388671875, -0.1125335693359375, -0.10465240478515625, -0.096771240234375, -0.08889007568359375, -0.0810089111328125, -0.07312774658203125, -0.06524658203125, -0.05736541748046875, -0.0494842529296875, -0.04160308837890625, -0.033721923828125, -0.02584075927734375, -0.0179595947265625, -0.01007843017578125, -0.002197265625, 0.00568389892578125, 0.0135650634765625, 0.02144622802734375, 0.029327392578125, 0.03720855712890625, 0.0450897216796875, 0.05297088623046875, 0.06085205078125, 0.06873321533203125, 0.0766143798828125, 0.08449554443359375, 0.092376708984375, 0.10025787353515625, 0.1081390380859375, 0.11602020263671875, 0.1239013671875, 0.13178253173828125, 0.1396636962890625, 0.14754486083984375, 0.155426025390625, 0.16330718994140625, 0.1711883544921875, 0.17906951904296875, 0.18695068359375, 0.19483184814453125, 0.2027130126953125, 0.21059417724609375, 0.218475341796875, 0.22635650634765625, 0.2342376708984375, 0.24211883544921875, 0.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 6.0, 14.0, 10.0, 9.0, 20.0, 42.0, 46.0, 62.0, 116.0, 176.0, 286.0, 485.0, 918.0, 1933.0, 4013.0, 9044.0, 21966.0, 62098.0, 229193.0, 514857.0, 134203.0, 40498.0, 15523.0, 6553.0, 3095.0, 1554.0, 765.0, 380.0, 258.0, 155.0, 86.0, 48.0, 42.0, 28.0, 12.0, 17.0, 9.0, 4.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.220947265625, -0.214508056640625, -0.20806884765625, -0.201629638671875, -0.1951904296875, -0.188751220703125, -0.18231201171875, -0.175872802734375, -0.16943359375, -0.162994384765625, -0.15655517578125, -0.150115966796875, -0.1436767578125, -0.137237548828125, -0.13079833984375, -0.124359130859375, -0.117919921875, -0.111480712890625, -0.10504150390625, -0.098602294921875, -0.0921630859375, -0.085723876953125, -0.07928466796875, -0.072845458984375, -0.06640625, -0.059967041015625, -0.05352783203125, -0.047088623046875, -0.0406494140625, -0.034210205078125, -0.02777099609375, -0.021331787109375, -0.014892578125, -0.008453369140625, -0.00201416015625, 0.004425048828125, 0.0108642578125, 0.017303466796875, 0.02374267578125, 0.030181884765625, 0.03662109375, 0.043060302734375, 0.04949951171875, 0.055938720703125, 0.0623779296875, 0.068817138671875, 0.07525634765625, 0.081695556640625, 0.088134765625, 0.094573974609375, 0.10101318359375, 0.107452392578125, 0.1138916015625, 0.120330810546875, 0.12677001953125, 0.133209228515625, 0.1396484375, 0.146087646484375, 0.15252685546875, 0.158966064453125, 0.1654052734375, 0.171844482421875, 0.17828369140625, 0.184722900390625, 0.191162109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 7.0, 13.0, 10.0, 16.0, 17.0, 30.0, 16.0, 30.0, 25.0, 43.0, 37.0, 43.0, 53.0, 66.0, 71.0, 53.0, 66.0, 49.0, 50.0, 45.0, 40.0, 36.0, 35.0, 25.0, 21.0, 18.0, 4.0, 18.0, 7.0, 11.0, 5.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6504135131835938, -0.6313934326171875, -0.6123733520507812, -0.593353271484375, -0.5743331909179688, -0.5553131103515625, -0.5362930297851562, -0.51727294921875, -0.49825286865234375, -0.4792327880859375, -0.46021270751953125, -0.441192626953125, -0.42217254638671875, -0.4031524658203125, -0.38413238525390625, -0.3651123046875, -0.34609222412109375, -0.3270721435546875, -0.30805206298828125, -0.289031982421875, -0.27001190185546875, -0.2509918212890625, -0.23197174072265625, -0.21295166015625, -0.19393157958984375, -0.1749114990234375, -0.15589141845703125, -0.136871337890625, -0.11785125732421875, -0.0988311767578125, -0.07981109619140625, -0.060791015625, -0.04177093505859375, -0.0227508544921875, -0.00373077392578125, 0.015289306640625, 0.03430938720703125, 0.0533294677734375, 0.07234954833984375, 0.09136962890625, 0.11038970947265625, 0.1294097900390625, 0.14842987060546875, 0.167449951171875, 0.18647003173828125, 0.2054901123046875, 0.22451019287109375, 0.2435302734375, 0.26255035400390625, 0.2815704345703125, 0.30059051513671875, 0.319610595703125, 0.33863067626953125, 0.3576507568359375, 0.37667083740234375, 0.39569091796875, 0.41471099853515625, 0.4337310791015625, 0.45275115966796875, 0.471771240234375, 0.49079132080078125, 0.5098114013671875, 0.5288314819335938, 0.5478515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 7.0, 25.0, 32.0, 39.0, 78.0, 161.0, 313.0, 706.0, 2600.0, 16019.0, 245371.0, 734851.0, 41323.0, 5059.0, 1089.0, 391.0, 202.0, 90.0, 61.0, 33.0, 20.0, 22.0, 6.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08209228515625, -0.07946109771728516, -0.07682991027832031, -0.07419872283935547, -0.07156753540039062, -0.06893634796142578, -0.06630516052246094, -0.0636739730834961, -0.06104278564453125, -0.058411598205566406, -0.05578041076660156, -0.05314922332763672, -0.050518035888671875, -0.04788684844970703, -0.04525566101074219, -0.042624473571777344, -0.0399932861328125, -0.037362098693847656, -0.03473091125488281, -0.03209972381591797, -0.029468536376953125, -0.02683734893798828, -0.024206161499023438, -0.021574974060058594, -0.01894378662109375, -0.016312599182128906, -0.013681411743164062, -0.011050224304199219, -0.008419036865234375, -0.005787849426269531, -0.0031566619873046875, -0.0005254745483398438, 0.002105712890625, 0.004736900329589844, 0.0073680877685546875, 0.009999275207519531, 0.012630462646484375, 0.015261650085449219, 0.017892837524414062, 0.020524024963378906, 0.02315521240234375, 0.025786399841308594, 0.028417587280273438, 0.03104877471923828, 0.033679962158203125, 0.03631114959716797, 0.03894233703613281, 0.041573524475097656, 0.0442047119140625, 0.046835899353027344, 0.04946708679199219, 0.05209827423095703, 0.054729461669921875, 0.05736064910888672, 0.05999183654785156, 0.0626230239868164, 0.06525421142578125, 0.0678853988647461, 0.07051658630371094, 0.07314777374267578, 0.07577896118164062, 0.07841014862060547, 0.08104133605957031, 0.08367252349853516, 0.0863037109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 7.0, 3.0, 10.0, 14.0, 14.0, 18.0, 21.0, 32.0, 42.0, 55.0, 59.0, 80.0, 80.0, 100.0, 99.0, 82.0, 73.0, 56.0, 35.0, 36.0, 22.0, 12.0, 16.0, 8.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0623207092285156e-05, -2.011377364397049e-05, -1.9604340195655823e-05, -1.9094906747341156e-05, -1.858547329902649e-05, -1.8076039850711823e-05, -1.7566606402397156e-05, -1.705717295408249e-05, -1.6547739505767822e-05, -1.6038306057453156e-05, -1.552887260913849e-05, -1.5019439160823822e-05, -1.4510005712509155e-05, -1.4000572264194489e-05, -1.3491138815879822e-05, -1.2981705367565155e-05, -1.2472271919250488e-05, -1.1962838470935822e-05, -1.1453405022621155e-05, -1.0943971574306488e-05, -1.0434538125991821e-05, -9.925104677677155e-06, -9.415671229362488e-06, -8.906237781047821e-06, -8.396804332733154e-06, -7.887370884418488e-06, -7.377937436103821e-06, -6.868503987789154e-06, -6.359070539474487e-06, -5.8496370911598206e-06, -5.340203642845154e-06, -4.830770194530487e-06, -4.32133674621582e-06, -3.8119032979011536e-06, -3.302469849586487e-06, -2.79303640127182e-06, -2.2836029529571533e-06, -1.7741695046424866e-06, -1.2647360563278198e-06, -7.553026080131531e-07, -2.4586915969848633e-07, 2.635642886161804e-07, 7.729977369308472e-07, 1.282431185245514e-06, 1.7918646335601807e-06, 2.3012980818748474e-06, 2.810731530189514e-06, 3.320164978504181e-06, 3.829598426818848e-06, 4.339031875133514e-06, 4.848465323448181e-06, 5.357898771762848e-06, 5.867332220077515e-06, 6.376765668392181e-06, 6.886199116706848e-06, 7.395632565021515e-06, 7.905066013336182e-06, 8.414499461650848e-06, 8.923932909965515e-06, 9.433366358280182e-06, 9.942799806594849e-06, 1.0452233254909515e-05, 1.0961666703224182e-05, 1.1471100151538849e-05, 1.1980533599853516e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 11.0, 15.0, 13.0, 20.0, 39.0, 59.0, 68.0, 94.0, 165.0, 267.0, 556.0, 1184.0, 2944.0, 9410.0, 42601.0, 265949.0, 601066.0, 97228.0, 18433.0, 4844.0, 1696.0, 799.0, 411.0, 211.0, 138.0, 89.0, 67.0, 51.0, 35.0, 29.0, 14.0, 20.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05742692947387695, -0.055527687072753906, -0.05362844467163086, -0.05172920227050781, -0.049829959869384766, -0.04793071746826172, -0.04603147506713867, -0.044132232666015625, -0.04223299026489258, -0.04033374786376953, -0.038434505462646484, -0.03653526306152344, -0.03463602066040039, -0.032736778259277344, -0.030837535858154297, -0.02893829345703125, -0.027039051055908203, -0.025139808654785156, -0.02324056625366211, -0.021341323852539062, -0.019442081451416016, -0.01754283905029297, -0.015643596649169922, -0.013744354248046875, -0.011845111846923828, -0.009945869445800781, -0.008046627044677734, -0.0061473846435546875, -0.004248142242431641, -0.0023488998413085938, -0.0004496574401855469, 0.0014495849609375, 0.003348827362060547, 0.005248069763183594, 0.007147312164306641, 0.009046554565429688, 0.010945796966552734, 0.012845039367675781, 0.014744281768798828, 0.016643524169921875, 0.018542766571044922, 0.02044200897216797, 0.022341251373291016, 0.024240493774414062, 0.02613973617553711, 0.028038978576660156, 0.029938220977783203, 0.03183746337890625, 0.0337367057800293, 0.035635948181152344, 0.03753519058227539, 0.03943443298339844, 0.041333675384521484, 0.04323291778564453, 0.04513216018676758, 0.047031402587890625, 0.04893064498901367, 0.05082988739013672, 0.052729129791259766, 0.05462837219238281, 0.05652761459350586, 0.058426856994628906, 0.06032609939575195, 0.062225341796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 17.0, 25.0, 56.0, 127.0, 166.0, 218.0, 173.0, 102.0, 57.0, 18.0, 18.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1220703125, -0.11745643615722656, -0.11284255981445312, -0.10822868347167969, -0.10361480712890625, -0.09900093078613281, -0.09438705444335938, -0.08977317810058594, -0.0851593017578125, -0.08054542541503906, -0.07593154907226562, -0.07131767272949219, -0.06670379638671875, -0.06208992004394531, -0.057476043701171875, -0.05286216735839844, -0.048248291015625, -0.04363441467285156, -0.039020538330078125, -0.03440666198730469, -0.02979278564453125, -0.025178909301757812, -0.020565032958984375, -0.015951156616210938, -0.0113372802734375, -0.0067234039306640625, -0.002109527587890625, 0.0025043487548828125, 0.00711822509765625, 0.011732101440429688, 0.016345977783203125, 0.020959854125976562, 0.02557373046875, 0.030187606811523438, 0.034801483154296875, 0.03941535949707031, 0.04402923583984375, 0.04864311218261719, 0.053256988525390625, 0.05787086486816406, 0.0624847412109375, 0.06709861755371094, 0.07171249389648438, 0.07632637023925781, 0.08094024658203125, 0.08555412292480469, 0.09016799926757812, 0.09478187561035156, 0.099395751953125, 0.10400962829589844, 0.10862350463867188, 0.11323738098144531, 0.11785125732421875, 0.12246513366699219, 0.12707901000976562, 0.13169288635253906, 0.1363067626953125, 0.14092063903808594, 0.14553451538085938, 0.1501483917236328, 0.15476226806640625, 0.1593761444091797, 0.16399002075195312, 0.16860389709472656, 0.1732177734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 16.0, 28.0, 60.0, 104.0, 161.0, 206.0, 144.0, 101.0, 63.0, 40.0, 17.0, 16.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4897353649139404, -1.4257055521011353, -1.36167573928833, -1.297645926475525, -1.2336161136627197, -1.169586181640625, -1.1055563688278198, -1.0415265560150146, -0.9774967432022095, -0.9134669303894043, -0.8494371175765991, -0.7854072451591492, -0.721377432346344, -0.6573476195335388, -0.5933177471160889, -0.5292879343032837, -0.4652581214904785, -0.40122830867767334, -0.3371984660625458, -0.2731686234474182, -0.20913881063461304, -0.14510899782180786, -0.0810791552066803, -0.017049312591552734, 0.04698050022125244, 0.11101032793521881, 0.17504015564918518, 0.23906998336315155, 0.3030998110771179, 0.3671296238899231, 0.43115946650505066, 0.4951893091201782, 0.5592188835144043, 0.6232486963272095, 0.6872785091400146, 0.7513083815574646, 0.8153381943702698, 0.879368007183075, 0.9433978796005249, 1.00742769241333, 1.0714575052261353, 1.1354873180389404, 1.1995171308517456, 1.2635469436645508, 1.3275768756866455, 1.3916065692901611, 1.4556365013122559, 1.519666314125061, 1.5836961269378662, 1.6477259397506714, 1.7117557525634766, 1.7757855653762817, 1.839815378189087, 1.9038453102111816, 1.9678751230239868, 2.031904935836792, 2.0959348678588867, 2.1599647998809814, 2.223994493484497, 2.288024425506592, 2.3520541191101074, 2.416084051132202, 2.4801137447357178, 2.5441436767578125, 2.608173370361328]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 3.0, 8.0, 17.0, 13.0, 17.0, 19.0, 37.0, 51.0, 29.0, 46.0, 77.0, 84.0, 98.0, 93.0, 93.0, 54.0, 50.0, 45.0, 31.0, 33.0, 15.0, 15.0, 16.0, 11.0, 12.0, 9.0, 8.0, 5.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.70977783203125, -2.6448240280151367, -2.5798699855804443, -2.514916181564331, -2.4499623775482178, -2.3850083351135254, -2.320054531097412, -2.255100727081299, -2.1901469230651855, -2.1251931190490723, -2.06023907661438, -1.9952852725982666, -1.9303314685821533, -1.8653775453567505, -1.8004236221313477, -1.7354698181152344, -1.670515775680542, -1.6055618524551392, -1.5406080484390259, -1.475654125213623, -1.4107003211975098, -1.345746397972107, -1.280792474746704, -1.2158386707305908, -1.150884747505188, -1.0859308242797852, -1.0209770202636719, -0.956023097038269, -0.891069233417511, -0.8261153697967529, -0.7611614465713501, -0.696207582950592, -0.6312539577484131, -0.566300094127655, -0.501346230506897, -0.43639230728149414, -0.3714384436607361, -0.306484580039978, -0.24153068661689758, -0.17657679319381714, -0.11162292957305908, -0.04666905105113983, 0.01828482747077942, 0.08323870599269867, 0.14819258451461792, 0.21314644813537598, 0.2781003415584564, 0.34305423498153687, 0.4080080986022949, 0.472961962223053, 0.537915825843811, 0.6028697490692139, 0.6678236126899719, 0.73277747631073, 0.7977313995361328, 0.8626852631568909, 0.9276391267776489, 0.992592990398407, 1.057546854019165, 1.1225007772445679, 1.1874547004699707, 1.252408504486084, 1.3173624277114868, 1.3823163509368896, 1.447270154953003]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 8.0, 13.0, 20.0, 18.0, 24.0, 39.0, 46.0, 94.0, 345.0, 149.0, 72.0, 37.0, 34.0, 28.0, 18.0, 5.0, 15.0, 3.0, 8.0, 9.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5461463928222656, -0.5327224731445312, -0.5192985534667969, -0.5058746337890625, -0.4924507141113281, -0.47902679443359375, -0.4656028747558594, -0.452178955078125, -0.4387550354003906, -0.42533111572265625, -0.4119071960449219, -0.3984832763671875, -0.3850593566894531, -0.37163543701171875, -0.3582115173339844, -0.34478759765625, -0.3313636779785156, -0.31793975830078125, -0.3045158386230469, -0.2910919189453125, -0.2776679992675781, -0.26424407958984375, -0.2508201599121094, -0.237396240234375, -0.22397232055664062, -0.21054840087890625, -0.19712448120117188, -0.1837005615234375, -0.17027664184570312, -0.15685272216796875, -0.14342880249023438, -0.1300048828125, -0.11658096313476562, -0.10315704345703125, -0.08973312377929688, -0.0763092041015625, -0.06288528442382812, -0.04946136474609375, -0.036037445068359375, -0.022613525390625, -0.009189605712890625, 0.00423431396484375, 0.017658233642578125, 0.0310821533203125, 0.044506072998046875, 0.05792999267578125, 0.07135391235351562, 0.08477783203125, 0.09820175170898438, 0.11162567138671875, 0.12504959106445312, 0.1384735107421875, 0.15189743041992188, 0.16532135009765625, 0.17874526977539062, 0.192169189453125, 0.20559310913085938, 0.21901702880859375, 0.23244094848632812, 0.2458648681640625, 0.2592887878417969, 0.27271270751953125, 0.2861366271972656, 0.299560546875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 8.0, 6.0, 10.0, 13.0, 26.0, 37.0, 45.0, 62.0, 91.0, 153.0, 325.0, 505.0, 1043.0, 2579.0, 7921.0, 46830.0, 8290924.0, 27571.0, 6332.0, 2185.0, 886.0, 407.0, 210.0, 138.0, 88.0, 53.0, 43.0, 22.0, 17.0, 16.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0089939832687378, -0.9812751412391663, -0.9535562992095947, -0.9258373975753784, -0.8981185555458069, -0.8703997135162354, -0.842680811882019, -0.8149619698524475, -0.787243127822876, -0.7595242857933044, -0.7318054437637329, -0.7040865421295166, -0.6763677000999451, -0.6486488580703735, -0.6209299564361572, -0.5932111144065857, -0.5654922723770142, -0.5377734303474426, -0.5100545883178711, -0.4823356866836548, -0.45461684465408325, -0.4268980026245117, -0.3991791307926178, -0.3714602589607239, -0.34374141693115234, -0.3160225749015808, -0.2883037030696869, -0.26058483123779297, -0.23286598920822144, -0.2051471322774887, -0.17742827534675598, -0.14970941841602325, -0.12199056148529053, -0.0942717045545578, -0.06655284762382507, -0.038833990693092346, -0.01111513376235962, 0.016603723168373108, 0.044322580099105835, 0.07204143702983856, 0.09976029396057129, 0.12747915089130402, 0.15519800782203674, 0.18291686475276947, 0.2106357216835022, 0.23835457861423492, 0.26607343554496765, 0.2937923073768616, 0.3215111494064331, 0.34922999143600464, 0.37694886326789856, 0.4046677350997925, 0.432386577129364, 0.46010541915893555, 0.48782429099082947, 0.5155431628227234, 0.5432620048522949, 0.5709808468818665, 0.598699688911438, 0.6264185905456543, 0.6541374325752258, 0.6818562746047974, 0.7095751762390137, 0.7372940182685852, 0.7650128602981567]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 5.0, 0.0, 6.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1780942678451538, -1.1300227642059326, -1.0819511413574219, -1.0338796377182007, -0.9858080744743347, -0.9377365112304688, -0.8896650075912476, -0.8415934443473816, -0.7935218811035156, -0.7454503178596497, -0.6973788142204285, -0.6493072509765625, -0.6012356877326965, -0.5531641244888306, -0.5050926208496094, -0.4570210576057434, -0.4089495539665222, -0.36087802052497864, -0.31280645728111267, -0.2647349238395691, -0.21666337549686432, -0.16859182715415955, -0.12052029371261597, -0.07244873046875, -0.02437719702720642, 0.023694347590208054, 0.07176589220762253, 0.1198374330997467, 0.16790898144245148, 0.21598052978515625, 0.26405206322669983, 0.3121236264705658, 0.3601951599121094, 0.40826669335365295, 0.4563382565975189, 0.5044097900390625, 0.5524813532829285, 0.6005529165267944, 0.6486244201660156, 0.6966959834098816, 0.7447675466537476, 0.7928391098976135, 0.8409106135368347, 0.8889821767807007, 0.9370537400245667, 0.9851253032684326, 1.0331968069076538, 1.081268310546875, 1.1293399333953857, 1.177411437034607, 1.2254830598831177, 1.2735545635223389, 1.32162606716156, 1.3696976900100708, 1.417769193649292, 1.4658408164978027, 1.5139122009277344, 1.5619837045669556, 1.6100553274154663, 1.6581268310546875, 1.7061983346939087, 1.7542699575424194, 1.8023414611816406, 1.8504130840301514, 1.8984845876693726]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 15.0, 14.0, 18.0, 18.0, 20.0, 35.0, 37.0, 48.0, 63.0, 56.0, 56.0, 59.0, 66.0, 48.0, 63.0, 51.0, 50.0, 50.0, 41.0, 34.0, 32.0, 28.0, 16.0, 14.0, 16.0, 15.0, 2.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0], "bins": [-0.125, -0.12207317352294922, -0.11914634704589844, -0.11621952056884766, -0.11329269409179688, -0.1103658676147461, -0.10743904113769531, -0.10451221466064453, -0.10158538818359375, -0.09865856170654297, -0.09573173522949219, -0.0928049087524414, -0.08987808227539062, -0.08695125579833984, -0.08402442932128906, -0.08109760284423828, -0.0781707763671875, -0.07524394989013672, -0.07231712341308594, -0.06939029693603516, -0.06646347045898438, -0.0635366439819336, -0.06060981750488281, -0.05768299102783203, -0.05475616455078125, -0.05182933807373047, -0.04890251159667969, -0.045975685119628906, -0.043048858642578125, -0.040122032165527344, -0.03719520568847656, -0.03426837921142578, -0.031341552734375, -0.02841472625732422, -0.025487899780273438, -0.022561073303222656, -0.019634246826171875, -0.016707420349121094, -0.013780593872070312, -0.010853767395019531, -0.00792694091796875, -0.005000114440917969, -0.0020732879638671875, 0.0008535385131835938, 0.003780364990234375, 0.006707191467285156, 0.009634017944335938, 0.012560844421386719, 0.0154876708984375, 0.01841449737548828, 0.021341323852539062, 0.024268150329589844, 0.027194976806640625, 0.030121803283691406, 0.03304862976074219, 0.03597545623779297, 0.03890228271484375, 0.04182910919189453, 0.04475593566894531, 0.047682762145996094, 0.050609588623046875, 0.053536415100097656, 0.05646324157714844, 0.05939006805419922, 0.06231689453125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 1.0, 2.0, 6.0, 10.0, 19.0, 18.0, 28.0, 44.0, 73.0, 137.0, 209.0, 349.0, 608.0, 1224.0, 2529.0, 5803.0, 16735.0, 70773.0, 295271.0, 97049.0, 20538.0, 6716.0, 2902.0, 1404.0, 747.0, 410.0, 236.0, 148.0, 96.0, 54.0, 45.0, 26.0, 17.0, 16.0, 12.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.70684814453125, -3.5894775390625, -3.47210693359375, -3.354736328125, -3.23736572265625, -3.1199951171875, -3.00262451171875, -2.88525390625, -2.76788330078125, -2.6505126953125, -2.53314208984375, -2.415771484375, -2.29840087890625, -2.1810302734375, -2.06365966796875, -1.9462890625, -1.82891845703125, -1.7115478515625, -1.59417724609375, -1.476806640625, -1.35943603515625, -1.2420654296875, -1.12469482421875, -1.00732421875, -0.88995361328125, -0.7725830078125, -0.65521240234375, -0.537841796875, -0.42047119140625, -0.3031005859375, -0.18572998046875, -0.068359375, 0.04901123046875, 0.1663818359375, 0.28375244140625, 0.401123046875, 0.51849365234375, 0.6358642578125, 0.75323486328125, 0.87060546875, 0.98797607421875, 1.1053466796875, 1.22271728515625, 1.340087890625, 1.45745849609375, 1.5748291015625, 1.69219970703125, 1.8095703125, 1.92694091796875, 2.0443115234375, 2.16168212890625, 2.279052734375, 2.39642333984375, 2.5137939453125, 2.63116455078125, 2.74853515625, 2.86590576171875, 2.9832763671875, 3.10064697265625, 3.218017578125, 3.33538818359375, 3.4527587890625, 3.57012939453125, 3.6875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 12.0, 12.0, 8.0, 16.0, 12.0, 19.0, 18.0, 24.0, 25.0, 34.0, 43.0, 31.0, 53.0, 42.0, 51.0, 53.0, 68.0, 46.0, 51.0, 49.0, 44.0, 40.0, 49.0, 27.0, 29.0, 18.0, 19.0, 19.0, 16.0, 7.0, 5.0, 6.0, 12.0, 12.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.274169921875, -0.2668342590332031, -0.25949859619140625, -0.2521629333496094, -0.2448272705078125, -0.23749160766601562, -0.23015594482421875, -0.22282028198242188, -0.215484619140625, -0.20814895629882812, -0.20081329345703125, -0.19347763061523438, -0.1861419677734375, -0.17880630493164062, -0.17147064208984375, -0.16413497924804688, -0.15679931640625, -0.14946365356445312, -0.14212799072265625, -0.13479232788085938, -0.1274566650390625, -0.12012100219726562, -0.11278533935546875, -0.10544967651367188, -0.098114013671875, -0.09077835083007812, -0.08344268798828125, -0.07610702514648438, -0.0687713623046875, -0.061435699462890625, -0.05410003662109375, -0.046764373779296875, -0.0394287109375, -0.032093048095703125, -0.02475738525390625, -0.017421722412109375, -0.0100860595703125, -0.002750396728515625, 0.00458526611328125, 0.011920928955078125, 0.019256591796875, 0.026592254638671875, 0.03392791748046875, 0.041263580322265625, 0.0485992431640625, 0.055934906005859375, 0.06327056884765625, 0.07060623168945312, 0.07794189453125, 0.08527755737304688, 0.09261322021484375, 0.09994888305664062, 0.1072845458984375, 0.11462020874023438, 0.12195587158203125, 0.12929153442382812, 0.136627197265625, 0.14396286010742188, 0.15129852294921875, 0.15863418579101562, 0.1659698486328125, 0.17330551147460938, 0.18064117431640625, 0.18797683715820312, 0.1953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 8.0, 17.0, 12.0, 15.0, 26.0, 23.0, 43.0, 63.0, 58.0, 56.0, 43.0, 36.0, 16.0, 13.0, 13.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.92402184009552, -0.9018286466598511, -0.8796354532241821, -0.8574422597885132, -0.835249125957489, -0.8130559325218201, -0.7908627390861511, -0.7686695456504822, -0.7464763522148132, -0.7242831587791443, -0.7020899653434753, -0.6798968315124512, -0.6577036380767822, -0.6355104446411133, -0.6133172512054443, -0.5911240577697754, -0.5689308643341064, -0.5467376708984375, -0.5245444774627686, -0.5023512840270996, -0.48015812039375305, -0.4579649567604065, -0.43577176332473755, -0.4135785698890686, -0.39138543605804443, -0.3691922426223755, -0.34699907898902893, -0.32480588555336, -0.30261269211769104, -0.2804195284843445, -0.25822633504867554, -0.2360331416130066, -0.21383994817733765, -0.1916467696428299, -0.16945357620716095, -0.1472603976726532, -0.12506720423698425, -0.1028740257024765, -0.08068084716796875, -0.058487653732299805, -0.03629447519779205, -0.014101291075348854, 0.008091893047094345, 0.030285075306892395, 0.05247826129198074, 0.07467144727706909, 0.09686462581157684, 0.11905781924724579, 0.14125099778175354, 0.1634441763162613, 0.18563736975193024, 0.207830548286438, 0.23002374172210693, 0.2522169351577759, 0.27441009879112244, 0.2966032922267914, 0.31879645586013794, 0.3409896492958069, 0.36318281292915344, 0.3853760063648224, 0.40756919980049133, 0.4297623634338379, 0.45195555686950684, 0.4741487503051758, 0.4963419437408447]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 2.0, 3.0, 5.0, 5.0, 15.0, 4.0, 5.0, 5.0, 13.0, 8.0, 16.0, 39.0, 77.0, 97.0, 63.0, 25.0, 17.0, 12.0, 10.0, 6.0, 4.0, 10.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8056405782699585, -0.7803385853767395, -0.7550365924835205, -0.7297345995903015, -0.7044326066970825, -0.6791306138038635, -0.6538286209106445, -0.6285266876220703, -0.6032246351242065, -0.5779226422309875, -0.5526206493377686, -0.5273186564445496, -0.5020166635513306, -0.4767146706581116, -0.45141270756721497, -0.42611071467399597, -0.40080875158309937, -0.37550675868988037, -0.3502047657966614, -0.3249027729034424, -0.2996007800102234, -0.2742987871170044, -0.2489968240261078, -0.2236948311328888, -0.1983928382396698, -0.1730908453464508, -0.1477888524532318, -0.12248687446117401, -0.09718488156795502, -0.07188288867473602, -0.04658091068267822, -0.02127891778945923, 0.004023134708404541, 0.029325123876333237, 0.05462711304426193, 0.07992909848690033, 0.10523109138011932, 0.13053308427333832, 0.15583506226539612, 0.1811370551586151, 0.2064390480518341, 0.2317410409450531, 0.2570430338382721, 0.2823449969291687, 0.3076469898223877, 0.3329489827156067, 0.3582509756088257, 0.3835529685020447, 0.40885496139526367, 0.43415695428848267, 0.45945894718170166, 0.48476094007492065, 0.5100629329681396, 0.5353649258613586, 0.5606669187545776, 0.5859688520431519, 0.6112709045410156, 0.6365728974342346, 0.6618748903274536, 0.6871768832206726, 0.7124788761138916, 0.7377808690071106, 0.7630828619003296, 0.7883847951889038, 0.8136867880821228]}, "eval/loss": 2.26958966255188, "eval/bleu": 5.858561653487833e-14, "eval/runtime": 2627.4744, "eval/samples_per_second": 5.618, "eval/steps_per_second": 0.702} \ No newline at end of file +{"train/loss": 2.2063, "train/learning_rate": 5.972477064220184e-06, "train/epoch": 2.47, "train/global_step": 4000, "_runtime": 57505, "_timestamp": 1651829773, "_step": 4007, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 44.0, 74.0, 144.0, 206.0, 198.0, 163.0, 108.0, 37.0, 18.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.9302027225494385, -1.8950679302215576, -1.8599330186843872, -1.8247982263565063, -1.789663314819336, -1.754528522491455, -1.7193936109542847, -1.6842588186264038, -1.6491239070892334, -1.6139891147613525, -1.5788542032241821, -1.5437194108963013, -1.5085844993591309, -1.47344970703125, -1.4383147954940796, -1.4031800031661987, -1.3680452108383179, -1.332910418510437, -1.2977755069732666, -1.2626407146453857, -1.2275058031082153, -1.1923710107803345, -1.157236099243164, -1.1221013069152832, -1.0869665145874023, -1.0518317222595215, -1.016696810722351, -0.9815619587898254, -0.9464271068572998, -0.911292314529419, -0.8761574625968933, -0.8410226106643677, -0.8058875799179077, -0.7707527279853821, -0.7356178760528564, -0.7004830241203308, -0.6653481721878052, -0.6302133798599243, -0.5950785279273987, -0.559943675994873, -0.5248088240623474, -0.4896739721298218, -0.45453912019729614, -0.4194042980670929, -0.38426944613456726, -0.3491345942020416, -0.3139997720718384, -0.27886492013931274, -0.2437300682067871, -0.20859521627426147, -0.17346037924289703, -0.1383255422115326, -0.10319069027900696, -0.06805583834648132, -0.03292100131511688, 0.0022138357162475586, 0.03734868764877319, 0.07248353213071823, 0.10761837661266327, 0.1427532136440277, 0.17788806557655334, 0.21302291750907898, 0.24815775454044342, 0.28329259157180786, 0.3184274435043335]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 11.0, 8.0, 10.0, 6.0, 12.0, 13.0, 10.0, 12.0, 18.0, 28.0, 16.0, 21.0, 27.0, 30.0, 28.0, 39.0, 27.0, 35.0, 45.0, 38.0, 46.0, 30.0, 29.0, 30.0, 34.0, 42.0, 37.0, 38.0, 29.0, 35.0, 31.0, 30.0, 21.0, 18.0, 26.0, 19.0, 14.0, 11.0, 5.0, 7.0, 5.0, 4.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.3742057681083679, -0.3616308569908142, -0.3490559458732605, -0.3364810347557068, -0.3239060938358307, -0.311331182718277, -0.29875627160072327, -0.28618136048316956, -0.27360644936561584, -0.26103153824806213, -0.24845661222934723, -0.23588170111179352, -0.2233067899942398, -0.2107318639755249, -0.1981569528579712, -0.18558204174041748, -0.17300711572170258, -0.16043220460414886, -0.14785727858543396, -0.13528236746788025, -0.12270745635032654, -0.11013253778219223, -0.09755761921405792, -0.08498270809650421, -0.0724077895283699, -0.059832874685525894, -0.047257959842681885, -0.03468304127454758, -0.022108126431703568, -0.009533211588859558, 0.0030417069792747498, 0.01561661809682846, 0.02819153666496277, 0.04076645150780678, 0.05334136635065079, 0.0659162849187851, 0.0784911960363388, 0.09106611460447311, 0.10364103317260742, 0.11621594429016113, 0.12879085540771484, 0.14136576652526855, 0.15394069254398346, 0.16651560366153717, 0.17909051477909088, 0.1916654407978058, 0.2042403519153595, 0.2168152630329132, 0.2293901890516281, 0.24196510016918182, 0.25454002618789673, 0.26711493730545044, 0.27968984842300415, 0.29226475954055786, 0.3048396706581116, 0.3174145817756653, 0.3299895226955414, 0.3425644338130951, 0.3551393449306488, 0.3677142858505249, 0.3802891969680786, 0.3928641080856323, 0.40543901920318604, 0.41801393032073975, 0.43058884143829346]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 11.0, 17.0, 15.0, 20.0, 25.0, 43.0, 52.0, 79.0, 150.0, 172.0, 317.0, 473.0, 802.0, 1399.0, 2615.0, 5560.0, 13004.0, 32638.0, 87229.0, 214239.0, 469599.0, 866516.0, 1091776.0, 749619.0, 385070.0, 165821.0, 63622.0, 23994.0, 9838.0, 4364.0, 2165.0, 1172.0, 678.0, 400.0, 300.0, 166.0, 103.0, 79.0, 43.0, 35.0, 25.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.6259765625, -0.6077499389648438, -0.5895233154296875, -0.5712966918945312, -0.553070068359375, -0.5348434448242188, -0.5166168212890625, -0.49839019775390625, -0.48016357421875, -0.46193695068359375, -0.4437103271484375, -0.42548370361328125, -0.407257080078125, -0.38903045654296875, -0.3708038330078125, -0.35257720947265625, -0.3343505859375, -0.31612396240234375, -0.2978973388671875, -0.27967071533203125, -0.261444091796875, -0.24321746826171875, -0.2249908447265625, -0.20676422119140625, -0.18853759765625, -0.17031097412109375, -0.1520843505859375, -0.13385772705078125, -0.115631103515625, -0.09740447998046875, -0.0791778564453125, -0.06095123291015625, -0.042724609375, -0.02449798583984375, -0.0062713623046875, 0.01195526123046875, 0.030181884765625, 0.04840850830078125, 0.0666351318359375, 0.08486175537109375, 0.10308837890625, 0.12131500244140625, 0.1395416259765625, 0.15776824951171875, 0.175994873046875, 0.19422149658203125, 0.2124481201171875, 0.23067474365234375, 0.2489013671875, 0.26712799072265625, 0.2853546142578125, 0.30358123779296875, 0.321807861328125, 0.34003448486328125, 0.3582611083984375, 0.37648773193359375, 0.39471435546875, 0.41294097900390625, 0.4311676025390625, 0.44939422607421875, 0.467620849609375, 0.48584747314453125, 0.5040740966796875, 0.5223007202148438, 0.54052734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 13.0, 18.0, 16.0, 16.0, 15.0, 21.0, 23.0, 25.0, 26.0, 37.0, 33.0, 39.0, 32.0, 30.0, 36.0, 32.0, 39.0, 36.0, 20.0, 42.0, 49.0, 31.0, 32.0, 33.0, 32.0, 32.0, 22.0, 34.0, 21.0, 19.0, 12.0, 23.0, 8.0, 8.0, 7.0, 11.0, 8.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.63671875, -0.6169815063476562, -0.5972442626953125, -0.5775070190429688, -0.557769775390625, -0.5380325317382812, -0.5182952880859375, -0.49855804443359375, -0.47882080078125, -0.45908355712890625, -0.4393463134765625, -0.41960906982421875, -0.399871826171875, -0.38013458251953125, -0.3603973388671875, -0.34066009521484375, -0.3209228515625, -0.30118560791015625, -0.2814483642578125, -0.26171112060546875, -0.241973876953125, -0.22223663330078125, -0.2024993896484375, -0.18276214599609375, -0.16302490234375, -0.14328765869140625, -0.1235504150390625, -0.10381317138671875, -0.084075927734375, -0.06433868408203125, -0.0446014404296875, -0.02486419677734375, -0.005126953125, 0.01461029052734375, 0.0343475341796875, 0.05408477783203125, 0.073822021484375, 0.09355926513671875, 0.1132965087890625, 0.13303375244140625, 0.15277099609375, 0.17250823974609375, 0.1922454833984375, 0.21198272705078125, 0.231719970703125, 0.25145721435546875, 0.2711944580078125, 0.29093170166015625, 0.3106689453125, 0.33040618896484375, 0.3501434326171875, 0.36988067626953125, 0.389617919921875, 0.40935516357421875, 0.4290924072265625, 0.44882965087890625, 0.46856689453125, 0.48830413818359375, 0.5080413818359375, 0.5277786254882812, 0.547515869140625, 0.5672531127929688, 0.5869903564453125, 0.6067276000976562, 0.62646484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 12.0, 18.0, 43.0, 58.0, 102.0, 144.0, 292.0, 558.0, 3330.0, 4179908.0, 8401.0, 637.0, 295.0, 152.0, 86.0, 81.0, 46.0, 23.0, 14.0, 19.0, 6.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2984619140625, -10.971923828125, -10.6453857421875, -10.31884765625, -9.9923095703125, -9.665771484375, -9.3392333984375, -9.0126953125, -8.6861572265625, -8.359619140625, -8.0330810546875, -7.70654296875, -7.3800048828125, -7.053466796875, -6.7269287109375, -6.400390625, -6.0738525390625, -5.747314453125, -5.4207763671875, -5.09423828125, -4.7677001953125, -4.441162109375, -4.1146240234375, -3.7880859375, -3.4615478515625, -3.135009765625, -2.8084716796875, -2.48193359375, -2.1553955078125, -1.828857421875, -1.5023193359375, -1.17578125, -0.8492431640625, -0.522705078125, -0.1961669921875, 0.13037109375, 0.4569091796875, 0.783447265625, 1.1099853515625, 1.4365234375, 1.7630615234375, 2.089599609375, 2.4161376953125, 2.74267578125, 3.0692138671875, 3.395751953125, 3.7222900390625, 4.048828125, 4.3753662109375, 4.701904296875, 5.0284423828125, 5.35498046875, 5.6815185546875, 6.008056640625, 6.3345947265625, 6.6611328125, 6.9876708984375, 7.314208984375, 7.6407470703125, 7.96728515625, 8.2938232421875, 8.620361328125, 8.9468994140625, 9.2734375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 12.0, 10.0, 18.0, 21.0, 41.0, 78.0, 106.0, 162.0, 272.0, 403.0, 629.0, 800.0, 555.0, 352.0, 197.0, 135.0, 89.0, 62.0, 36.0, 30.0, 17.0, 8.0, 6.0, 6.0, 7.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.494140625, -0.48091888427734375, -0.4676971435546875, -0.45447540283203125, -0.441253662109375, -0.42803192138671875, -0.4148101806640625, -0.40158843994140625, -0.38836669921875, -0.37514495849609375, -0.3619232177734375, -0.34870147705078125, -0.335479736328125, -0.32225799560546875, -0.3090362548828125, -0.29581451416015625, -0.2825927734375, -0.26937103271484375, -0.2561492919921875, -0.24292755126953125, -0.229705810546875, -0.21648406982421875, -0.2032623291015625, -0.19004058837890625, -0.17681884765625, -0.16359710693359375, -0.1503753662109375, -0.13715362548828125, -0.123931884765625, -0.11071014404296875, -0.0974884033203125, -0.08426666259765625, -0.071044921875, -0.05782318115234375, -0.0446014404296875, -0.03137969970703125, -0.018157958984375, -0.00493621826171875, 0.0082855224609375, 0.02150726318359375, 0.03472900390625, 0.04795074462890625, 0.0611724853515625, 0.07439422607421875, 0.087615966796875, 0.10083770751953125, 0.1140594482421875, 0.12728118896484375, 0.1405029296875, 0.15372467041015625, 0.1669464111328125, 0.18016815185546875, 0.193389892578125, 0.20661163330078125, 0.2198333740234375, 0.23305511474609375, 0.24627685546875, 0.25949859619140625, 0.2727203369140625, 0.28594207763671875, 0.299163818359375, 0.31238555908203125, 0.3256072998046875, 0.33882904052734375, 0.35205078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 15.0, 13.0, 21.0, 18.0, 27.0, 39.0, 36.0, 63.0, 62.0, 80.0, 80.0, 108.0, 79.0, 71.0, 80.0, 66.0, 41.0, 24.0, 29.0, 15.0, 14.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1213198900222778, -1.0827076435089111, -1.0440953969955444, -1.0054831504821777, -0.9668708443641663, -0.9282585978507996, -0.8896462917327881, -0.8510340452194214, -0.8124217987060547, -0.773809552192688, -0.7351973056793213, -0.6965849995613098, -0.6579727530479431, -0.6193605065345764, -0.5807482004165649, -0.5421359539031982, -0.5035237073898315, -0.46491146087646484, -0.42629918456077576, -0.38768690824508667, -0.34907466173171997, -0.31046241521835327, -0.2718501389026642, -0.2332378625869751, -0.1946256160736084, -0.1560133546590805, -0.11740109324455261, -0.07878883183002472, -0.040176570415496826, -0.001564309000968933, 0.03704795241355896, 0.07566022872924805, 0.11427247524261475, 0.15288473665714264, 0.19149699807167053, 0.23010925948619843, 0.2687215209007263, 0.307333767414093, 0.3459460437297821, 0.3845583200454712, 0.4231705665588379, 0.4617828130722046, 0.5003950595855713, 0.5390073657035828, 0.5776196122169495, 0.6162318587303162, 0.6548441648483276, 0.6934564113616943, 0.732068657875061, 0.7706809043884277, 0.8092931509017944, 0.8479054570198059, 0.8865177035331726, 0.9251299500465393, 0.9637422561645508, 1.0023545026779175, 1.0409667491912842, 1.0795789957046509, 1.1181912422180176, 1.1568034887313843, 1.195415735244751, 1.2340281009674072, 1.272640347480774, 1.3112525939941406, 1.3498648405075073]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 1.0, 5.0, 8.0, 6.0, 6.0, 14.0, 8.0, 13.0, 16.0, 21.0, 16.0, 28.0, 18.0, 34.0, 24.0, 28.0, 18.0, 41.0, 33.0, 39.0, 41.0, 43.0, 44.0, 32.0, 52.0, 40.0, 40.0, 38.0, 31.0, 26.0, 34.0, 25.0, 25.0, 19.0, 20.0, 23.0, 14.0, 13.0, 17.0, 11.0, 4.0, 4.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.6490494012832642, -0.6292263269424438, -0.6094032526016235, -0.589580237865448, -0.5697571635246277, -0.5499340891838074, -0.5301110148429871, -0.5102879405021667, -0.4904648959636688, -0.4706418216228485, -0.4508187770843506, -0.4309957027435303, -0.41117262840270996, -0.39134958386421204, -0.3715265095233917, -0.3517034649848938, -0.3318803906440735, -0.3120573163032532, -0.29223427176475525, -0.27241119742393494, -0.252588152885437, -0.2327650785446167, -0.2129420042037964, -0.19311894476413727, -0.17329588532447815, -0.15347282588481903, -0.1336497664451599, -0.1138266921043396, -0.09400363266468048, -0.07418057322502136, -0.05435750633478165, -0.03453443944454193, -0.014711320400238037, 0.00511174276471138, 0.024934805929660797, 0.044757869094610214, 0.06458093225955963, 0.08440399169921875, 0.10422705858945847, 0.12405012547969818, 0.1438731849193573, 0.16369624435901642, 0.18351930379867554, 0.20334237813949585, 0.22316543757915497, 0.2429884970188141, 0.2628115713596344, 0.2826346158981323, 0.30245769023895264, 0.32228076457977295, 0.3421038091182709, 0.3619268834590912, 0.3817499279975891, 0.4015730023384094, 0.42139607667922974, 0.44121915102005005, 0.461042195558548, 0.4808652698993683, 0.5006883144378662, 0.5205113887786865, 0.5403344631195068, 0.5601575374603271, 0.5799805521965027, 0.599803626537323, 0.6196267008781433]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 5.0, 6.0, 16.0, 17.0, 34.0, 56.0, 82.0, 109.0, 150.0, 230.0, 293.0, 429.0, 725.0, 1071.0, 1588.0, 2515.0, 4005.0, 6923.0, 12096.0, 21245.0, 39414.0, 74440.0, 136281.0, 217572.0, 218907.0, 139765.0, 76786.0, 40679.0, 22281.0, 12192.0, 7081.0, 4086.0, 2526.0, 1606.0, 1116.0, 753.0, 460.0, 318.0, 236.0, 140.0, 100.0, 87.0, 41.0, 21.0, 16.0, 17.0, 13.0, 4.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1796875, -0.17407608032226562, -0.16846466064453125, -0.16285324096679688, -0.1572418212890625, -0.15163040161132812, -0.14601898193359375, -0.14040756225585938, -0.134796142578125, -0.12918472290039062, -0.12357330322265625, -0.11796188354492188, -0.1123504638671875, -0.10673904418945312, -0.10112762451171875, -0.09551620483398438, -0.08990478515625, -0.08429336547851562, -0.07868194580078125, -0.07307052612304688, -0.0674591064453125, -0.061847686767578125, -0.05623626708984375, -0.050624847412109375, -0.045013427734375, -0.039402008056640625, -0.03379058837890625, -0.028179168701171875, -0.0225677490234375, -0.016956329345703125, -0.01134490966796875, -0.005733489990234375, -0.0001220703125, 0.005489349365234375, 0.01110076904296875, 0.016712188720703125, 0.0223236083984375, 0.027935028076171875, 0.03354644775390625, 0.039157867431640625, 0.044769287109375, 0.050380706787109375, 0.05599212646484375, 0.061603546142578125, 0.0672149658203125, 0.07282638549804688, 0.07843780517578125, 0.08404922485351562, 0.08966064453125, 0.09527206420898438, 0.10088348388671875, 0.10649490356445312, 0.1121063232421875, 0.11771774291992188, 0.12332916259765625, 0.12894058227539062, 0.134552001953125, 0.14016342163085938, 0.14577484130859375, 0.15138626098632812, 0.1569976806640625, 0.16260910034179688, 0.16822052001953125, 0.17383193969726562, 0.179443359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 3.0, 14.0, 8.0, 10.0, 8.0, 21.0, 16.0, 22.0, 25.0, 35.0, 24.0, 33.0, 26.0, 42.0, 41.0, 39.0, 41.0, 55.0, 54.0, 43.0, 42.0, 43.0, 35.0, 40.0, 33.0, 41.0, 30.0, 28.0, 25.0, 12.0, 20.0, 11.0, 21.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.59765625, -0.5807571411132812, -0.5638580322265625, -0.5469589233398438, -0.530059814453125, -0.5131607055664062, -0.4962615966796875, -0.47936248779296875, -0.46246337890625, -0.44556427001953125, -0.4286651611328125, -0.41176605224609375, -0.394866943359375, -0.37796783447265625, -0.3610687255859375, -0.34416961669921875, -0.3272705078125, -0.31037139892578125, -0.2934722900390625, -0.27657318115234375, -0.259674072265625, -0.24277496337890625, -0.2258758544921875, -0.20897674560546875, -0.19207763671875, -0.17517852783203125, -0.1582794189453125, -0.14138031005859375, -0.124481201171875, -0.10758209228515625, -0.0906829833984375, -0.07378387451171875, -0.056884765625, -0.03998565673828125, -0.0230865478515625, -0.00618743896484375, 0.010711669921875, 0.02761077880859375, 0.0445098876953125, 0.06140899658203125, 0.07830810546875, 0.09520721435546875, 0.1121063232421875, 0.12900543212890625, 0.145904541015625, 0.16280364990234375, 0.1797027587890625, 0.19660186767578125, 0.2135009765625, 0.23040008544921875, 0.2472991943359375, 0.26419830322265625, 0.281097412109375, 0.29799652099609375, 0.3148956298828125, 0.33179473876953125, 0.34869384765625, 0.36559295654296875, 0.3824920654296875, 0.39939117431640625, 0.416290283203125, 0.43318939208984375, 0.4500885009765625, 0.46698760986328125, 0.48388671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 4.0, 12.0, 7.0, 15.0, 27.0, 38.0, 60.0, 87.0, 148.0, 239.0, 406.0, 745.0, 1670.0, 4030.0, 11500.0, 39524.0, 177753.0, 507956.0, 231393.0, 50222.0, 14057.0, 4735.0, 1959.0, 860.0, 462.0, 215.0, 154.0, 90.0, 45.0, 41.0, 32.0, 26.0, 10.0, 9.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.50634765625, -0.49170684814453125, -0.4770660400390625, -0.46242523193359375, -0.447784423828125, -0.43314361572265625, -0.4185028076171875, -0.40386199951171875, -0.38922119140625, -0.37458038330078125, -0.3599395751953125, -0.34529876708984375, -0.330657958984375, -0.31601715087890625, -0.3013763427734375, -0.28673553466796875, -0.2720947265625, -0.25745391845703125, -0.2428131103515625, -0.22817230224609375, -0.213531494140625, -0.19889068603515625, -0.1842498779296875, -0.16960906982421875, -0.15496826171875, -0.14032745361328125, -0.1256866455078125, -0.11104583740234375, -0.096405029296875, -0.08176422119140625, -0.0671234130859375, -0.05248260498046875, -0.037841796875, -0.02320098876953125, -0.0085601806640625, 0.00608062744140625, 0.020721435546875, 0.03536224365234375, 0.0500030517578125, 0.06464385986328125, 0.07928466796875, 0.09392547607421875, 0.1085662841796875, 0.12320709228515625, 0.137847900390625, 0.15248870849609375, 0.1671295166015625, 0.18177032470703125, 0.1964111328125, 0.21105194091796875, 0.2256927490234375, 0.24033355712890625, 0.254974365234375, 0.26961517333984375, 0.2842559814453125, 0.29889678955078125, 0.31353759765625, 0.32817840576171875, 0.3428192138671875, 0.35746002197265625, 0.372100830078125, 0.38674163818359375, 0.4013824462890625, 0.41602325439453125, 0.4306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 10.0, 14.0, 13.0, 19.0, 23.0, 29.0, 22.0, 26.0, 29.0, 28.0, 40.0, 43.0, 38.0, 45.0, 51.0, 43.0, 37.0, 43.0, 41.0, 40.0, 46.0, 31.0, 28.0, 49.0, 39.0, 23.0, 21.0, 17.0, 17.0, 12.0, 15.0, 15.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09613037109375, -1.0614013671875, -1.02667236328125, -0.991943359375, -0.95721435546875, -0.9224853515625, -0.88775634765625, -0.85302734375, -0.81829833984375, -0.7835693359375, -0.74884033203125, -0.714111328125, -0.67938232421875, -0.6446533203125, -0.60992431640625, -0.5751953125, -0.54046630859375, -0.5057373046875, -0.47100830078125, -0.436279296875, -0.40155029296875, -0.3668212890625, -0.33209228515625, -0.29736328125, -0.26263427734375, -0.2279052734375, -0.19317626953125, -0.158447265625, -0.12371826171875, -0.0889892578125, -0.05426025390625, -0.01953125, 0.01519775390625, 0.0499267578125, 0.08465576171875, 0.119384765625, 0.15411376953125, 0.1888427734375, 0.22357177734375, 0.25830078125, 0.29302978515625, 0.3277587890625, 0.36248779296875, 0.397216796875, 0.43194580078125, 0.4666748046875, 0.50140380859375, 0.5361328125, 0.57086181640625, 0.6055908203125, 0.64031982421875, 0.675048828125, 0.70977783203125, 0.7445068359375, 0.77923583984375, 0.81396484375, 0.84869384765625, 0.8834228515625, 0.91815185546875, 0.952880859375, 0.98760986328125, 1.0223388671875, 1.05706787109375, 1.091796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 6.0, 13.0, 13.0, 38.0, 59.0, 62.0, 89.0, 143.0, 276.0, 435.0, 895.0, 1504.0, 3869.0, 11100.0, 54077.0, 558284.0, 367872.0, 35222.0, 8386.0, 3085.0, 1400.0, 705.0, 383.0, 237.0, 140.0, 88.0, 45.0, 34.0, 21.0, 21.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.237060546875, -0.2285614013671875, -0.220062255859375, -0.2115631103515625, -0.20306396484375, -0.1945648193359375, -0.186065673828125, -0.1775665283203125, -0.1690673828125, -0.1605682373046875, -0.152069091796875, -0.1435699462890625, -0.13507080078125, -0.1265716552734375, -0.118072509765625, -0.1095733642578125, -0.10107421875, -0.0925750732421875, -0.084075927734375, -0.0755767822265625, -0.06707763671875, -0.0585784912109375, -0.050079345703125, -0.0415802001953125, -0.0330810546875, -0.0245819091796875, -0.016082763671875, -0.0075836181640625, 0.00091552734375, 0.0094146728515625, 0.017913818359375, 0.0264129638671875, 0.034912109375, 0.0434112548828125, 0.051910400390625, 0.0604095458984375, 0.06890869140625, 0.0774078369140625, 0.085906982421875, 0.0944061279296875, 0.1029052734375, 0.1114044189453125, 0.119903564453125, 0.1284027099609375, 0.13690185546875, 0.1454010009765625, 0.153900146484375, 0.1623992919921875, 0.1708984375, 0.1793975830078125, 0.187896728515625, 0.1963958740234375, 0.20489501953125, 0.2133941650390625, 0.221893310546875, 0.2303924560546875, 0.2388916015625, 0.2473907470703125, 0.255889892578125, 0.2643890380859375, 0.27288818359375, 0.2813873291015625, 0.289886474609375, 0.2983856201171875, 0.306884765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 6.0, 11.0, 16.0, 37.0, 50.0, 75.0, 143.0, 187.0, 163.0, 105.0, 72.0, 45.0, 36.0, 19.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001310110092163086, -0.0001268964260816574, -0.00012278184294700623, -0.00011866725981235504, -0.00011455267667770386, -0.00011043809354305267, -0.00010632351040840149, -0.0001022089272737503, -9.809434413909912e-05, -9.397976100444794e-05, -8.986517786979675e-05, -8.575059473514557e-05, -8.163601160049438e-05, -7.75214284658432e-05, -7.340684533119202e-05, -6.929226219654083e-05, -6.517767906188965e-05, -6.106309592723846e-05, -5.694851279258728e-05, -5.2833929657936096e-05, -4.871934652328491e-05, -4.460476338863373e-05, -4.0490180253982544e-05, -3.637559711933136e-05, -3.2261013984680176e-05, -2.8146430850028992e-05, -2.4031847715377808e-05, -1.9917264580726624e-05, -1.580268144607544e-05, -1.1688098311424255e-05, -7.573515176773071e-06, -3.458932042121887e-06, 6.556510925292969e-07, 4.770234227180481e-06, 8.884817361831665e-06, 1.2999400496482849e-05, 1.7113983631134033e-05, 2.1228566765785217e-05, 2.53431499004364e-05, 2.9457733035087585e-05, 3.357231616973877e-05, 3.7686899304389954e-05, 4.180148243904114e-05, 4.591606557369232e-05, 5.0030648708343506e-05, 5.414523184299469e-05, 5.8259814977645874e-05, 6.237439811229706e-05, 6.648898124694824e-05, 7.060356438159943e-05, 7.471814751625061e-05, 7.88327306509018e-05, 8.294731378555298e-05, 8.706189692020416e-05, 9.117648005485535e-05, 9.529106318950653e-05, 9.940564632415771e-05, 0.0001035202294588089, 0.00010763481259346008, 0.00011174939572811127, 0.00011586397886276245, 0.00011997856199741364, 0.00012409314513206482, 0.000128207728266716, 0.0001323223114013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 2.0, 7.0, 5.0, 4.0, 18.0, 4.0, 16.0, 31.0, 48.0, 80.0, 134.0, 466.0, 2553.0, 29771.0, 938810.0, 71471.0, 3977.0, 693.0, 220.0, 96.0, 35.0, 30.0, 21.0, 12.0, 15.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.68603515625, -0.6667709350585938, -0.6475067138671875, -0.6282424926757812, -0.608978271484375, -0.5897140502929688, -0.5704498291015625, -0.5511856079101562, -0.53192138671875, -0.5126571655273438, -0.4933929443359375, -0.47412872314453125, -0.454864501953125, -0.43560028076171875, -0.4163360595703125, -0.39707183837890625, -0.3778076171875, -0.35854339599609375, -0.3392791748046875, -0.32001495361328125, -0.300750732421875, -0.28148651123046875, -0.2622222900390625, -0.24295806884765625, -0.22369384765625, -0.20442962646484375, -0.1851654052734375, -0.16590118408203125, -0.146636962890625, -0.12737274169921875, -0.1081085205078125, -0.08884429931640625, -0.069580078125, -0.05031585693359375, -0.0310516357421875, -0.01178741455078125, 0.007476806640625, 0.02674102783203125, 0.0460052490234375, 0.06526947021484375, 0.08453369140625, 0.10379791259765625, 0.1230621337890625, 0.14232635498046875, 0.161590576171875, 0.18085479736328125, 0.2001190185546875, 0.21938323974609375, 0.2386474609375, 0.25791168212890625, 0.2771759033203125, 0.29644012451171875, 0.315704345703125, 0.33496856689453125, 0.3542327880859375, 0.37349700927734375, 0.39276123046875, 0.41202545166015625, 0.4312896728515625, 0.45055389404296875, 0.469818115234375, 0.48908233642578125, 0.5083465576171875, 0.5276107788085938, 0.546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 10.0, 15.0, 28.0, 42.0, 55.0, 99.0, 122.0, 132.0, 151.0, 103.0, 74.0, 47.0, 35.0, 17.0, 17.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08563899993896484, -0.08302116394042969, -0.08040332794189453, -0.07778549194335938, -0.07516765594482422, -0.07254981994628906, -0.0699319839477539, -0.06731414794921875, -0.0646963119506836, -0.06207847595214844, -0.05946063995361328, -0.056842803955078125, -0.05422496795654297, -0.05160713195800781, -0.048989295959472656, -0.0463714599609375, -0.043753623962402344, -0.04113578796386719, -0.03851795196533203, -0.035900115966796875, -0.03328227996826172, -0.030664443969726562, -0.028046607971191406, -0.02542877197265625, -0.022810935974121094, -0.020193099975585938, -0.01757526397705078, -0.014957427978515625, -0.012339591979980469, -0.009721755981445312, -0.007103919982910156, -0.004486083984375, -0.0018682479858398438, 0.0007495880126953125, 0.0033674240112304688, 0.005985260009765625, 0.008603096008300781, 0.011220932006835938, 0.013838768005371094, 0.01645660400390625, 0.019074440002441406, 0.021692276000976562, 0.02431011199951172, 0.026927947998046875, 0.02954578399658203, 0.03216361999511719, 0.034781455993652344, 0.0373992919921875, 0.040017127990722656, 0.04263496398925781, 0.04525279998779297, 0.047870635986328125, 0.05048847198486328, 0.05310630798339844, 0.055724143981933594, 0.05834197998046875, 0.060959815979003906, 0.06357765197753906, 0.06619548797607422, 0.06881332397460938, 0.07143115997314453, 0.07404899597167969, 0.07666683197021484, 0.07928466796875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 13.0, 23.0, 37.0, 55.0, 68.0, 113.0, 131.0, 131.0, 138.0, 94.0, 69.0, 52.0, 33.0, 15.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1161253452301025, -2.0722553730010986, -2.028385639190674, -1.9845157861709595, -1.9406459331512451, -1.8967760801315308, -1.8529062271118164, -1.809036374092102, -1.7651665210723877, -1.7212966680526733, -1.677426815032959, -1.6335569620132446, -1.5896871089935303, -1.545817255973816, -1.5019474029541016, -1.4580775499343872, -1.4142076969146729, -1.3703378438949585, -1.3264679908752441, -1.2825981378555298, -1.2387282848358154, -1.194858431816101, -1.1509885787963867, -1.1071187257766724, -1.0632487535476685, -1.019378900527954, -0.9755090475082397, -0.9316391944885254, -0.887769341468811, -0.8438994884490967, -0.8000296354293823, -0.756159782409668, -0.7122898697853088, -0.6684200167655945, -0.6245501637458801, -0.5806803107261658, -0.5368104577064514, -0.49294060468673706, -0.4490707218647003, -0.40520086884498596, -0.3613310158252716, -0.31746116280555725, -0.2735913097858429, -0.22972144186496735, -0.185851588845253, -0.14198173582553864, -0.09811186790466309, -0.05424201488494873, -0.010372161865234375, 0.03349769487977028, 0.07736755162477493, 0.12123741209506989, 0.16510726511478424, 0.2089771181344986, 0.25284698605537415, 0.2967168390750885, 0.34058669209480286, 0.3844565451145172, 0.42832639813423157, 0.4721962809562683, 0.5160661339759827, 0.559935986995697, 0.6038058400154114, 0.6476756930351257, 0.6915455460548401]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 1.0, 7.0, 5.0, 11.0, 10.0, 13.0, 14.0, 22.0, 19.0, 22.0, 22.0, 31.0, 23.0, 29.0, 28.0, 38.0, 36.0, 42.0, 42.0, 44.0, 35.0, 43.0, 46.0, 41.0, 37.0, 36.0, 37.0, 46.0, 27.0, 19.0, 26.0, 26.0, 18.0, 21.0, 16.0, 12.0, 7.0, 17.0, 6.0, 5.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5063486099243164, -0.4902411103248596, -0.47413361072540283, -0.45802611112594604, -0.44191861152648926, -0.42581111192703247, -0.4097035825252533, -0.3935960829257965, -0.3774885833263397, -0.36138108372688293, -0.34527358412742615, -0.32916608452796936, -0.3130585551261902, -0.2969510555267334, -0.2808435559272766, -0.2647360563278198, -0.24862855672836304, -0.23252105712890625, -0.21641355752944946, -0.20030604302883148, -0.1841985434293747, -0.1680910438299179, -0.15198352932929993, -0.13587602972984314, -0.11976853013038635, -0.10366103053092957, -0.08755352348089218, -0.0714460164308548, -0.05533851683139801, -0.03923101723194122, -0.02312351018190384, -0.007016003131866455, 0.009091496467590332, 0.025198999792337418, 0.0413065031170845, 0.05741400644183159, 0.07352150976657867, 0.08962900936603546, 0.10573651641607285, 0.12184402346611023, 0.13795152306556702, 0.1540590226650238, 0.1701665222644806, 0.18627403676509857, 0.20238153636455536, 0.21848903596401215, 0.23459655046463013, 0.2507040500640869, 0.2668115496635437, 0.2829190492630005, 0.2990265488624573, 0.31513404846191406, 0.33124154806137085, 0.34734904766082764, 0.3634565770626068, 0.3795640766620636, 0.3956715762615204, 0.4117790758609772, 0.42788657546043396, 0.44399407505989075, 0.4601016044616699, 0.4762091040611267, 0.4923166036605835, 0.5084241032600403, 0.5245316028594971]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 17.0, 23.0, 34.0, 69.0, 96.0, 123.0, 242.0, 424.0, 755.0, 1404.0, 2570.0, 5296.0, 11480.0, 26396.0, 62826.0, 140445.0, 248867.0, 262852.0, 156903.0, 71702.0, 30284.0, 13180.0, 6096.0, 2974.0, 1542.0, 788.0, 445.0, 258.0, 155.0, 109.0, 59.0, 46.0, 21.0, 15.0, 10.0, 12.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2737083435058594, -0.26543426513671875, -0.2571601867675781, -0.2488861083984375, -0.24061203002929688, -0.23233795166015625, -0.22406387329101562, -0.215789794921875, -0.20751571655273438, -0.19924163818359375, -0.19096755981445312, -0.1826934814453125, -0.17441940307617188, -0.16614532470703125, -0.15787124633789062, -0.14959716796875, -0.14132308959960938, -0.13304901123046875, -0.12477493286132812, -0.1165008544921875, -0.10822677612304688, -0.09995269775390625, -0.09167861938476562, -0.083404541015625, -0.07513046264648438, -0.06685638427734375, -0.058582305908203125, -0.0503082275390625, -0.042034149169921875, -0.03376007080078125, -0.025485992431640625, -0.0172119140625, -0.008937835693359375, -0.00066375732421875, 0.007610321044921875, 0.0158843994140625, 0.024158477783203125, 0.03243255615234375, 0.040706634521484375, 0.048980712890625, 0.057254791259765625, 0.06552886962890625, 0.07380294799804688, 0.0820770263671875, 0.09035110473632812, 0.09862518310546875, 0.10689926147460938, 0.11517333984375, 0.12344741821289062, 0.13172149658203125, 0.13999557495117188, 0.1482696533203125, 0.15654373168945312, 0.16481781005859375, 0.17309188842773438, 0.181365966796875, 0.18964004516601562, 0.19791412353515625, 0.20618820190429688, 0.2144622802734375, 0.22273635864257812, 0.23101043701171875, 0.23928451538085938, 0.24755859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 7.0, 13.0, 10.0, 13.0, 13.0, 13.0, 15.0, 12.0, 18.0, 20.0, 25.0, 23.0, 23.0, 36.0, 34.0, 38.0, 33.0, 55.0, 45.0, 39.0, 44.0, 40.0, 33.0, 39.0, 49.0, 32.0, 38.0, 28.0, 21.0, 32.0, 22.0, 16.0, 22.0, 22.0, 18.0, 9.0, 12.0, 5.0, 3.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.619140625, -2.524749755859375, -2.43035888671875, -2.335968017578125, -2.2415771484375, -2.147186279296875, -2.05279541015625, -1.958404541015625, -1.864013671875, -1.769622802734375, -1.67523193359375, -1.580841064453125, -1.4864501953125, -1.392059326171875, -1.29766845703125, -1.203277587890625, -1.10888671875, -1.014495849609375, -0.92010498046875, -0.825714111328125, -0.7313232421875, -0.636932373046875, -0.54254150390625, -0.448150634765625, -0.353759765625, -0.259368896484375, -0.16497802734375, -0.070587158203125, 0.0238037109375, 0.118194580078125, 0.21258544921875, 0.306976318359375, 0.4013671875, 0.495758056640625, 0.59014892578125, 0.684539794921875, 0.7789306640625, 0.873321533203125, 0.96771240234375, 1.062103271484375, 1.156494140625, 1.250885009765625, 1.34527587890625, 1.439666748046875, 1.5340576171875, 1.628448486328125, 1.72283935546875, 1.817230224609375, 1.91162109375, 2.006011962890625, 2.10040283203125, 2.194793701171875, 2.2891845703125, 2.383575439453125, 2.47796630859375, 2.572357177734375, 2.666748046875, 2.761138916015625, 2.85552978515625, 2.949920654296875, 3.0443115234375, 3.138702392578125, 3.23309326171875, 3.327484130859375, 3.421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 11.0, 12.0, 19.0, 20.0, 31.0, 46.0, 52.0, 63.0, 73.0, 106.0, 159.0, 231.0, 355.0, 637.0, 2038.0, 42602.0, 887529.0, 109221.0, 3220.0, 783.0, 408.0, 236.0, 162.0, 114.0, 108.0, 66.0, 48.0, 45.0, 48.0, 18.0, 25.0, 18.0, 13.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.425994873046875, -1.38226318359375, -1.338531494140625, -1.2947998046875, -1.251068115234375, -1.20733642578125, -1.163604736328125, -1.119873046875, -1.076141357421875, -1.03240966796875, -0.988677978515625, -0.9449462890625, -0.901214599609375, -0.85748291015625, -0.813751220703125, -0.77001953125, -0.726287841796875, -0.68255615234375, -0.638824462890625, -0.5950927734375, -0.551361083984375, -0.50762939453125, -0.463897705078125, -0.420166015625, -0.376434326171875, -0.33270263671875, -0.288970947265625, -0.2452392578125, -0.201507568359375, -0.15777587890625, -0.114044189453125, -0.0703125, -0.026580810546875, 0.01715087890625, 0.060882568359375, 0.1046142578125, 0.148345947265625, 0.19207763671875, 0.235809326171875, 0.279541015625, 0.323272705078125, 0.36700439453125, 0.410736083984375, 0.4544677734375, 0.498199462890625, 0.54193115234375, 0.585662841796875, 0.62939453125, 0.673126220703125, 0.71685791015625, 0.760589599609375, 0.8043212890625, 0.848052978515625, 0.89178466796875, 0.935516357421875, 0.979248046875, 1.022979736328125, 1.06671142578125, 1.110443115234375, 1.1541748046875, 1.197906494140625, 1.24163818359375, 1.285369873046875, 1.3291015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 8.0, 18.0, 23.0, 22.0, 21.0, 21.0, 31.0, 39.0, 32.0, 49.0, 53.0, 51.0, 76.0, 48.0, 40.0, 66.0, 61.0, 53.0, 48.0, 33.0, 36.0, 33.0, 23.0, 15.0, 20.0, 19.0, 6.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.8067626953125, -3.689697265625, -3.5726318359375, -3.45556640625, -3.3385009765625, -3.221435546875, -3.1043701171875, -2.9873046875, -2.8702392578125, -2.753173828125, -2.6361083984375, -2.51904296875, -2.4019775390625, -2.284912109375, -2.1678466796875, -2.05078125, -1.9337158203125, -1.816650390625, -1.6995849609375, -1.58251953125, -1.4654541015625, -1.348388671875, -1.2313232421875, -1.1142578125, -0.9971923828125, -0.880126953125, -0.7630615234375, -0.64599609375, -0.5289306640625, -0.411865234375, -0.2947998046875, -0.177734375, -0.0606689453125, 0.056396484375, 0.1734619140625, 0.29052734375, 0.4075927734375, 0.524658203125, 0.6417236328125, 0.7587890625, 0.8758544921875, 0.992919921875, 1.1099853515625, 1.22705078125, 1.3441162109375, 1.461181640625, 1.5782470703125, 1.6953125, 1.8123779296875, 1.929443359375, 2.0465087890625, 2.16357421875, 2.2806396484375, 2.397705078125, 2.5147705078125, 2.6318359375, 2.7489013671875, 2.865966796875, 2.9830322265625, 3.10009765625, 3.2171630859375, 3.334228515625, 3.4512939453125, 3.568359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 17.0, 39.0, 58.0, 189.0, 876.0, 22212.0, 1019943.0, 4556.0, 410.0, 117.0, 58.0, 27.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.23828125, -1.2115440368652344, -1.1848068237304688, -1.1580696105957031, -1.1313323974609375, -1.1045951843261719, -1.0778579711914062, -1.0511207580566406, -1.024383544921875, -0.9976463317871094, -0.9709091186523438, -0.9441719055175781, -0.9174346923828125, -0.8906974792480469, -0.8639602661132812, -0.8372230529785156, -0.81048583984375, -0.7837486267089844, -0.7570114135742188, -0.7302742004394531, -0.7035369873046875, -0.6767997741699219, -0.6500625610351562, -0.6233253479003906, -0.596588134765625, -0.5698509216308594, -0.5431137084960938, -0.5163764953613281, -0.4896392822265625, -0.4629020690917969, -0.43616485595703125, -0.4094276428222656, -0.3826904296875, -0.3559532165527344, -0.32921600341796875, -0.3024787902832031, -0.2757415771484375, -0.24900436401367188, -0.22226715087890625, -0.19552993774414062, -0.168792724609375, -0.14205551147460938, -0.11531829833984375, -0.08858108520507812, -0.0618438720703125, -0.035106658935546875, -0.00836944580078125, 0.018367767333984375, 0.04510498046875, 0.07184219360351562, 0.09857940673828125, 0.12531661987304688, 0.1520538330078125, 0.17879104614257812, 0.20552825927734375, 0.23226547241210938, 0.259002685546875, 0.2857398986816406, 0.31247711181640625, 0.3392143249511719, 0.3659515380859375, 0.3926887512207031, 0.41942596435546875, 0.4461631774902344, 0.472900390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 14.0, 13.0, 24.0, 28.0, 71.0, 127.0, 204.0, 171.0, 135.0, 87.0, 38.0, 29.0, 14.0, 12.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -3.002304583787918e-05, -2.8872862458229065e-05, -2.772267907857895e-05, -2.6572495698928833e-05, -2.5422312319278717e-05, -2.42721289396286e-05, -2.3121945559978485e-05, -2.197176218032837e-05, -2.0821578800678253e-05, -1.9671395421028137e-05, -1.852121204137802e-05, -1.7371028661727905e-05, -1.622084528207779e-05, -1.5070661902427673e-05, -1.3920478522777557e-05, -1.2770295143127441e-05, -1.1620111763477325e-05, -1.046992838382721e-05, -9.319745004177094e-06, -8.169561624526978e-06, -7.0193782448768616e-06, -5.869194865226746e-06, -4.71901148557663e-06, -3.5688281059265137e-06, -2.4186447262763977e-06, -1.2684613466262817e-06, -1.1827796697616577e-07, 1.0319054126739502e-06, 2.182088792324066e-06, 3.332272171974182e-06, 4.482455551624298e-06, 5.632638931274414e-06, 6.78282231092453e-06, 7.933005690574646e-06, 9.083189070224762e-06, 1.0233372449874878e-05, 1.1383555829524994e-05, 1.253373920917511e-05, 1.3683922588825226e-05, 1.4834105968475342e-05, 1.5984289348125458e-05, 1.7134472727775574e-05, 1.828465610742569e-05, 1.9434839487075806e-05, 2.058502286672592e-05, 2.1735206246376038e-05, 2.2885389626026154e-05, 2.403557300567627e-05, 2.5185756385326385e-05, 2.63359397649765e-05, 2.7486123144626617e-05, 2.8636306524276733e-05, 2.978648990392685e-05, 3.0936673283576965e-05, 3.208685666322708e-05, 3.32370400428772e-05, 3.438722342252731e-05, 3.553740680217743e-05, 3.6687590181827545e-05, 3.783777356147766e-05, 3.898795694112778e-05, 4.013814032077789e-05, 4.128832370042801e-05, 4.2438507080078125e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 10.0, 24.0, 47.0, 89.0, 209.0, 579.0, 2250.0, 27613.0, 930038.0, 82672.0, 3665.0, 813.0, 282.0, 141.0, 58.0, 31.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2666015625, -0.256591796875, -0.24658203125, -0.236572265625, -0.2265625, -0.216552734375, -0.20654296875, -0.196533203125, -0.1865234375, -0.176513671875, -0.16650390625, -0.156494140625, -0.146484375, -0.136474609375, -0.12646484375, -0.116455078125, -0.1064453125, -0.096435546875, -0.08642578125, -0.076416015625, -0.06640625, -0.056396484375, -0.04638671875, -0.036376953125, -0.0263671875, -0.016357421875, -0.00634765625, 0.003662109375, 0.013671875, 0.023681640625, 0.03369140625, 0.043701171875, 0.0537109375, 0.063720703125, 0.07373046875, 0.083740234375, 0.09375, 0.103759765625, 0.11376953125, 0.123779296875, 0.1337890625, 0.143798828125, 0.15380859375, 0.163818359375, 0.173828125, 0.183837890625, 0.19384765625, 0.203857421875, 0.2138671875, 0.223876953125, 0.23388671875, 0.243896484375, 0.25390625, 0.263916015625, 0.27392578125, 0.283935546875, 0.2939453125, 0.303955078125, 0.31396484375, 0.323974609375, 0.333984375, 0.343994140625, 0.35400390625, 0.364013671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 10.0, 17.0, 27.0, 41.0, 69.0, 92.0, 161.0, 162.0, 129.0, 90.0, 60.0, 47.0, 33.0, 19.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06624126434326172, -0.06363487243652344, -0.061028480529785156, -0.058422088623046875, -0.055815696716308594, -0.05320930480957031, -0.05060291290283203, -0.04799652099609375, -0.04539012908935547, -0.04278373718261719, -0.040177345275878906, -0.037570953369140625, -0.034964561462402344, -0.03235816955566406, -0.02975177764892578, -0.0271453857421875, -0.02453899383544922, -0.021932601928710938, -0.019326210021972656, -0.016719818115234375, -0.014113426208496094, -0.011507034301757812, -0.008900642395019531, -0.00629425048828125, -0.0036878585815429688, -0.0010814666748046875, 0.0015249252319335938, 0.004131317138671875, 0.006737709045410156, 0.009344100952148438, 0.011950492858886719, 0.014556884765625, 0.01716327667236328, 0.019769668579101562, 0.022376060485839844, 0.024982452392578125, 0.027588844299316406, 0.030195236206054688, 0.03280162811279297, 0.03540802001953125, 0.03801441192626953, 0.04062080383300781, 0.043227195739746094, 0.045833587646484375, 0.048439979553222656, 0.05104637145996094, 0.05365276336669922, 0.0562591552734375, 0.05886554718017578, 0.06147193908691406, 0.06407833099365234, 0.06668472290039062, 0.0692911148071289, 0.07189750671386719, 0.07450389862060547, 0.07711029052734375, 0.07971668243408203, 0.08232307434082031, 0.0849294662475586, 0.08753585815429688, 0.09014225006103516, 0.09274864196777344, 0.09535503387451172, 0.09796142578125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 66.0, 346.0, 456.0, 130.0, 15.0], "bins": [-17.658966064453125, -17.370206832885742, -17.08144760131836, -16.792688369750977, -16.503929138183594, -16.21516990661621, -15.926409721374512, -15.637650489807129, -15.348891258239746, -15.060132026672363, -14.77137279510498, -14.482613563537598, -14.193853378295898, -13.905094146728516, -13.616334915161133, -13.32757568359375, -13.038816452026367, -12.750057220458984, -12.461297988891602, -12.172538757324219, -11.883779525756836, -11.595019340515137, -11.306260108947754, -11.017500877380371, -10.728741645812988, -10.439982414245605, -10.151223182678223, -9.86246395111084, -9.57370376586914, -9.284944534301758, -8.996185302734375, -8.707426071166992, -8.41866683959961, -8.129907608032227, -7.841148376464844, -7.552388668060303, -7.26362943649292, -6.974870204925537, -6.686110496520996, -6.397351264953613, -6.1085920333862305, -5.819832801818848, -5.531073570251465, -5.242313861846924, -4.953554630279541, -4.664795398712158, -4.376035690307617, -4.087276458740234, -3.7985169887542725, -3.5097575187683105, -3.2209982872009277, -2.932239055633545, -2.643479585647583, -2.354720115661621, -2.0659608840942383, -1.7772014141082764, -1.4884421825408936, -1.1996828317642212, -0.9109234809875488, -0.6221641302108765, -0.3334047794342041, -0.04464542865753174, 0.24411392211914062, 0.5328733921051025, 0.8216326236724854]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 5.0, 6.0, 6.0, 6.0, 15.0, 14.0, 12.0, 17.0, 22.0, 20.0, 23.0, 19.0, 34.0, 28.0, 33.0, 47.0, 38.0, 39.0, 36.0, 48.0, 39.0, 38.0, 34.0, 58.0, 37.0, 42.0, 42.0, 34.0, 26.0, 26.0, 20.0, 24.0, 19.0, 9.0, 12.0, 14.0, 11.0, 6.0, 10.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.449974060058594, -4.299516201019287, -4.149057865142822, -3.9986000061035156, -3.84814190864563, -3.697683811187744, -3.5472257137298584, -3.3967676162719727, -3.246309757232666, -3.0958516597747803, -2.9453935623168945, -2.794935703277588, -2.644477605819702, -2.4940195083618164, -2.3435614109039307, -2.193103313446045, -2.042645215988159, -1.8921871185302734, -1.7417291402816772, -1.5912710428237915, -1.4408130645751953, -1.2903549671173096, -1.1398968696594238, -0.9894388914108276, -0.8389807939529419, -0.6885227560997009, -0.53806471824646, -0.3876066207885742, -0.23714858293533325, -0.08669054508209229, 0.06376755237579346, 0.21422553062438965, 0.3646836280822754, 0.5151416659355164, 0.6655997037887573, 0.8160578012466431, 0.966515839099884, 1.116973876953125, 1.2674319744110107, 1.417889952659607, 1.5683480501174927, 1.7188061475753784, 1.8692641258239746, 2.0197222232818604, 2.170180320739746, 2.3206381797790527, 2.4710965156555176, 2.621554374694824, 2.77201247215271, 2.9224705696105957, 3.0729286670684814, 3.223386764526367, 3.373844623565674, 3.5243027210235596, 3.6747608184814453, 3.825218677520752, 3.975677013397217, 4.126134872436523, 4.276593208312988, 4.427051067352295, 4.57750940322876, 4.727967262268066, 4.878425598144531, 5.028883457183838, 5.1793413162231445]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 6.0, 6.0, 15.0, 16.0, 18.0, 29.0, 25.0, 40.0, 40.0, 70.0, 91.0, 247.0, 596.0, 2475.0, 14879.0, 148877.0, 1357820.0, 2232344.0, 393235.0, 35922.0, 5223.0, 1340.0, 440.0, 177.0, 94.0, 65.0, 42.0, 28.0, 22.0, 24.0, 9.0, 9.0, 9.0, 12.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0587310791015625, -1.019805908203125, -0.9808807373046875, -0.94195556640625, -0.9030303955078125, -0.864105224609375, -0.8251800537109375, -0.7862548828125, -0.7473297119140625, -0.708404541015625, -0.6694793701171875, -0.63055419921875, -0.5916290283203125, -0.552703857421875, -0.5137786865234375, -0.474853515625, -0.4359283447265625, -0.397003173828125, -0.3580780029296875, -0.31915283203125, -0.2802276611328125, -0.241302490234375, -0.2023773193359375, -0.1634521484375, -0.1245269775390625, -0.085601806640625, -0.0466766357421875, -0.00775146484375, 0.0311737060546875, 0.070098876953125, 0.1090240478515625, 0.14794921875, 0.1868743896484375, 0.225799560546875, 0.2647247314453125, 0.30364990234375, 0.3425750732421875, 0.381500244140625, 0.4204254150390625, 0.4593505859375, 0.4982757568359375, 0.537200927734375, 0.5761260986328125, 0.61505126953125, 0.6539764404296875, 0.692901611328125, 0.7318267822265625, 0.770751953125, 0.8096771240234375, 0.848602294921875, 0.8875274658203125, 0.92645263671875, 0.9653778076171875, 1.004302978515625, 1.0432281494140625, 1.0821533203125, 1.1210784912109375, 1.160003662109375, 1.1989288330078125, 1.23785400390625, 1.2767791748046875, 1.315704345703125, 1.3546295166015625, 1.3935546875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 3.0, 3.0, 11.0, 10.0, 16.0, 20.0, 25.0, 19.0, 28.0, 25.0, 38.0, 44.0, 45.0, 31.0, 57.0, 49.0, 52.0, 55.0, 50.0, 45.0, 51.0, 40.0, 45.0, 32.0, 25.0, 25.0, 29.0, 22.0, 19.0, 15.0, 10.0, 4.0, 18.0, 7.0, 2.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7706146240234375, -0.747283935546875, -0.7239532470703125, -0.70062255859375, -0.6772918701171875, -0.653961181640625, -0.6306304931640625, -0.6072998046875, -0.5839691162109375, -0.560638427734375, -0.5373077392578125, -0.51397705078125, -0.4906463623046875, -0.467315673828125, -0.4439849853515625, -0.420654296875, -0.3973236083984375, -0.373992919921875, -0.3506622314453125, -0.32733154296875, -0.3040008544921875, -0.280670166015625, -0.2573394775390625, -0.2340087890625, -0.2106781005859375, -0.187347412109375, -0.1640167236328125, -0.14068603515625, -0.1173553466796875, -0.094024658203125, -0.0706939697265625, -0.04736328125, -0.0240325927734375, -0.000701904296875, 0.0226287841796875, 0.04595947265625, 0.0692901611328125, 0.092620849609375, 0.1159515380859375, 0.1392822265625, 0.1626129150390625, 0.185943603515625, 0.2092742919921875, 0.23260498046875, 0.2559356689453125, 0.279266357421875, 0.3025970458984375, 0.325927734375, 0.3492584228515625, 0.372589111328125, 0.3959197998046875, 0.41925048828125, 0.4425811767578125, 0.465911865234375, 0.4892425537109375, 0.5125732421875, 0.5359039306640625, 0.559234619140625, 0.5825653076171875, 0.60589599609375, 0.6292266845703125, 0.652557373046875, 0.6758880615234375, 0.69921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 9.0, 5.0, 9.0, 9.0, 11.0, 20.0, 39.0, 114.0, 361.0, 1321101.0, 2871961.0, 385.0, 89.0, 40.0, 26.0, 19.0, 15.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.59375, -14.1231689453125, -13.652587890625, -13.1820068359375, -12.71142578125, -12.2408447265625, -11.770263671875, -11.2996826171875, -10.8291015625, -10.3585205078125, -9.887939453125, -9.4173583984375, -8.94677734375, -8.4761962890625, -8.005615234375, -7.5350341796875, -7.064453125, -6.5938720703125, -6.123291015625, -5.6527099609375, -5.18212890625, -4.7115478515625, -4.240966796875, -3.7703857421875, -3.2998046875, -2.8292236328125, -2.358642578125, -1.8880615234375, -1.41748046875, -0.9468994140625, -0.476318359375, -0.0057373046875, 0.46484375, 0.9354248046875, 1.406005859375, 1.8765869140625, 2.34716796875, 2.8177490234375, 3.288330078125, 3.7589111328125, 4.2294921875, 4.7000732421875, 5.170654296875, 5.6412353515625, 6.11181640625, 6.5823974609375, 7.052978515625, 7.5235595703125, 7.994140625, 8.4647216796875, 8.935302734375, 9.4058837890625, 9.87646484375, 10.3470458984375, 10.817626953125, 11.2882080078125, 11.7587890625, 12.2293701171875, 12.699951171875, 13.1705322265625, 13.64111328125, 14.1116943359375, 14.582275390625, 15.0528564453125, 15.5234375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 16.0, 16.0, 19.0, 33.0, 55.0, 89.0, 114.0, 164.0, 265.0, 390.0, 535.0, 607.0, 531.0, 405.0, 281.0, 178.0, 128.0, 71.0, 61.0, 29.0, 21.0, 14.0, 14.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.413330078125, -0.4025993347167969, -0.39186859130859375, -0.3811378479003906, -0.3704071044921875, -0.3596763610839844, -0.34894561767578125, -0.3382148742675781, -0.327484130859375, -0.3167533874511719, -0.30602264404296875, -0.2952919006347656, -0.2845611572265625, -0.2738304138183594, -0.26309967041015625, -0.2523689270019531, -0.24163818359375, -0.23090744018554688, -0.22017669677734375, -0.20944595336914062, -0.1987152099609375, -0.18798446655273438, -0.17725372314453125, -0.16652297973632812, -0.155792236328125, -0.14506149291992188, -0.13433074951171875, -0.12360000610351562, -0.1128692626953125, -0.10213851928710938, -0.09140777587890625, -0.08067703247070312, -0.0699462890625, -0.059215545654296875, -0.04848480224609375, -0.037754058837890625, -0.0270233154296875, -0.016292572021484375, -0.00556182861328125, 0.005168914794921875, 0.015899658203125, 0.026630401611328125, 0.03736114501953125, 0.048091888427734375, 0.0588226318359375, 0.06955337524414062, 0.08028411865234375, 0.09101486206054688, 0.10174560546875, 0.11247634887695312, 0.12320709228515625, 0.13393783569335938, 0.1446685791015625, 0.15539932250976562, 0.16613006591796875, 0.17686080932617188, 0.187591552734375, 0.19832229614257812, 0.20905303955078125, 0.21978378295898438, 0.2305145263671875, 0.24124526977539062, 0.25197601318359375, 0.2627067565917969, 0.2734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 11.0, 9.0, 12.0, 19.0, 19.0, 19.0, 28.0, 45.0, 56.0, 63.0, 63.0, 88.0, 78.0, 99.0, 63.0, 73.0, 66.0, 52.0, 39.0, 27.0, 21.0, 13.0, 7.0, 14.0, 5.0, 5.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0], "bins": [-1.4711329936981201, -1.438071370124817, -1.4050097465515137, -1.3719481229782104, -1.3388864994049072, -1.3058249950408936, -1.2727633714675903, -1.239701747894287, -1.2066401243209839, -1.1735785007476807, -1.1405168771743774, -1.1074552536010742, -1.0743937492370605, -1.0413321256637573, -1.008270502090454, -0.9752088785171509, -0.9421472549438477, -0.9090856313705444, -0.8760240077972412, -0.8429624438285828, -0.8099008202552795, -0.7768391966819763, -0.7437776327133179, -0.7107160091400146, -0.6776543855667114, -0.6445927619934082, -0.611531138420105, -0.5784695744514465, -0.5454079508781433, -0.5123463273048401, -0.47928473353385925, -0.4462231397628784, -0.41316157579421997, -0.38009995222091675, -0.3470383584499359, -0.3139767646789551, -0.28091514110565186, -0.24785353243350983, -0.2147919237613678, -0.18173031508922577, -0.14866870641708374, -0.11560709774494171, -0.08254548907279968, -0.049483880400657654, -0.016422271728515625, 0.016639336943626404, 0.04970094561576843, 0.08276255428791046, 0.11582416296005249, 0.14888577163219452, 0.18194738030433655, 0.21500898897647858, 0.2480705976486206, 0.28113222122192383, 0.31419381499290466, 0.3472554087638855, 0.3803170323371887, 0.41337865591049194, 0.4464402496814728, 0.4795018434524536, 0.5125634670257568, 0.5456250905990601, 0.5786867141723633, 0.6117482781410217, 0.644809901714325]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 6.0, 11.0, 13.0, 24.0, 29.0, 46.0, 32.0, 38.0, 25.0, 32.0, 37.0, 39.0, 42.0, 47.0, 46.0, 34.0, 52.0, 42.0, 36.0, 36.0, 45.0, 30.0, 29.0, 26.0, 22.0, 28.0, 22.0, 11.0, 9.0, 12.0, 11.0, 11.0, 15.0, 10.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6389943957328796, -0.6174085736274719, -0.595822811126709, -0.5742369890213013, -0.5526511669158936, -0.5310653448104858, -0.5094795823097229, -0.4878937602043152, -0.46630796790122986, -0.44472217559814453, -0.4231363534927368, -0.4015505611896515, -0.37996476888656616, -0.35837894678115845, -0.3367931544780731, -0.3152073621749878, -0.2936215400695801, -0.27203574776649475, -0.25044992566108704, -0.2288641333580017, -0.2072783261537552, -0.18569251894950867, -0.16410672664642334, -0.14252091944217682, -0.1209351122379303, -0.09934930503368378, -0.07776350528001785, -0.05617770552635193, -0.03459189832210541, -0.013006091117858887, 0.00857970118522644, 0.03016550838947296, 0.05175137519836426, 0.07333718240261078, 0.0949229821562767, 0.11650878190994263, 0.13809458911418915, 0.15968039631843567, 0.181266188621521, 0.20285199582576752, 0.22443780303001404, 0.24602361023426056, 0.2676094174385071, 0.2891952097415924, 0.31078100204467773, 0.33236682415008545, 0.3539526164531708, 0.3755384087562561, 0.3971242308616638, 0.41871002316474915, 0.44029584527015686, 0.4618816375732422, 0.4834674596786499, 0.5050532817840576, 0.5266390442848206, 0.5482248663902283, 0.5698106288909912, 0.5913964509963989, 0.6129822134971619, 0.6345680356025696, 0.6561538577079773, 0.6777396202087402, 0.699325442314148, 0.7209112644195557, 0.7424970865249634]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 12.0, 17.0, 30.0, 39.0, 64.0, 100.0, 136.0, 239.0, 307.0, 505.0, 878.0, 1387.0, 2150.0, 3117.0, 5291.0, 10089.0, 22455.0, 60271.0, 164604.0, 326735.0, 265481.0, 110207.0, 39574.0, 15703.0, 7578.0, 4214.0, 2555.0, 1719.0, 1047.0, 726.0, 467.0, 288.0, 190.0, 150.0, 77.0, 63.0, 28.0, 23.0, 15.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.267822265625, -0.26033973693847656, -0.2528572082519531, -0.2453746795654297, -0.23789215087890625, -0.2304096221923828, -0.22292709350585938, -0.21544456481933594, -0.2079620361328125, -0.20047950744628906, -0.19299697875976562, -0.1855144500732422, -0.17803192138671875, -0.1705493927001953, -0.16306686401367188, -0.15558433532714844, -0.148101806640625, -0.14061927795410156, -0.13313674926757812, -0.1256542205810547, -0.11817169189453125, -0.11068916320800781, -0.10320663452148438, -0.09572410583496094, -0.0882415771484375, -0.08075904846191406, -0.07327651977539062, -0.06579399108886719, -0.05831146240234375, -0.05082893371582031, -0.043346405029296875, -0.03586387634277344, -0.02838134765625, -0.020898818969726562, -0.013416290283203125, -0.0059337615966796875, 0.00154876708984375, 0.009031295776367188, 0.016513824462890625, 0.023996353149414062, 0.0314788818359375, 0.03896141052246094, 0.046443939208984375, 0.05392646789550781, 0.06140899658203125, 0.06889152526855469, 0.07637405395507812, 0.08385658264160156, 0.091339111328125, 0.09882164001464844, 0.10630416870117188, 0.11378669738769531, 0.12126922607421875, 0.1287517547607422, 0.13623428344726562, 0.14371681213378906, 0.1511993408203125, 0.15868186950683594, 0.16616439819335938, 0.1736469268798828, 0.18112945556640625, 0.1886119842529297, 0.19609451293945312, 0.20357704162597656, 0.2110595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 13.0, 20.0, 14.0, 35.0, 35.0, 35.0, 42.0, 43.0, 39.0, 48.0, 52.0, 53.0, 52.0, 50.0, 49.0, 46.0, 45.0, 43.0, 40.0, 42.0, 34.0, 19.0, 22.0, 17.0, 15.0, 9.0, 15.0, 14.0, 14.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.507568359375, -0.49072265625, -0.473876953125, -0.45703125, -0.440185546875, -0.42333984375, -0.406494140625, -0.3896484375, -0.372802734375, -0.35595703125, -0.339111328125, -0.322265625, -0.305419921875, -0.28857421875, -0.271728515625, -0.2548828125, -0.238037109375, -0.22119140625, -0.204345703125, -0.1875, -0.170654296875, -0.15380859375, -0.136962890625, -0.1201171875, -0.103271484375, -0.08642578125, -0.069580078125, -0.052734375, -0.035888671875, -0.01904296875, -0.002197265625, 0.0146484375, 0.031494140625, 0.04833984375, 0.065185546875, 0.08203125, 0.098876953125, 0.11572265625, 0.132568359375, 0.1494140625, 0.166259765625, 0.18310546875, 0.199951171875, 0.216796875, 0.233642578125, 0.25048828125, 0.267333984375, 0.2841796875, 0.301025390625, 0.31787109375, 0.334716796875, 0.3515625, 0.368408203125, 0.38525390625, 0.402099609375, 0.4189453125, 0.435791015625, 0.45263671875, 0.469482421875, 0.486328125, 0.503173828125, 0.52001953125, 0.536865234375, 0.5537109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 7.0, 10.0, 10.0, 27.0, 30.0, 49.0, 111.0, 145.0, 255.0, 470.0, 848.0, 1604.0, 3347.0, 8876.0, 35969.0, 189382.0, 527467.0, 220371.0, 42243.0, 10050.0, 3637.0, 1695.0, 869.0, 423.0, 247.0, 140.0, 86.0, 46.0, 40.0, 24.0, 20.0, 8.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.451934814453125, -0.43804931640625, -0.424163818359375, -0.4102783203125, -0.396392822265625, -0.38250732421875, -0.368621826171875, -0.354736328125, -0.340850830078125, -0.32696533203125, -0.313079833984375, -0.2991943359375, -0.285308837890625, -0.27142333984375, -0.257537841796875, -0.24365234375, -0.229766845703125, -0.21588134765625, -0.201995849609375, -0.1881103515625, -0.174224853515625, -0.16033935546875, -0.146453857421875, -0.132568359375, -0.118682861328125, -0.10479736328125, -0.090911865234375, -0.0770263671875, -0.063140869140625, -0.04925537109375, -0.035369873046875, -0.021484375, -0.007598876953125, 0.00628662109375, 0.020172119140625, 0.0340576171875, 0.047943115234375, 0.06182861328125, 0.075714111328125, 0.089599609375, 0.103485107421875, 0.11737060546875, 0.131256103515625, 0.1451416015625, 0.159027099609375, 0.17291259765625, 0.186798095703125, 0.20068359375, 0.214569091796875, 0.22845458984375, 0.242340087890625, 0.2562255859375, 0.270111083984375, 0.28399658203125, 0.297882080078125, 0.311767578125, 0.325653076171875, 0.33953857421875, 0.353424072265625, 0.3673095703125, 0.381195068359375, 0.39508056640625, 0.408966064453125, 0.4228515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 11.0, 14.0, 12.0, 19.0, 20.0, 18.0, 26.0, 23.0, 39.0, 36.0, 33.0, 36.0, 49.0, 41.0, 47.0, 34.0, 58.0, 44.0, 43.0, 45.0, 25.0, 50.0, 28.0, 35.0, 29.0, 29.0, 19.0, 15.0, 14.0, 18.0, 13.0, 7.0, 6.0, 4.0, 12.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8400039672851562, -0.8113555908203125, -0.7827072143554688, -0.754058837890625, -0.7254104614257812, -0.6967620849609375, -0.6681137084960938, -0.63946533203125, -0.6108169555664062, -0.5821685791015625, -0.5535202026367188, -0.524871826171875, -0.49622344970703125, -0.4675750732421875, -0.43892669677734375, -0.4102783203125, -0.38162994384765625, -0.3529815673828125, -0.32433319091796875, -0.295684814453125, -0.26703643798828125, -0.2383880615234375, -0.20973968505859375, -0.18109130859375, -0.15244293212890625, -0.1237945556640625, -0.09514617919921875, -0.066497802734375, -0.03784942626953125, -0.0092010498046875, 0.01944732666015625, 0.048095703125, 0.07674407958984375, 0.1053924560546875, 0.13404083251953125, 0.162689208984375, 0.19133758544921875, 0.2199859619140625, 0.24863433837890625, 0.27728271484375, 0.30593109130859375, 0.3345794677734375, 0.36322784423828125, 0.391876220703125, 0.42052459716796875, 0.4491729736328125, 0.47782135009765625, 0.5064697265625, 0.5351181030273438, 0.5637664794921875, 0.5924148559570312, 0.621063232421875, 0.6497116088867188, 0.6783599853515625, 0.7070083618164062, 0.73565673828125, 0.7643051147460938, 0.7929534912109375, 0.8216018676757812, 0.850250244140625, 0.8788986206054688, 0.9075469970703125, 0.9361953735351562, 0.96484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 6.0, 17.0, 26.0, 51.0, 88.0, 149.0, 318.0, 713.0, 1737.0, 4993.0, 18363.0, 180838.0, 748316.0, 75269.0, 11696.0, 3567.0, 1350.0, 533.0, 220.0, 111.0, 75.0, 42.0, 20.0, 17.0, 9.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21564483642578125, -0.2093658447265625, -0.20308685302734375, -0.196807861328125, -0.19052886962890625, -0.1842498779296875, -0.17797088623046875, -0.17169189453125, -0.16541290283203125, -0.1591339111328125, -0.15285491943359375, -0.146575927734375, -0.14029693603515625, -0.1340179443359375, -0.12773895263671875, -0.1214599609375, -0.11518096923828125, -0.1089019775390625, -0.10262298583984375, -0.096343994140625, -0.09006500244140625, -0.0837860107421875, -0.07750701904296875, -0.07122802734375, -0.06494903564453125, -0.0586700439453125, -0.05239105224609375, -0.046112060546875, -0.03983306884765625, -0.0335540771484375, -0.02727508544921875, -0.02099609375, -0.01471710205078125, -0.0084381103515625, -0.00215911865234375, 0.004119873046875, 0.01039886474609375, 0.0166778564453125, 0.02295684814453125, 0.02923583984375, 0.03551483154296875, 0.0417938232421875, 0.04807281494140625, 0.054351806640625, 0.06063079833984375, 0.0669097900390625, 0.07318878173828125, 0.0794677734375, 0.08574676513671875, 0.0920257568359375, 0.09830474853515625, 0.104583740234375, 0.11086273193359375, 0.1171417236328125, 0.12342071533203125, 0.12969970703125, 0.13597869873046875, 0.1422576904296875, 0.14853668212890625, 0.154815673828125, 0.16109466552734375, 0.1673736572265625, 0.17365264892578125, 0.179931640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 24.0, 62.0, 122.0, 216.0, 232.0, 155.0, 74.0, 37.0, 21.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101629257202148e-05, -8.740182965993881e-05, -8.378736674785614e-05, -8.017290383577347e-05, -7.65584409236908e-05, -7.294397801160812e-05, -6.932951509952545e-05, -6.571505218744278e-05, -6.210058927536011e-05, -5.8486126363277435e-05, -5.487166345119476e-05, -5.125720053911209e-05, -4.764273762702942e-05, -4.402827471494675e-05, -4.0413811802864075e-05, -3.67993488907814e-05, -3.318488597869873e-05, -2.957042306661606e-05, -2.5955960154533386e-05, -2.2341497242450714e-05, -1.8727034330368042e-05, -1.511257141828537e-05, -1.1498108506202698e-05, -7.883645594120026e-06, -4.2691826820373535e-06, -6.547197699546814e-07, 2.9597431421279907e-06, 6.574206054210663e-06, 1.0188668966293335e-05, 1.3803131878376007e-05, 1.741759479045868e-05, 2.103205770254135e-05, 2.4646520614624023e-05, 2.8260983526706696e-05, 3.187544643878937e-05, 3.548990935087204e-05, 3.910437226295471e-05, 4.2718835175037384e-05, 4.6333298087120056e-05, 4.994776099920273e-05, 5.35622239112854e-05, 5.717668682336807e-05, 6.0791149735450745e-05, 6.440561264753342e-05, 6.802007555961609e-05, 7.163453847169876e-05, 7.524900138378143e-05, 7.88634642958641e-05, 8.247792720794678e-05, 8.609239012002945e-05, 8.970685303211212e-05, 9.33213159441948e-05, 9.693577885627747e-05, 0.00010055024176836014, 0.00010416470468044281, 0.00010777916759252548, 0.00011139363050460815, 0.00011500809341669083, 0.0001186225563287735, 0.00012223701924085617, 0.00012585148215293884, 0.00012946594506502151, 0.0001330804079771042, 0.00013669487088918686, 0.00014030933380126953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 3.0, 9.0, 10.0, 23.0, 22.0, 61.0, 117.0, 249.0, 1065.0, 9830.0, 817388.0, 213748.0, 5044.0, 583.0, 156.0, 73.0, 42.0, 29.0, 18.0, 14.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3366546630859375, -0.321258544921875, -0.3058624267578125, -0.29046630859375, -0.2750701904296875, -0.259674072265625, -0.2442779541015625, -0.2288818359375, -0.2134857177734375, -0.198089599609375, -0.1826934814453125, -0.16729736328125, -0.1519012451171875, -0.136505126953125, -0.1211090087890625, -0.105712890625, -0.0903167724609375, -0.074920654296875, -0.0595245361328125, -0.04412841796875, -0.0287322998046875, -0.013336181640625, 0.0020599365234375, 0.0174560546875, 0.0328521728515625, 0.048248291015625, 0.0636444091796875, 0.07904052734375, 0.0944366455078125, 0.109832763671875, 0.1252288818359375, 0.140625, 0.1560211181640625, 0.171417236328125, 0.1868133544921875, 0.20220947265625, 0.2176055908203125, 0.233001708984375, 0.2483978271484375, 0.2637939453125, 0.2791900634765625, 0.294586181640625, 0.3099822998046875, 0.32537841796875, 0.3407745361328125, 0.356170654296875, 0.3715667724609375, 0.386962890625, 0.4023590087890625, 0.417755126953125, 0.4331512451171875, 0.44854736328125, 0.4639434814453125, 0.479339599609375, 0.4947357177734375, 0.5101318359375, 0.5255279541015625, 0.540924072265625, 0.5563201904296875, 0.57171630859375, 0.5871124267578125, 0.602508544921875, 0.6179046630859375, 0.63330078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 14.0, 29.0, 42.0, 76.0, 129.0, 151.0, 177.0, 132.0, 72.0, 69.0, 23.0, 14.0, 13.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05145263671875, -0.049628257751464844, -0.04780387878417969, -0.04597949981689453, -0.044155120849609375, -0.04233074188232422, -0.04050636291503906, -0.038681983947753906, -0.03685760498046875, -0.035033226013183594, -0.03320884704589844, -0.03138446807861328, -0.029560089111328125, -0.02773571014404297, -0.025911331176757812, -0.024086952209472656, -0.0222625732421875, -0.020438194274902344, -0.018613815307617188, -0.01678943634033203, -0.014965057373046875, -0.013140678405761719, -0.011316299438476562, -0.009491920471191406, -0.00766754150390625, -0.005843162536621094, -0.0040187835693359375, -0.0021944046020507812, -0.000370025634765625, 0.0014543533325195312, 0.0032787322998046875, 0.005103111267089844, 0.006927490234375, 0.008751869201660156, 0.010576248168945312, 0.012400627136230469, 0.014225006103515625, 0.01604938507080078, 0.017873764038085938, 0.019698143005371094, 0.02152252197265625, 0.023346900939941406, 0.025171279907226562, 0.02699565887451172, 0.028820037841796875, 0.03064441680908203, 0.03246879577636719, 0.034293174743652344, 0.0361175537109375, 0.037941932678222656, 0.03976631164550781, 0.04159069061279297, 0.043415069580078125, 0.04523944854736328, 0.04706382751464844, 0.048888206481933594, 0.05071258544921875, 0.052536964416503906, 0.05436134338378906, 0.05618572235107422, 0.058010101318359375, 0.05983448028564453, 0.06165885925292969, 0.06348323822021484, 0.0653076171875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 14.0, 16.0, 35.0, 40.0, 41.0, 53.0, 81.0, 80.0, 100.0, 111.0, 63.0, 95.0, 78.0, 58.0, 41.0, 16.0, 22.0, 15.0, 8.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025408387184143, -1.0015565156936646, -0.977704644203186, -0.9538527727127075, -0.930000901222229, -0.9061490297317505, -0.882297158241272, -0.8584452867507935, -0.8345934152603149, -0.8107415437698364, -0.7868896722793579, -0.7630378007888794, -0.7391859292984009, -0.7153340578079224, -0.6914821863174438, -0.6676303148269653, -0.643778383731842, -0.6199265122413635, -0.596074640750885, -0.5722227692604065, -0.548370897769928, -0.5245190262794495, -0.5006670951843262, -0.47681525349617004, -0.45296338200569153, -0.429111510515213, -0.4052596390247345, -0.3814077377319336, -0.3575558662414551, -0.33370399475097656, -0.30985212326049805, -0.28600025177001953, -0.2621484398841858, -0.23829656839370728, -0.21444469690322876, -0.19059281051158905, -0.16674093902111053, -0.14288906753063202, -0.11903718113899231, -0.0951853096485138, -0.07133343815803528, -0.047481562942266464, -0.02362968772649765, 0.0002221912145614624, 0.024074062705039978, 0.047925934195518494, 0.0717778205871582, 0.09562969207763672, 0.11948156356811523, 0.14333343505859375, 0.16718530654907227, 0.19103719294071198, 0.2148890644311905, 0.238740935921669, 0.2625928223133087, 0.28644469380378723, 0.31029656529426575, 0.33414843678474426, 0.3580003082752228, 0.3818522095680237, 0.4057040810585022, 0.4295559525489807, 0.45340782403945923, 0.47725969552993774, 0.5011115670204163]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 5.0, 11.0, 20.0, 17.0, 31.0, 31.0, 40.0, 39.0, 37.0, 39.0, 30.0, 34.0, 45.0, 50.0, 40.0, 44.0, 59.0, 47.0, 31.0, 35.0, 43.0, 36.0, 22.0, 36.0, 16.0, 24.0, 13.0, 15.0, 9.0, 15.0, 9.0, 16.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.45454877614974976, -0.4400072693824768, -0.42546579241752625, -0.4109243154525757, -0.39638280868530273, -0.3818413019180298, -0.3672998249530792, -0.35275834798812866, -0.3382168412208557, -0.32367533445358276, -0.3091338574886322, -0.29459238052368164, -0.2800508737564087, -0.26550936698913574, -0.2509678900241852, -0.23642639815807343, -0.22188490629196167, -0.20734341442584991, -0.19280192255973816, -0.1782604306936264, -0.16371893882751465, -0.1491774469614029, -0.13463595509529114, -0.12009446322917938, -0.10555297136306763, -0.09101147949695587, -0.07646998763084412, -0.06192849576473236, -0.047387003898620605, -0.03284551203250885, -0.018304020166397095, -0.0037625283002853394, 0.010778933763504028, 0.025320425629615784, 0.03986191749572754, 0.054403409361839294, 0.06894490122795105, 0.0834863930940628, 0.09802788496017456, 0.11256937682628632, 0.12711086869239807, 0.14165236055850983, 0.15619385242462158, 0.17073534429073334, 0.1852768361568451, 0.19981832802295685, 0.2143598198890686, 0.22890131175518036, 0.24344280362129211, 0.2579842805862427, 0.2725257873535156, 0.2870672941207886, 0.30160877108573914, 0.3161502480506897, 0.33069175481796265, 0.3452332615852356, 0.35977473855018616, 0.3743162155151367, 0.38885772228240967, 0.4033992290496826, 0.4179407060146332, 0.43248218297958374, 0.4470236897468567, 0.46156519651412964, 0.4761066734790802]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 15.0, 14.0, 35.0, 56.0, 96.0, 167.0, 313.0, 554.0, 1221.0, 2992.0, 7898.0, 24763.0, 87801.0, 481227.0, 345999.0, 65264.0, 19017.0, 6603.0, 2398.0, 1070.0, 470.0, 222.0, 142.0, 79.0, 49.0, 21.0, 20.0, 14.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60302734375, -0.5846939086914062, -0.5663604736328125, -0.5480270385742188, -0.529693603515625, -0.5113601684570312, -0.4930267333984375, -0.47469329833984375, -0.45635986328125, -0.43802642822265625, -0.4196929931640625, -0.40135955810546875, -0.383026123046875, -0.36469268798828125, -0.3463592529296875, -0.32802581787109375, -0.3096923828125, -0.29135894775390625, -0.2730255126953125, -0.25469207763671875, -0.236358642578125, -0.21802520751953125, -0.1996917724609375, -0.18135833740234375, -0.16302490234375, -0.14469146728515625, -0.1263580322265625, -0.10802459716796875, -0.089691162109375, -0.07135772705078125, -0.0530242919921875, -0.03469085693359375, -0.016357421875, 0.00197601318359375, 0.0203094482421875, 0.03864288330078125, 0.056976318359375, 0.07530975341796875, 0.0936431884765625, 0.11197662353515625, 0.13031005859375, 0.14864349365234375, 0.1669769287109375, 0.18531036376953125, 0.203643798828125, 0.22197723388671875, 0.2403106689453125, 0.25864410400390625, 0.2769775390625, 0.29531097412109375, 0.3136444091796875, 0.33197784423828125, 0.350311279296875, 0.36864471435546875, 0.3869781494140625, 0.40531158447265625, 0.42364501953125, 0.44197845458984375, 0.4603118896484375, 0.47864532470703125, 0.496978759765625, 0.5153121948242188, 0.5336456298828125, 0.5519790649414062, 0.5703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 8.0, 11.0, 16.0, 14.0, 16.0, 20.0, 18.0, 27.0, 31.0, 32.0, 32.0, 44.0, 49.0, 36.0, 42.0, 51.0, 44.0, 42.0, 44.0, 48.0, 29.0, 36.0, 30.0, 22.0, 27.0, 36.0, 25.0, 19.0, 17.0, 28.0, 17.0, 7.0, 13.0, 8.0, 9.0, 4.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.396484375, -1.3516082763671875, -1.306732177734375, -1.2618560791015625, -1.21697998046875, -1.1721038818359375, -1.127227783203125, -1.0823516845703125, -1.0374755859375, -0.9925994873046875, -0.947723388671875, -0.9028472900390625, -0.85797119140625, -0.8130950927734375, -0.768218994140625, -0.7233428955078125, -0.678466796875, -0.6335906982421875, -0.588714599609375, -0.5438385009765625, -0.49896240234375, -0.4540863037109375, -0.409210205078125, -0.3643341064453125, -0.3194580078125, -0.2745819091796875, -0.229705810546875, -0.1848297119140625, -0.13995361328125, -0.0950775146484375, -0.050201416015625, -0.0053253173828125, 0.03955078125, 0.0844268798828125, 0.129302978515625, 0.1741790771484375, 0.21905517578125, 0.2639312744140625, 0.308807373046875, 0.3536834716796875, 0.3985595703125, 0.4434356689453125, 0.488311767578125, 0.5331878662109375, 0.57806396484375, 0.6229400634765625, 0.667816162109375, 0.7126922607421875, 0.757568359375, 0.8024444580078125, 0.847320556640625, 0.8921966552734375, 0.93707275390625, 0.9819488525390625, 1.026824951171875, 1.0717010498046875, 1.1165771484375, 1.1614532470703125, 1.206329345703125, 1.2512054443359375, 1.29608154296875, 1.3409576416015625, 1.385833740234375, 1.4307098388671875, 1.4755859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 20.0, 22.0, 38.0, 35.0, 55.0, 82.0, 109.0, 222.0, 1913.0, 1043327.0, 2063.0, 221.0, 90.0, 88.0, 55.0, 42.0, 32.0, 28.0, 14.0, 19.0, 10.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.37890625, -6.1697998046875, -5.960693359375, -5.7515869140625, -5.54248046875, -5.3333740234375, -5.124267578125, -4.9151611328125, -4.7060546875, -4.4969482421875, -4.287841796875, -4.0787353515625, -3.86962890625, -3.6605224609375, -3.451416015625, -3.2423095703125, -3.033203125, -2.8240966796875, -2.614990234375, -2.4058837890625, -2.19677734375, -1.9876708984375, -1.778564453125, -1.5694580078125, -1.3603515625, -1.1512451171875, -0.942138671875, -0.7330322265625, -0.52392578125, -0.3148193359375, -0.105712890625, 0.1033935546875, 0.3125, 0.5216064453125, 0.730712890625, 0.9398193359375, 1.14892578125, 1.3580322265625, 1.567138671875, 1.7762451171875, 1.9853515625, 2.1944580078125, 2.403564453125, 2.6126708984375, 2.82177734375, 3.0308837890625, 3.239990234375, 3.4490966796875, 3.658203125, 3.8673095703125, 4.076416015625, 4.2855224609375, 4.49462890625, 4.7037353515625, 4.912841796875, 5.1219482421875, 5.3310546875, 5.5401611328125, 5.749267578125, 5.9583740234375, 6.16748046875, 6.3765869140625, 6.585693359375, 6.7947998046875, 7.00390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 8.0, 18.0, 15.0, 15.0, 37.0, 33.0, 41.0, 61.0, 68.0, 82.0, 70.0, 80.0, 81.0, 65.0, 51.0, 52.0, 42.0, 44.0, 37.0, 22.0, 12.0, 18.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.55859375, -2.47479248046875, -2.3909912109375, -2.30718994140625, -2.223388671875, -2.13958740234375, -2.0557861328125, -1.97198486328125, -1.88818359375, -1.80438232421875, -1.7205810546875, -1.63677978515625, -1.552978515625, -1.46917724609375, -1.3853759765625, -1.30157470703125, -1.2177734375, -1.13397216796875, -1.0501708984375, -0.96636962890625, -0.882568359375, -0.79876708984375, -0.7149658203125, -0.63116455078125, -0.54736328125, -0.46356201171875, -0.3797607421875, -0.29595947265625, -0.212158203125, -0.12835693359375, -0.0445556640625, 0.03924560546875, 0.123046875, 0.20684814453125, 0.2906494140625, 0.37445068359375, 0.458251953125, 0.54205322265625, 0.6258544921875, 0.70965576171875, 0.79345703125, 0.87725830078125, 0.9610595703125, 1.04486083984375, 1.128662109375, 1.21246337890625, 1.2962646484375, 1.38006591796875, 1.4638671875, 1.54766845703125, 1.6314697265625, 1.71527099609375, 1.799072265625, 1.88287353515625, 1.9666748046875, 2.05047607421875, 2.13427734375, 2.21807861328125, 2.3018798828125, 2.38568115234375, 2.469482421875, 2.55328369140625, 2.6370849609375, 2.72088623046875, 2.8046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 13.0, 11.0, 18.0, 29.0, 42.0, 63.0, 114.0, 238.0, 797.0, 5797.0, 157307.0, 857988.0, 23437.0, 1853.0, 389.0, 160.0, 82.0, 62.0, 26.0, 16.0, 16.0, 17.0, 11.0, 6.0, 7.0, 5.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3671417236328125, -0.353668212890625, -0.3401947021484375, -0.32672119140625, -0.3132476806640625, -0.299774169921875, -0.2863006591796875, -0.2728271484375, -0.2593536376953125, -0.245880126953125, -0.2324066162109375, -0.21893310546875, -0.2054595947265625, -0.191986083984375, -0.1785125732421875, -0.1650390625, -0.1515655517578125, -0.138092041015625, -0.1246185302734375, -0.11114501953125, -0.0976715087890625, -0.084197998046875, -0.0707244873046875, -0.0572509765625, -0.0437774658203125, -0.030303955078125, -0.0168304443359375, -0.00335693359375, 0.0101165771484375, 0.023590087890625, 0.0370635986328125, 0.050537109375, 0.0640106201171875, 0.077484130859375, 0.0909576416015625, 0.10443115234375, 0.1179046630859375, 0.131378173828125, 0.1448516845703125, 0.1583251953125, 0.1717987060546875, 0.185272216796875, 0.1987457275390625, 0.21221923828125, 0.2256927490234375, 0.239166259765625, 0.2526397705078125, 0.26611328125, 0.2795867919921875, 0.293060302734375, 0.3065338134765625, 0.32000732421875, 0.3334808349609375, 0.346954345703125, 0.3604278564453125, 0.3739013671875, 0.3873748779296875, 0.400848388671875, 0.4143218994140625, 0.42779541015625, 0.4412689208984375, 0.454742431640625, 0.4682159423828125, 0.481689453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 10.0, 12.0, 11.0, 13.0, 20.0, 28.0, 33.0, 41.0, 54.0, 80.0, 117.0, 101.0, 118.0, 94.0, 57.0, 46.0, 36.0, 29.0, 21.0, 15.0, 16.0, 10.0, 3.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.220459282398224e-05, -2.1401792764663696e-05, -2.0598992705345154e-05, -1.979619264602661e-05, -1.899339258670807e-05, -1.8190592527389526e-05, -1.7387792468070984e-05, -1.658499240875244e-05, -1.57821923494339e-05, -1.4979392290115356e-05, -1.4176592230796814e-05, -1.3373792171478271e-05, -1.2570992112159729e-05, -1.1768192052841187e-05, -1.0965391993522644e-05, -1.0162591934204102e-05, -9.359791874885559e-06, -8.556991815567017e-06, -7.754191756248474e-06, -6.951391696929932e-06, -6.148591637611389e-06, -5.345791578292847e-06, -4.542991518974304e-06, -3.7401914596557617e-06, -2.9373914003372192e-06, -2.1345913410186768e-06, -1.3317912817001343e-06, -5.289912223815918e-07, 2.738088369369507e-07, 1.0766088962554932e-06, 1.8794089555740356e-06, 2.682209014892578e-06, 3.4850090742111206e-06, 4.287809133529663e-06, 5.0906091928482056e-06, 5.893409252166748e-06, 6.6962093114852905e-06, 7.499009370803833e-06, 8.301809430122375e-06, 9.104609489440918e-06, 9.90740954875946e-06, 1.0710209608078003e-05, 1.1513009667396545e-05, 1.2315809726715088e-05, 1.311860978603363e-05, 1.3921409845352173e-05, 1.4724209904670715e-05, 1.5527009963989258e-05, 1.63298100233078e-05, 1.7132610082626343e-05, 1.7935410141944885e-05, 1.8738210201263428e-05, 1.954101026058197e-05, 2.0343810319900513e-05, 2.1146610379219055e-05, 2.1949410438537598e-05, 2.275221049785614e-05, 2.3555010557174683e-05, 2.4357810616493225e-05, 2.5160610675811768e-05, 2.596341073513031e-05, 2.6766210794448853e-05, 2.7569010853767395e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 8.0, 7.0, 3.0, 7.0, 12.0, 15.0, 28.0, 26.0, 46.0, 77.0, 155.0, 347.0, 1138.0, 7145.0, 125331.0, 863951.0, 45007.0, 3894.0, 769.0, 261.0, 128.0, 75.0, 43.0, 25.0, 19.0, 12.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.41667938232421875, -0.4048919677734375, -0.39310455322265625, -0.381317138671875, -0.36952972412109375, -0.3577423095703125, -0.34595489501953125, -0.33416748046875, -0.32238006591796875, -0.3105926513671875, -0.29880523681640625, -0.287017822265625, -0.27523040771484375, -0.2634429931640625, -0.25165557861328125, -0.2398681640625, -0.22808074951171875, -0.2162933349609375, -0.20450592041015625, -0.192718505859375, -0.18093109130859375, -0.1691436767578125, -0.15735626220703125, -0.14556884765625, -0.13378143310546875, -0.1219940185546875, -0.11020660400390625, -0.098419189453125, -0.08663177490234375, -0.0748443603515625, -0.06305694580078125, -0.05126953125, -0.03948211669921875, -0.0276947021484375, -0.01590728759765625, -0.004119873046875, 0.00766754150390625, 0.0194549560546875, 0.03124237060546875, 0.04302978515625, 0.05481719970703125, 0.0666046142578125, 0.07839202880859375, 0.090179443359375, 0.10196685791015625, 0.1137542724609375, 0.12554168701171875, 0.1373291015625, 0.14911651611328125, 0.1609039306640625, 0.17269134521484375, 0.184478759765625, 0.19626617431640625, 0.2080535888671875, 0.21984100341796875, 0.23162841796875, 0.24341583251953125, 0.2552032470703125, 0.26699066162109375, 0.278778076171875, 0.29056549072265625, 0.3023529052734375, 0.31414031982421875, 0.325927734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 6.0, 14.0, 14.0, 30.0, 42.0, 50.0, 100.0, 134.0, 154.0, 156.0, 94.0, 69.0, 41.0, 31.0, 14.0, 10.0, 9.0, 5.0, 5.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07939910888671875, -0.0765228271484375, -0.07364654541015625, -0.070770263671875, -0.06789398193359375, -0.0650177001953125, -0.06214141845703125, -0.05926513671875, -0.05638885498046875, -0.0535125732421875, -0.05063629150390625, -0.047760009765625, -0.04488372802734375, -0.0420074462890625, -0.03913116455078125, -0.0362548828125, -0.03337860107421875, -0.0305023193359375, -0.02762603759765625, -0.024749755859375, -0.02187347412109375, -0.0189971923828125, -0.01612091064453125, -0.01324462890625, -0.01036834716796875, -0.0074920654296875, -0.00461578369140625, -0.001739501953125, 0.00113677978515625, 0.0040130615234375, 0.00688934326171875, 0.009765625, 0.01264190673828125, 0.0155181884765625, 0.01839447021484375, 0.021270751953125, 0.02414703369140625, 0.0270233154296875, 0.02989959716796875, 0.03277587890625, 0.03565216064453125, 0.0385284423828125, 0.04140472412109375, 0.044281005859375, 0.04715728759765625, 0.0500335693359375, 0.05290985107421875, 0.0557861328125, 0.05866241455078125, 0.0615386962890625, 0.06441497802734375, 0.067291259765625, 0.07016754150390625, 0.0730438232421875, 0.07592010498046875, 0.07879638671875, 0.08167266845703125, 0.0845489501953125, 0.08742523193359375, 0.090301513671875, 0.09317779541015625, 0.0960540771484375, 0.09893035888671875, 0.101806640625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 69.0, 222.0, 442.0, 224.0, 46.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404793620109558, -1.185573697090149, -0.9663538932800293, -0.7471339702606201, -0.5279141068458557, -0.3086942434310913, -0.08947432041168213, 0.1297454833984375, 0.3489654064178467, 0.5681852698326111, 0.7874051332473755, 1.0066250562667847, 1.2258448600769043, 1.4450647830963135, 1.6642847061157227, 1.8835045099258423, 2.102724552154541, 2.32194447517395, 2.5411643981933594, 2.7603840827941895, 2.9796040058135986, 3.198823928833008, 3.418043851852417, 3.637263774871826, 3.8564834594726562, 4.075703144073486, 4.294923305511475, 4.514142990112305, 4.733363151550293, 4.952582836151123, 5.171802520751953, 5.391022682189941, 5.6102423667907715, 5.829462051391602, 6.04868221282959, 6.26790189743042, 6.487122058868408, 6.706341743469238, 6.925561904907227, 7.144781589508057, 7.364001274108887, 7.583220958709717, 7.802441120147705, 8.021660804748535, 8.240880966186523, 8.460100173950195, 8.679320335388184, 8.898540496826172, 9.11776065826416, 9.336980819702148, 9.55620002746582, 9.775420188903809, 9.994640350341797, 10.213859558105469, 10.433079719543457, 10.652299880981445, 10.871519088745117, 11.090739250183105, 11.309958457946777, 11.529178619384766, 11.748398780822754, 11.967618942260742, 12.186838150024414, 12.406058311462402, 12.62527847290039]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 4.0, 9.0, 6.0, 9.0, 10.0, 19.0, 18.0, 24.0, 17.0, 21.0, 26.0, 30.0, 29.0, 26.0, 43.0, 37.0, 37.0, 44.0, 47.0, 57.0, 35.0, 39.0, 26.0, 34.0, 32.0, 36.0, 28.0, 31.0, 25.0, 29.0, 28.0, 25.0, 13.0, 15.0, 15.0, 9.0, 17.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.481558084487915, -2.410348892211914, -2.339139461517334, -2.267930269241333, -2.196721076965332, -2.125511646270752, -2.054302453994751, -1.98309326171875, -1.9118839502334595, -1.840674638748169, -1.769465446472168, -1.6982561349868774, -1.627046823501587, -1.555837631225586, -1.4846283197402954, -1.4134190082550049, -1.342209815979004, -1.2710005044937134, -1.1997913122177124, -1.1285820007324219, -1.057372808456421, -0.9861634969711304, -0.9149541854858398, -0.8437449336051941, -0.7725356817245483, -0.7013264298439026, -0.6301171779632568, -0.5589078664779663, -0.48769861459732056, -0.4164893627166748, -0.34528008103370667, -0.2740707993507385, -0.20286154747009277, -0.13165228068828583, -0.06044301390647888, 0.010766252875328064, 0.08197551965713501, 0.15318477153778076, 0.2243940532207489, 0.29560333490371704, 0.3668125867843628, 0.43802183866500854, 0.5092310905456543, 0.5804404020309448, 0.6516496539115906, 0.7228589057922363, 0.7940682172775269, 0.8652774691581726, 0.9364867210388184, 1.0076960325241089, 1.0789052248001099, 1.1501145362854004, 1.2213237285614014, 1.292533040046692, 1.3637423515319824, 1.4349515438079834, 1.506160855293274, 1.5773701667785645, 1.6485793590545654, 1.719788670539856, 1.7909979820251465, 1.8622071743011475, 1.933416485786438, 2.0046257972717285, 2.0758349895477295]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 1.0, 10.0, 10.0, 19.0, 18.0, 17.0, 18.0, 28.0, 33.0, 43.0, 48.0, 91.0, 207.0, 725.0, 3338.0, 36439.0, 868158.0, 2988759.0, 279235.0, 14102.0, 2051.0, 480.0, 143.0, 65.0, 48.0, 31.0, 14.0, 27.0, 20.0, 20.0, 11.0, 10.0, 11.0, 8.0, 10.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.0390625, -1.9858551025390625, -1.932647705078125, -1.8794403076171875, -1.82623291015625, -1.7730255126953125, -1.719818115234375, -1.6666107177734375, -1.6134033203125, -1.5601959228515625, -1.506988525390625, -1.4537811279296875, -1.40057373046875, -1.3473663330078125, -1.294158935546875, -1.2409515380859375, -1.187744140625, -1.1345367431640625, -1.081329345703125, -1.0281219482421875, -0.97491455078125, -0.9217071533203125, -0.868499755859375, -0.8152923583984375, -0.7620849609375, -0.7088775634765625, -0.655670166015625, -0.6024627685546875, -0.54925537109375, -0.4960479736328125, -0.442840576171875, -0.3896331787109375, -0.33642578125, -0.2832183837890625, -0.230010986328125, -0.1768035888671875, -0.12359619140625, -0.0703887939453125, -0.017181396484375, 0.0360260009765625, 0.0892333984375, 0.1424407958984375, 0.195648193359375, 0.2488555908203125, 0.30206298828125, 0.3552703857421875, 0.408477783203125, 0.4616851806640625, 0.514892578125, 0.5680999755859375, 0.621307373046875, 0.6745147705078125, 0.72772216796875, 0.7809295654296875, 0.834136962890625, 0.8873443603515625, 0.9405517578125, 0.9937591552734375, 1.046966552734375, 1.1001739501953125, 1.15338134765625, 1.2065887451171875, 1.259796142578125, 1.3130035400390625, 1.3662109375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 9.0, 12.0, 17.0, 9.0, 14.0, 17.0, 21.0, 31.0, 36.0, 45.0, 39.0, 48.0, 46.0, 46.0, 43.0, 50.0, 52.0, 49.0, 42.0, 42.0, 48.0, 42.0, 26.0, 34.0, 25.0, 24.0, 19.0, 17.0, 18.0, 8.0, 11.0, 13.0, 6.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.740234375, -0.7199249267578125, -0.699615478515625, -0.6793060302734375, -0.65899658203125, -0.6386871337890625, -0.618377685546875, -0.5980682373046875, -0.5777587890625, -0.5574493408203125, -0.537139892578125, -0.5168304443359375, -0.49652099609375, -0.4762115478515625, -0.455902099609375, -0.4355926513671875, -0.415283203125, -0.3949737548828125, -0.374664306640625, -0.3543548583984375, -0.33404541015625, -0.3137359619140625, -0.293426513671875, -0.2731170654296875, -0.2528076171875, -0.2324981689453125, -0.212188720703125, -0.1918792724609375, -0.17156982421875, -0.1512603759765625, -0.130950927734375, -0.1106414794921875, -0.09033203125, -0.0700225830078125, -0.049713134765625, -0.0294036865234375, -0.00909423828125, 0.0112152099609375, 0.031524658203125, 0.0518341064453125, 0.0721435546875, 0.0924530029296875, 0.112762451171875, 0.1330718994140625, 0.15338134765625, 0.1736907958984375, 0.194000244140625, 0.2143096923828125, 0.234619140625, 0.2549285888671875, 0.275238037109375, 0.2955474853515625, 0.31585693359375, 0.3361663818359375, 0.356475830078125, 0.3767852783203125, 0.3970947265625, 0.4174041748046875, 0.437713623046875, 0.4580230712890625, 0.47833251953125, 0.4986419677734375, 0.518951416015625, 0.5392608642578125, 0.5595703125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 12.0, 11.0, 13.0, 21.0, 41.0, 54.0, 58.0, 94.0, 157.0, 221.0, 413.0, 1681.0, 2390954.0, 1797857.0, 1569.0, 402.0, 257.0, 153.0, 97.0, 58.0, 55.0, 34.0, 12.0, 8.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.37725830078125, -5.2037353515625, -5.03021240234375, -4.856689453125, -4.68316650390625, -4.5096435546875, -4.33612060546875, -4.16259765625, -3.98907470703125, -3.8155517578125, -3.64202880859375, -3.468505859375, -3.29498291015625, -3.1214599609375, -2.94793701171875, -2.7744140625, -2.60089111328125, -2.4273681640625, -2.25384521484375, -2.080322265625, -1.90679931640625, -1.7332763671875, -1.55975341796875, -1.38623046875, -1.21270751953125, -1.0391845703125, -0.86566162109375, -0.692138671875, -0.51861572265625, -0.3450927734375, -0.17156982421875, 0.001953125, 0.17547607421875, 0.3489990234375, 0.52252197265625, 0.696044921875, 0.86956787109375, 1.0430908203125, 1.21661376953125, 1.39013671875, 1.56365966796875, 1.7371826171875, 1.91070556640625, 2.084228515625, 2.25775146484375, 2.4312744140625, 2.60479736328125, 2.7783203125, 2.95184326171875, 3.1253662109375, 3.29888916015625, 3.472412109375, 3.64593505859375, 3.8194580078125, 3.99298095703125, 4.16650390625, 4.34002685546875, 4.5135498046875, 4.68707275390625, 4.860595703125, 5.03411865234375, 5.2076416015625, 5.38116455078125, 5.5546875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 11.0, 5.0, 11.0, 21.0, 19.0, 28.0, 34.0, 47.0, 74.0, 119.0, 162.0, 249.0, 339.0, 544.0, 603.0, 542.0, 395.0, 284.0, 179.0, 123.0, 84.0, 68.0, 52.0, 31.0, 19.0, 12.0, 4.0, 8.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.323486328125, -0.3128814697265625, -0.302276611328125, -0.2916717529296875, -0.28106689453125, -0.2704620361328125, -0.259857177734375, -0.2492523193359375, -0.2386474609375, -0.2280426025390625, -0.217437744140625, -0.2068328857421875, -0.19622802734375, -0.1856231689453125, -0.175018310546875, -0.1644134521484375, -0.15380859375, -0.1432037353515625, -0.132598876953125, -0.1219940185546875, -0.11138916015625, -0.1007843017578125, -0.090179443359375, -0.0795745849609375, -0.0689697265625, -0.0583648681640625, -0.047760009765625, -0.0371551513671875, -0.02655029296875, -0.0159454345703125, -0.005340576171875, 0.0052642822265625, 0.015869140625, 0.0264739990234375, 0.037078857421875, 0.0476837158203125, 0.05828857421875, 0.0688934326171875, 0.079498291015625, 0.0901031494140625, 0.1007080078125, 0.1113128662109375, 0.121917724609375, 0.1325225830078125, 0.14312744140625, 0.1537322998046875, 0.164337158203125, 0.1749420166015625, 0.185546875, 0.1961517333984375, 0.206756591796875, 0.2173614501953125, 0.22796630859375, 0.2385711669921875, 0.249176025390625, 0.2597808837890625, 0.2703857421875, 0.2809906005859375, 0.291595458984375, 0.3022003173828125, 0.31280517578125, 0.3234100341796875, 0.334014892578125, 0.3446197509765625, 0.355224609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 11.0, 5.0, 13.0, 10.0, 30.0, 27.0, 56.0, 69.0, 62.0, 90.0, 99.0, 109.0, 96.0, 95.0, 76.0, 49.0, 37.0, 22.0, 15.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7718772888183594, -1.7314456701278687, -1.691014051437378, -1.6505823135375977, -1.610150694847107, -1.5697190761566162, -1.5292874574661255, -1.4888558387756348, -1.4484241008758545, -1.4079924821853638, -1.367560863494873, -1.3271291255950928, -1.286697506904602, -1.2462658882141113, -1.2058342695236206, -1.1654026508331299, -1.1249709129333496, -1.0845392942428589, -1.0441076755523682, -1.003675937652588, -0.9632443189620972, -0.9228127002716064, -0.8823810815811157, -0.8419494032859802, -0.8015178442001343, -0.7610862255096436, -0.7206545472145081, -0.6802229285240173, -0.6397912502288818, -0.5993596315383911, -0.5589280128479004, -0.5184963345527649, -0.4780645966529846, -0.4376329481601715, -0.3972012996673584, -0.3567696809768677, -0.3163380026817322, -0.27590638399124146, -0.23547473549842834, -0.19504308700561523, -0.15461143851280212, -0.11417979001998901, -0.0737481489777565, -0.03331650793552399, 0.0071151405572891235, 0.047546789050102234, 0.08797842264175415, 0.12841007113456726, 0.16884171962738037, 0.20927336812019348, 0.2497050166130066, 0.2901366353034973, 0.3305683135986328, 0.37099993228912354, 0.41143158078193665, 0.45186322927474976, 0.49229487776756287, 0.532726526260376, 0.5731581449508667, 0.6135898232460022, 0.6540214419364929, 0.6944531202316284, 0.7348847389221191, 0.7753163576126099, 0.8157480359077454]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 22.0, 16.0, 16.0, 17.0, 21.0, 21.0, 22.0, 32.0, 33.0, 38.0, 30.0, 41.0, 33.0, 30.0, 41.0, 37.0, 38.0, 44.0, 34.0, 37.0, 34.0, 38.0, 27.0, 33.0, 22.0, 24.0, 24.0, 30.0, 16.0, 11.0, 21.0, 10.0, 13.0, 5.0, 11.0, 5.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.529818594455719, -0.511722207069397, -0.49362581968307495, -0.47552940249443054, -0.4574330151081085, -0.4393366277217865, -0.4212402105331421, -0.40314382314682007, -0.38504743576049805, -0.366951048374176, -0.348854660987854, -0.3307582437992096, -0.3126618564128876, -0.29456546902656555, -0.27646905183792114, -0.2583726644515991, -0.2402762770652771, -0.22217988967895508, -0.20408348739147186, -0.18598708510398865, -0.16789069771766663, -0.1497943103313446, -0.1316979080438614, -0.11360150575637817, -0.09550511837005615, -0.07740872353315353, -0.059312328696250916, -0.0412159338593483, -0.02311953902244568, -0.00502314418554306, 0.013073250651359558, 0.031169652938842773, 0.04926598072052002, 0.06736237555742264, 0.08545877039432526, 0.10355516523122787, 0.1216515600681305, 0.13974794745445251, 0.15784434974193573, 0.17594075202941895, 0.19403713941574097, 0.212133526802063, 0.2302299290895462, 0.24832633137702942, 0.26642271876335144, 0.28451910614967346, 0.30261552333831787, 0.3207119107246399, 0.3388082981109619, 0.35690468549728394, 0.37500107288360596, 0.39309749007225037, 0.4111938774585724, 0.4292902648448944, 0.4473866820335388, 0.46548306941986084, 0.48357945680618286, 0.5016758441925049, 0.5197722315788269, 0.5378686189651489, 0.5559650659561157, 0.5740614533424377, 0.5921578407287598, 0.6102542281150818, 0.6283506155014038]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 7.0, 21.0, 17.0, 24.0, 64.0, 69.0, 115.0, 176.0, 292.0, 554.0, 1079.0, 2232.0, 4918.0, 12375.0, 34794.0, 111923.0, 323503.0, 355895.0, 134446.0, 40860.0, 14307.0, 5687.0, 2476.0, 1189.0, 628.0, 352.0, 201.0, 100.0, 68.0, 52.0, 29.0, 16.0, 19.0, 7.0, 11.0, 9.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.290771484375, -0.2822380065917969, -0.27370452880859375, -0.2651710510253906, -0.2566375732421875, -0.24810409545898438, -0.23957061767578125, -0.23103713989257812, -0.222503662109375, -0.21397018432617188, -0.20543670654296875, -0.19690322875976562, -0.1883697509765625, -0.17983627319335938, -0.17130279541015625, -0.16276931762695312, -0.15423583984375, -0.14570236206054688, -0.13716888427734375, -0.12863540649414062, -0.1201019287109375, -0.11156845092773438, -0.10303497314453125, -0.09450149536132812, -0.085968017578125, -0.07743453979492188, -0.06890106201171875, -0.060367584228515625, -0.0518341064453125, -0.043300628662109375, -0.03476715087890625, -0.026233673095703125, -0.0177001953125, -0.009166717529296875, -0.00063323974609375, 0.007900238037109375, 0.0164337158203125, 0.024967193603515625, 0.03350067138671875, 0.042034149169921875, 0.050567626953125, 0.059101104736328125, 0.06763458251953125, 0.07616806030273438, 0.0847015380859375, 0.09323501586914062, 0.10176849365234375, 0.11030197143554688, 0.11883544921875, 0.12736892700195312, 0.13590240478515625, 0.14443588256835938, 0.1529693603515625, 0.16150283813476562, 0.17003631591796875, 0.17856979370117188, 0.187103271484375, 0.19563674926757812, 0.20417022705078125, 0.21270370483398438, 0.2212371826171875, 0.22977066040039062, 0.23830413818359375, 0.24683761596679688, 0.25537109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 12.0, 11.0, 16.0, 22.0, 32.0, 22.0, 35.0, 44.0, 49.0, 60.0, 52.0, 59.0, 53.0, 55.0, 67.0, 44.0, 42.0, 48.0, 52.0, 34.0, 34.0, 25.0, 24.0, 22.0, 23.0, 16.0, 9.0, 8.0, 3.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5341796875, -0.518310546875, -0.50244140625, -0.486572265625, -0.470703125, -0.454833984375, -0.43896484375, -0.423095703125, -0.4072265625, -0.391357421875, -0.37548828125, -0.359619140625, -0.34375, -0.327880859375, -0.31201171875, -0.296142578125, -0.2802734375, -0.264404296875, -0.24853515625, -0.232666015625, -0.216796875, -0.200927734375, -0.18505859375, -0.169189453125, -0.1533203125, -0.137451171875, -0.12158203125, -0.105712890625, -0.08984375, -0.073974609375, -0.05810546875, -0.042236328125, -0.0263671875, -0.010498046875, 0.00537109375, 0.021240234375, 0.037109375, 0.052978515625, 0.06884765625, 0.084716796875, 0.1005859375, 0.116455078125, 0.13232421875, 0.148193359375, 0.1640625, 0.179931640625, 0.19580078125, 0.211669921875, 0.2275390625, 0.243408203125, 0.25927734375, 0.275146484375, 0.291015625, 0.306884765625, 0.32275390625, 0.338623046875, 0.3544921875, 0.370361328125, 0.38623046875, 0.402099609375, 0.41796875, 0.433837890625, 0.44970703125, 0.465576171875, 0.4814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 11.0, 16.0, 16.0, 29.0, 32.0, 60.0, 65.0, 101.0, 141.0, 232.0, 358.0, 666.0, 1180.0, 2272.0, 4653.0, 9945.0, 23500.0, 60956.0, 159110.0, 299690.0, 273060.0, 128722.0, 48323.0, 18990.0, 8138.0, 3870.0, 1836.0, 1037.0, 559.0, 353.0, 206.0, 108.0, 79.0, 53.0, 48.0, 32.0, 30.0, 24.0, 8.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.226806640625, -0.22048568725585938, -0.21416473388671875, -0.20784378051757812, -0.2015228271484375, -0.19520187377929688, -0.18888092041015625, -0.18255996704101562, -0.176239013671875, -0.16991806030273438, -0.16359710693359375, -0.15727615356445312, -0.1509552001953125, -0.14463424682617188, -0.13831329345703125, -0.13199234008789062, -0.12567138671875, -0.11935043334960938, -0.11302947998046875, -0.10670852661132812, -0.1003875732421875, -0.09406661987304688, -0.08774566650390625, -0.08142471313476562, -0.075103759765625, -0.06878280639648438, -0.06246185302734375, -0.056140899658203125, -0.0498199462890625, -0.043498992919921875, -0.03717803955078125, -0.030857086181640625, -0.0245361328125, -0.018215179443359375, -0.01189422607421875, -0.005573272705078125, 0.0007476806640625, 0.007068634033203125, 0.01338958740234375, 0.019710540771484375, 0.026031494140625, 0.032352447509765625, 0.03867340087890625, 0.044994354248046875, 0.0513153076171875, 0.057636260986328125, 0.06395721435546875, 0.07027816772460938, 0.07659912109375, 0.08292007446289062, 0.08924102783203125, 0.09556198120117188, 0.1018829345703125, 0.10820388793945312, 0.11452484130859375, 0.12084579467773438, 0.127166748046875, 0.13348770141601562, 0.13980865478515625, 0.14612960815429688, 0.1524505615234375, 0.15877151489257812, 0.16509246826171875, 0.17141342163085938, 0.177734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 21.0, 13.0, 27.0, 24.0, 23.0, 28.0, 27.0, 28.0, 29.0, 50.0, 43.0, 38.0, 45.0, 55.0, 35.0, 43.0, 39.0, 50.0, 32.0, 41.0, 39.0, 39.0, 30.0, 24.0, 26.0, 23.0, 26.0, 18.0, 8.0, 8.0, 6.0, 5.0, 8.0, 6.0, 6.0, 5.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75634765625, -0.73394775390625, -0.7115478515625, -0.68914794921875, -0.666748046875, -0.64434814453125, -0.6219482421875, -0.59954833984375, -0.5771484375, -0.55474853515625, -0.5323486328125, -0.50994873046875, -0.487548828125, -0.46514892578125, -0.4427490234375, -0.42034912109375, -0.39794921875, -0.37554931640625, -0.3531494140625, -0.33074951171875, -0.308349609375, -0.28594970703125, -0.2635498046875, -0.24114990234375, -0.21875, -0.19635009765625, -0.1739501953125, -0.15155029296875, -0.129150390625, -0.10675048828125, -0.0843505859375, -0.06195068359375, -0.03955078125, -0.01715087890625, 0.0052490234375, 0.02764892578125, 0.050048828125, 0.07244873046875, 0.0948486328125, 0.11724853515625, 0.1396484375, 0.16204833984375, 0.1844482421875, 0.20684814453125, 0.229248046875, 0.25164794921875, 0.2740478515625, 0.29644775390625, 0.31884765625, 0.34124755859375, 0.3636474609375, 0.38604736328125, 0.408447265625, 0.43084716796875, 0.4532470703125, 0.47564697265625, 0.498046875, 0.52044677734375, 0.5428466796875, 0.56524658203125, 0.587646484375, 0.61004638671875, 0.6324462890625, 0.65484619140625, 0.67724609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 16.0, 19.0, 27.0, 40.0, 35.0, 75.0, 119.0, 159.0, 280.0, 435.0, 753.0, 1406.0, 2595.0, 5296.0, 11821.0, 29889.0, 86641.0, 258426.0, 381891.0, 174126.0, 56296.0, 20449.0, 8735.0, 4094.0, 2106.0, 1146.0, 599.0, 368.0, 248.0, 134.0, 101.0, 48.0, 47.0, 35.0, 22.0, 16.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.080078125, -0.07752037048339844, -0.07496261596679688, -0.07240486145019531, -0.06984710693359375, -0.06728935241699219, -0.06473159790039062, -0.06217384338378906, -0.0596160888671875, -0.05705833435058594, -0.054500579833984375, -0.05194282531738281, -0.04938507080078125, -0.04682731628417969, -0.044269561767578125, -0.04171180725097656, -0.039154052734375, -0.03659629821777344, -0.034038543701171875, -0.03148078918457031, -0.02892303466796875, -0.026365280151367188, -0.023807525634765625, -0.021249771118164062, -0.0186920166015625, -0.016134262084960938, -0.013576507568359375, -0.011018753051757812, -0.00846099853515625, -0.0059032440185546875, -0.003345489501953125, -0.0007877349853515625, 0.00177001953125, 0.0043277740478515625, 0.006885528564453125, 0.009443283081054688, 0.01200103759765625, 0.014558792114257812, 0.017116546630859375, 0.019674301147460938, 0.0222320556640625, 0.024789810180664062, 0.027347564697265625, 0.029905319213867188, 0.03246307373046875, 0.03502082824707031, 0.037578582763671875, 0.04013633728027344, 0.042694091796875, 0.04525184631347656, 0.047809600830078125, 0.05036735534667969, 0.05292510986328125, 0.05548286437988281, 0.058040618896484375, 0.06059837341308594, 0.0631561279296875, 0.06571388244628906, 0.06827163696289062, 0.07082939147949219, 0.07338714599609375, 0.07594490051269531, 0.07850265502929688, 0.08106040954589844, 0.0836181640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 22.0, 27.0, 33.0, 48.0, 58.0, 64.0, 80.0, 82.0, 102.0, 87.0, 78.0, 74.0, 63.0, 40.0, 30.0, 19.0, 9.0, 10.0, 11.0, 4.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.984065890312195e-05, -4.824250936508179e-05, -4.6644359827041626e-05, -4.5046210289001465e-05, -4.3448060750961304e-05, -4.184991121292114e-05, -4.025176167488098e-05, -3.865361213684082e-05, -3.705546259880066e-05, -3.54573130607605e-05, -3.385916352272034e-05, -3.2261013984680176e-05, -3.0662864446640015e-05, -2.9064714908599854e-05, -2.7466565370559692e-05, -2.586841583251953e-05, -2.427026629447937e-05, -2.267211675643921e-05, -2.1073967218399048e-05, -1.9475817680358887e-05, -1.7877668142318726e-05, -1.6279518604278564e-05, -1.4681369066238403e-05, -1.3083219528198242e-05, -1.1485069990158081e-05, -9.88692045211792e-06, -8.288770914077759e-06, -6.690621376037598e-06, -5.0924718379974365e-06, -3.4943222999572754e-06, -1.8961727619171143e-06, -2.980232238769531e-07, 1.300126314163208e-06, 2.898275852203369e-06, 4.49642539024353e-06, 6.094574928283691e-06, 7.692724466323853e-06, 9.290874004364014e-06, 1.0889023542404175e-05, 1.2487173080444336e-05, 1.4085322618484497e-05, 1.5683472156524658e-05, 1.728162169456482e-05, 1.887977123260498e-05, 2.047792077064514e-05, 2.2076070308685303e-05, 2.3674219846725464e-05, 2.5272369384765625e-05, 2.6870518922805786e-05, 2.8468668460845947e-05, 3.006681799888611e-05, 3.166496753692627e-05, 3.326311707496643e-05, 3.486126661300659e-05, 3.645941615104675e-05, 3.8057565689086914e-05, 3.9655715227127075e-05, 4.1253864765167236e-05, 4.28520143032074e-05, 4.445016384124756e-05, 4.604831337928772e-05, 4.764646291732788e-05, 4.924461245536804e-05, 5.08427619934082e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 12.0, 17.0, 25.0, 56.0, 160.0, 638.0, 7256.0, 411791.0, 617014.0, 10438.0, 833.0, 157.0, 59.0, 36.0, 19.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4028167724609375, -0.391326904296875, -0.3798370361328125, -0.36834716796875, -0.3568572998046875, -0.345367431640625, -0.3338775634765625, -0.3223876953125, -0.3108978271484375, -0.299407958984375, -0.2879180908203125, -0.27642822265625, -0.2649383544921875, -0.253448486328125, -0.2419586181640625, -0.23046875, -0.2189788818359375, -0.207489013671875, -0.1959991455078125, -0.18450927734375, -0.1730194091796875, -0.161529541015625, -0.1500396728515625, -0.1385498046875, -0.1270599365234375, -0.115570068359375, -0.1040802001953125, -0.09259033203125, -0.0811004638671875, -0.069610595703125, -0.0581207275390625, -0.046630859375, -0.0351409912109375, -0.023651123046875, -0.0121612548828125, -0.00067138671875, 0.0108184814453125, 0.022308349609375, 0.0337982177734375, 0.0452880859375, 0.0567779541015625, 0.068267822265625, 0.0797576904296875, 0.09124755859375, 0.1027374267578125, 0.114227294921875, 0.1257171630859375, 0.13720703125, 0.1486968994140625, 0.160186767578125, 0.1716766357421875, 0.18316650390625, 0.1946563720703125, 0.206146240234375, 0.2176361083984375, 0.2291259765625, 0.2406158447265625, 0.252105712890625, 0.2635955810546875, 0.27508544921875, 0.2865753173828125, 0.298065185546875, 0.3095550537109375, 0.321044921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 10.0, 11.0, 13.0, 17.0, 17.0, 31.0, 15.0, 25.0, 35.0, 40.0, 42.0, 39.0, 51.0, 37.0, 44.0, 53.0, 51.0, 52.0, 55.0, 48.0, 39.0, 36.0, 32.0, 16.0, 27.0, 24.0, 16.0, 17.0, 13.0, 12.0, 11.0, 4.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0], "bins": [-0.0187530517578125, -0.0182039737701416, -0.017654895782470703, -0.017105817794799805, -0.016556739807128906, -0.016007661819458008, -0.01545858383178711, -0.014909505844116211, -0.014360427856445312, -0.013811349868774414, -0.013262271881103516, -0.012713193893432617, -0.012164115905761719, -0.01161503791809082, -0.011065959930419922, -0.010516881942749023, -0.009967803955078125, -0.009418725967407227, -0.008869647979736328, -0.00832056999206543, -0.007771492004394531, -0.007222414016723633, -0.006673336029052734, -0.006124258041381836, -0.0055751800537109375, -0.005026102066040039, -0.004477024078369141, -0.003927946090698242, -0.0033788681030273438, -0.0028297901153564453, -0.002280712127685547, -0.0017316341400146484, -0.00118255615234375, -0.0006334781646728516, -8.440017700195312e-05, 0.0004646778106689453, 0.0010137557983398438, 0.0015628337860107422, 0.0021119117736816406, 0.002660989761352539, 0.0032100677490234375, 0.003759145736694336, 0.004308223724365234, 0.004857301712036133, 0.005406379699707031, 0.00595545768737793, 0.006504535675048828, 0.0070536136627197266, 0.007602691650390625, 0.008151769638061523, 0.008700847625732422, 0.00924992561340332, 0.009799003601074219, 0.010348081588745117, 0.010897159576416016, 0.011446237564086914, 0.011995315551757812, 0.012544393539428711, 0.01309347152709961, 0.013642549514770508, 0.014191627502441406, 0.014740705490112305, 0.015289783477783203, 0.0158388614654541, 0.016387939453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 7.0, 5.0, 7.0, 10.0, 14.0, 17.0, 31.0, 42.0, 67.0, 54.0, 73.0, 91.0, 102.0, 95.0, 91.0, 70.0, 62.0, 47.0, 29.0, 29.0, 14.0, 12.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7695910930633545, -0.7489527463912964, -0.7283143401145935, -0.7076759934425354, -0.6870375871658325, -0.6663992404937744, -0.6457608342170715, -0.6251224875450134, -0.6044840812683105, -0.5838457345962524, -0.5632073283195496, -0.5425689816474915, -0.5219305753707886, -0.5012922286987305, -0.48065385222435, -0.4600154757499695, -0.4393771290779114, -0.4187387526035309, -0.3981003761291504, -0.3774619996547699, -0.3568236231803894, -0.3361852765083313, -0.3155469000339508, -0.2949085235595703, -0.2742701470851898, -0.2536317706108093, -0.23299339413642883, -0.21235503256320953, -0.19171665608882904, -0.17107827961444855, -0.15043991804122925, -0.12980154156684875, -0.10916322469711304, -0.08852484822273254, -0.06788647919893265, -0.04724810644984245, -0.02660973370075226, -0.005971357226371765, 0.014667011797428131, 0.03530538082122803, 0.05594375729560852, 0.07658213376998901, 0.09722050279378891, 0.1178588718175888, 0.1384972482919693, 0.1591356247663498, 0.1797739863395691, 0.20041236281394958, 0.22105073928833008, 0.24168911576271057, 0.26232749223709106, 0.28296586871147156, 0.30360424518585205, 0.32424259185791016, 0.34488096833229065, 0.36551934480667114, 0.38615772128105164, 0.40679609775543213, 0.4274344742298126, 0.4480728507041931, 0.4687111973762512, 0.4893496036529541, 0.5099879503250122, 0.5306262969970703, 0.5512647032737732]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 9.0, 9.0, 16.0, 20.0, 19.0, 19.0, 25.0, 27.0, 42.0, 36.0, 34.0, 49.0, 39.0, 52.0, 38.0, 55.0, 53.0, 42.0, 56.0, 32.0, 39.0, 37.0, 34.0, 31.0, 27.0, 30.0, 21.0, 15.0, 16.0, 12.0, 8.0, 15.0, 8.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.4578585922718048, -0.4452306628227234, -0.43260273337364197, -0.41997480392456055, -0.40734684467315674, -0.3947189152240753, -0.3820909857749939, -0.3694630563259125, -0.35683512687683105, -0.34420719742774963, -0.3315792679786682, -0.3189513087272644, -0.306323379278183, -0.29369544982910156, -0.28106752038002014, -0.2684395909309387, -0.2558116316795349, -0.2431837022304535, -0.23055575788021088, -0.21792782843112946, -0.20529988408088684, -0.19267195463180542, -0.180044025182724, -0.16741609573364258, -0.15478815138339996, -0.14216022193431854, -0.12953227758407593, -0.1169043481349945, -0.10427641123533249, -0.09164847433567047, -0.07902054488658905, -0.06639260798692703, -0.05376464128494263, -0.04113670438528061, -0.02850877121090889, -0.01588083803653717, -0.0032529011368751526, 0.009375035762786865, 0.022002965211868286, 0.034630902111530304, 0.04725883901119232, 0.05988677591085434, 0.07251471281051636, 0.08514264225959778, 0.0977705791592598, 0.11039851605892181, 0.12302644550800323, 0.13565438985824585, 0.14828231930732727, 0.1609102487564087, 0.1735381931066513, 0.18616612255573273, 0.19879406690597534, 0.21142199635505676, 0.22404992580413818, 0.2366778552532196, 0.24930579960346222, 0.26193374395370483, 0.27456167340278625, 0.2871896028518677, 0.2998175323009491, 0.3124454617500305, 0.3250734210014343, 0.33770135045051575, 0.35032927989959717]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 22.0, 25.0, 32.0, 46.0, 80.0, 172.0, 323.0, 649.0, 1437.0, 3674.0, 10147.0, 34505.0, 165257.0, 575628.0, 198774.0, 39231.0, 11307.0, 4126.0, 1654.0, 698.0, 348.0, 164.0, 101.0, 48.0, 31.0, 17.0, 17.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55078125, -0.5327529907226562, -0.5147247314453125, -0.49669647216796875, -0.478668212890625, -0.46063995361328125, -0.4426116943359375, -0.42458343505859375, -0.40655517578125, -0.38852691650390625, -0.3704986572265625, -0.35247039794921875, -0.334442138671875, -0.31641387939453125, -0.2983856201171875, -0.28035736083984375, -0.2623291015625, -0.24430084228515625, -0.2262725830078125, -0.20824432373046875, -0.190216064453125, -0.17218780517578125, -0.1541595458984375, -0.13613128662109375, -0.11810302734375, -0.10007476806640625, -0.0820465087890625, -0.06401824951171875, -0.045989990234375, -0.02796173095703125, -0.0099334716796875, 0.00809478759765625, 0.026123046875, 0.04415130615234375, 0.0621795654296875, 0.08020782470703125, 0.098236083984375, 0.11626434326171875, 0.1342926025390625, 0.15232086181640625, 0.17034912109375, 0.18837738037109375, 0.2064056396484375, 0.22443389892578125, 0.242462158203125, 0.26049041748046875, 0.2785186767578125, 0.29654693603515625, 0.3145751953125, 0.33260345458984375, 0.3506317138671875, 0.36865997314453125, 0.386688232421875, 0.40471649169921875, 0.4227447509765625, 0.44077301025390625, 0.45880126953125, 0.47682952880859375, 0.4948577880859375, 0.5128860473632812, 0.530914306640625, 0.5489425659179688, 0.5669708251953125, 0.5849990844726562, 0.60302734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 12.0, 3.0, 8.0, 8.0, 26.0, 12.0, 24.0, 35.0, 23.0, 33.0, 32.0, 35.0, 47.0, 50.0, 57.0, 43.0, 61.0, 51.0, 46.0, 58.0, 37.0, 35.0, 45.0, 35.0, 27.0, 26.0, 19.0, 20.0, 20.0, 9.0, 6.0, 17.0, 11.0, 10.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0], "bins": [-1.0927734375, -1.0632858276367188, -1.0337982177734375, -1.0043106079101562, -0.974822998046875, -0.9453353881835938, -0.9158477783203125, -0.8863601684570312, -0.85687255859375, -0.8273849487304688, -0.7978973388671875, -0.7684097290039062, -0.738922119140625, -0.7094345092773438, -0.6799468994140625, -0.6504592895507812, -0.6209716796875, -0.5914840698242188, -0.5619964599609375, -0.5325088500976562, -0.503021240234375, -0.47353363037109375, -0.4440460205078125, -0.41455841064453125, -0.38507080078125, -0.35558319091796875, -0.3260955810546875, -0.29660797119140625, -0.267120361328125, -0.23763275146484375, -0.2081451416015625, -0.17865753173828125, -0.149169921875, -0.11968231201171875, -0.0901947021484375, -0.06070709228515625, -0.031219482421875, -0.00173187255859375, 0.0277557373046875, 0.05724334716796875, 0.08673095703125, 0.11621856689453125, 0.1457061767578125, 0.17519378662109375, 0.204681396484375, 0.23416900634765625, 0.2636566162109375, 0.29314422607421875, 0.3226318359375, 0.35211944580078125, 0.3816070556640625, 0.41109466552734375, 0.440582275390625, 0.47006988525390625, 0.4995574951171875, 0.5290451049804688, 0.55853271484375, 0.5880203247070312, 0.6175079345703125, 0.6469955444335938, 0.676483154296875, 0.7059707641601562, 0.7354583740234375, 0.7649459838867188, 0.79443359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 8.0, 19.0, 12.0, 15.0, 17.0, 11.0, 22.0, 17.0, 23.0, 22.0, 30.0, 34.0, 42.0, 39.0, 53.0, 95.0, 464.0, 41114.0, 1003683.0, 2213.0, 167.0, 69.0, 69.0, 45.0, 34.0, 30.0, 25.0, 18.0, 21.0, 19.0, 16.0, 21.0, 8.0, 10.0, 9.0, 9.0, 3.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.4453125, -3.3350830078125, -3.224853515625, -3.1146240234375, -3.00439453125, -2.8941650390625, -2.783935546875, -2.6737060546875, -2.5634765625, -2.4532470703125, -2.343017578125, -2.2327880859375, -2.12255859375, -2.0123291015625, -1.902099609375, -1.7918701171875, -1.681640625, -1.5714111328125, -1.461181640625, -1.3509521484375, -1.24072265625, -1.1304931640625, -1.020263671875, -0.9100341796875, -0.7998046875, -0.6895751953125, -0.579345703125, -0.4691162109375, -0.35888671875, -0.2486572265625, -0.138427734375, -0.0281982421875, 0.08203125, 0.1922607421875, 0.302490234375, 0.4127197265625, 0.52294921875, 0.6331787109375, 0.743408203125, 0.8536376953125, 0.9638671875, 1.0740966796875, 1.184326171875, 1.2945556640625, 1.40478515625, 1.5150146484375, 1.625244140625, 1.7354736328125, 1.845703125, 1.9559326171875, 2.066162109375, 2.1763916015625, 2.28662109375, 2.3968505859375, 2.507080078125, 2.6173095703125, 2.7275390625, 2.8377685546875, 2.947998046875, 3.0582275390625, 3.16845703125, 3.2786865234375, 3.388916015625, 3.4991455078125, 3.609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 16.0, 10.0, 10.0, 12.0, 25.0, 13.0, 21.0, 24.0, 29.0, 24.0, 32.0, 30.0, 52.0, 29.0, 33.0, 35.0, 48.0, 46.0, 30.0, 48.0, 29.0, 40.0, 45.0, 39.0, 38.0, 29.0, 27.0, 19.0, 18.0, 24.0, 12.0, 12.0, 13.0, 16.0, 6.0, 8.0, 3.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.747314453125, -0.72216796875, -0.697021484375, -0.671875, -0.646728515625, -0.62158203125, -0.596435546875, -0.5712890625, -0.546142578125, -0.52099609375, -0.495849609375, -0.470703125, -0.445556640625, -0.42041015625, -0.395263671875, -0.3701171875, -0.344970703125, -0.31982421875, -0.294677734375, -0.26953125, -0.244384765625, -0.21923828125, -0.194091796875, -0.1689453125, -0.143798828125, -0.11865234375, -0.093505859375, -0.068359375, -0.043212890625, -0.01806640625, 0.007080078125, 0.0322265625, 0.057373046875, 0.08251953125, 0.107666015625, 0.1328125, 0.157958984375, 0.18310546875, 0.208251953125, 0.2333984375, 0.258544921875, 0.28369140625, 0.308837890625, 0.333984375, 0.359130859375, 0.38427734375, 0.409423828125, 0.4345703125, 0.459716796875, 0.48486328125, 0.510009765625, 0.53515625, 0.560302734375, 0.58544921875, 0.610595703125, 0.6357421875, 0.660888671875, 0.68603515625, 0.711181640625, 0.736328125, 0.761474609375, 0.78662109375, 0.811767578125, 0.8369140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 5.0, 2.0, 7.0, 4.0, 8.0, 12.0, 21.0, 50.0, 71.0, 129.0, 336.0, 1209.0, 8953.0, 267491.0, 745744.0, 21480.0, 2117.0, 505.0, 204.0, 86.0, 49.0, 24.0, 21.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.62109375, -0.6063613891601562, -0.5916290283203125, -0.5768966674804688, -0.562164306640625, -0.5474319458007812, -0.5326995849609375, -0.5179672241210938, -0.50323486328125, -0.48850250244140625, -0.4737701416015625, -0.45903778076171875, -0.444305419921875, -0.42957305908203125, -0.4148406982421875, -0.40010833740234375, -0.3853759765625, -0.37064361572265625, -0.3559112548828125, -0.34117889404296875, -0.326446533203125, -0.31171417236328125, -0.2969818115234375, -0.28224945068359375, -0.26751708984375, -0.25278472900390625, -0.2380523681640625, -0.22332000732421875, -0.208587646484375, -0.19385528564453125, -0.1791229248046875, -0.16439056396484375, -0.149658203125, -0.13492584228515625, -0.1201934814453125, -0.10546112060546875, -0.090728759765625, -0.07599639892578125, -0.0612640380859375, -0.04653167724609375, -0.03179931640625, -0.01706695556640625, -0.0023345947265625, 0.01239776611328125, 0.027130126953125, 0.04186248779296875, 0.0565948486328125, 0.07132720947265625, 0.0860595703125, 0.10079193115234375, 0.1155242919921875, 0.13025665283203125, 0.144989013671875, 0.15972137451171875, 0.1744537353515625, 0.18918609619140625, 0.20391845703125, 0.21865081787109375, 0.2333831787109375, 0.24811553955078125, 0.262847900390625, 0.27758026123046875, 0.2923126220703125, 0.30704498291015625, 0.32177734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 19.0, 37.0, 34.0, 45.0, 59.0, 98.0, 105.0, 131.0, 111.0, 103.0, 69.0, 43.0, 35.0, 24.0, 16.0, 14.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.473592758178711e-05, -2.367887645959854e-05, -2.2621825337409973e-05, -2.1564774215221405e-05, -2.0507723093032837e-05, -1.945067197084427e-05, -1.83936208486557e-05, -1.7336569726467133e-05, -1.6279518604278564e-05, -1.5222467482089996e-05, -1.4165416359901428e-05, -1.310836523771286e-05, -1.2051314115524292e-05, -1.0994262993335724e-05, -9.937211871147156e-06, -8.880160748958588e-06, -7.82310962677002e-06, -6.766058504581451e-06, -5.709007382392883e-06, -4.651956260204315e-06, -3.594905138015747e-06, -2.537854015827179e-06, -1.4808028936386108e-06, -4.237517714500427e-07, 6.332993507385254e-07, 1.6903504729270935e-06, 2.7474015951156616e-06, 3.8044527173042297e-06, 4.861503839492798e-06, 5.918554961681366e-06, 6.975606083869934e-06, 8.032657206058502e-06, 9.08970832824707e-06, 1.0146759450435638e-05, 1.1203810572624207e-05, 1.2260861694812775e-05, 1.3317912817001343e-05, 1.4374963939189911e-05, 1.543201506137848e-05, 1.6489066183567047e-05, 1.7546117305755615e-05, 1.8603168427944183e-05, 1.966021955013275e-05, 2.071727067232132e-05, 2.1774321794509888e-05, 2.2831372916698456e-05, 2.3888424038887024e-05, 2.4945475161075592e-05, 2.600252628326416e-05, 2.7059577405452728e-05, 2.8116628527641296e-05, 2.9173679649829865e-05, 3.0230730772018433e-05, 3.1287781894207e-05, 3.234483301639557e-05, 3.340188413858414e-05, 3.4458935260772705e-05, 3.551598638296127e-05, 3.657303750514984e-05, 3.763008862733841e-05, 3.868713974952698e-05, 3.9744190871715546e-05, 4.0801241993904114e-05, 4.185829311609268e-05, 4.291534423828125e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 2.0, 7.0, 11.0, 9.0, 14.0, 11.0, 26.0, 31.0, 58.0, 71.0, 115.0, 232.0, 354.0, 794.0, 1570.0, 3912.0, 11426.0, 46652.0, 276876.0, 559407.0, 113028.0, 22418.0, 6582.0, 2418.0, 1137.0, 581.0, 308.0, 184.0, 100.0, 54.0, 46.0, 34.0, 16.0, 14.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.19580078125, -0.18973159790039062, -0.18366241455078125, -0.17759323120117188, -0.1715240478515625, -0.16545486450195312, -0.15938568115234375, -0.15331649780273438, -0.147247314453125, -0.14117813110351562, -0.13510894775390625, -0.12903976440429688, -0.1229705810546875, -0.11690139770507812, -0.11083221435546875, -0.10476303100585938, -0.09869384765625, -0.09262466430664062, -0.08655548095703125, -0.08048629760742188, -0.0744171142578125, -0.06834793090820312, -0.06227874755859375, -0.056209564208984375, -0.050140380859375, -0.044071197509765625, -0.03800201416015625, -0.031932830810546875, -0.0258636474609375, -0.019794464111328125, -0.01372528076171875, -0.007656097412109375, -0.0015869140625, 0.004482269287109375, 0.01055145263671875, 0.016620635986328125, 0.0226898193359375, 0.028759002685546875, 0.03482818603515625, 0.040897369384765625, 0.046966552734375, 0.053035736083984375, 0.05910491943359375, 0.06517410278320312, 0.0712432861328125, 0.07731246948242188, 0.08338165283203125, 0.08945083618164062, 0.09552001953125, 0.10158920288085938, 0.10765838623046875, 0.11372756958007812, 0.1197967529296875, 0.12586593627929688, 0.13193511962890625, 0.13800430297851562, 0.144073486328125, 0.15014266967773438, 0.15621185302734375, 0.16228103637695312, 0.1683502197265625, 0.17441940307617188, 0.18048858642578125, 0.18655776977539062, 0.192626953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 13.0, 10.0, 19.0, 23.0, 22.0, 30.0, 37.0, 59.0, 58.0, 77.0, 80.0, 85.0, 87.0, 69.0, 61.0, 60.0, 46.0, 39.0, 29.0, 18.0, 10.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.088623046875, -0.08614444732666016, -0.08366584777832031, -0.08118724822998047, -0.07870864868164062, -0.07623004913330078, -0.07375144958496094, -0.0712728500366211, -0.06879425048828125, -0.0663156509399414, -0.06383705139160156, -0.06135845184326172, -0.058879852294921875, -0.05640125274658203, -0.05392265319824219, -0.051444053649902344, -0.0489654541015625, -0.046486854553222656, -0.04400825500488281, -0.04152965545654297, -0.039051055908203125, -0.03657245635986328, -0.03409385681152344, -0.031615257263183594, -0.02913665771484375, -0.026658058166503906, -0.024179458618164062, -0.02170085906982422, -0.019222259521484375, -0.01674365997314453, -0.014265060424804688, -0.011786460876464844, -0.009307861328125, -0.006829261779785156, -0.0043506622314453125, -0.0018720626831054688, 0.000606536865234375, 0.0030851364135742188, 0.0055637359619140625, 0.008042335510253906, 0.01052093505859375, 0.012999534606933594, 0.015478134155273438, 0.01795673370361328, 0.020435333251953125, 0.02291393280029297, 0.025392532348632812, 0.027871131896972656, 0.0303497314453125, 0.032828330993652344, 0.03530693054199219, 0.03778553009033203, 0.040264129638671875, 0.04274272918701172, 0.04522132873535156, 0.047699928283691406, 0.05017852783203125, 0.052657127380371094, 0.05513572692871094, 0.05761432647705078, 0.060092926025390625, 0.06257152557373047, 0.06505012512207031, 0.06752872467041016, 0.07000732421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 30.0, 65.0, 186.0, 317.0, 270.0, 96.0, 30.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.866697072982788, -1.718356966972351, -1.5700169801712036, -1.4216768741607666, -1.2733368873596191, -1.1249967813491821, -0.9766566753387451, -0.8283166885375977, -0.6799765825271606, -0.5316365361213684, -0.3832964599132538, -0.23495638370513916, -0.08661633729934692, 0.06172370910644531, 0.21006381511688232, 0.3584038019180298, 0.5067439079284668, 0.655083954334259, 0.8034240007400513, 0.9517641067504883, 1.1001040935516357, 1.2484441995620728, 1.3967843055725098, 1.5451242923736572, 1.6934643983840942, 1.8418045043945312, 1.9901444911956787, 2.138484477996826, 2.2868247032165527, 2.4351646900177, 2.5835046768188477, 2.731844902038574, 2.8801846504211426, 3.02852463722229, 3.1768648624420166, 3.325204849243164, 3.4735448360443115, 3.621884822845459, 3.7702250480651855, 3.918565034866333, 4.0669050216674805, 4.215245246887207, 4.363584995269775, 4.511925220489502, 4.6602654457092285, 4.808605194091797, 4.956945419311523, 5.10528564453125, 5.253625869750977, 5.401966094970703, 5.5503058433532715, 5.698646068572998, 5.846986293792725, 5.995326042175293, 6.1436662673950195, 6.292006492614746, 6.4403462409973145, 6.588686466217041, 6.737026214599609, 6.885366439819336, 7.0337066650390625, 7.182046413421631, 7.330386638641357, 7.478726387023926, 7.627066612243652]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 21.0, 12.0, 18.0, 20.0, 30.0, 21.0, 32.0, 31.0, 37.0, 44.0, 36.0, 35.0, 40.0, 54.0, 44.0, 48.0, 36.0, 34.0, 49.0, 38.0, 22.0, 37.0, 28.0, 29.0, 33.0, 32.0, 22.0, 21.0, 20.0, 14.0, 3.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 7.0, 7.0, 1.0, 4.0], "bins": [-1.5705806016921997, -1.5312174558639526, -1.4918543100357056, -1.452491044998169, -1.4131278991699219, -1.3737647533416748, -1.3344016075134277, -1.2950384616851807, -1.2556753158569336, -1.2163121700286865, -1.1769490242004395, -1.1375857591629028, -1.0982226133346558, -1.0588594675064087, -1.0194963216781616, -0.9801331758499146, -0.9407699108123779, -0.9014067649841309, -0.862043559551239, -0.8226804137229919, -0.7833172082901001, -0.743954062461853, -0.704590916633606, -0.6652277708053589, -0.625864565372467, -0.58650141954422, -0.5471382141113281, -0.507775068283081, -0.4684118926525116, -0.42904871702194214, -0.38968557119369507, -0.3503223955631256, -0.3109592795372009, -0.27159610390663147, -0.2322329431772232, -0.19286978244781494, -0.15350660681724548, -0.11414343118667603, -0.07478027045726776, -0.0354171097278595, 0.003946065902709961, 0.04330923408269882, 0.08267240226268768, 0.12203557044267654, 0.1613987386226654, 0.20076191425323486, 0.24012507498264313, 0.2794882357120514, 0.31885141134262085, 0.3582145869731903, 0.39757776260375977, 0.43694090843200684, 0.4763040840625763, 0.5156672596931458, 0.5550304055213928, 0.5943936109542847, 0.6337567567825317, 0.6731199026107788, 0.7124831080436707, 0.7518462538719177, 0.7912094593048096, 0.8305726051330566, 0.8699357509613037, 0.9092988967895508, 0.9486621022224426]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 10.0, 20.0, 16.0, 25.0, 33.0, 37.0, 62.0, 100.0, 117.0, 211.0, 402.0, 755.0, 1639.0, 3867.0, 10631.0, 37752.0, 161126.0, 634401.0, 1622708.0, 1251378.0, 356881.0, 78183.0, 20939.0, 7156.0, 2875.0, 1278.0, 628.0, 354.0, 226.0, 123.0, 95.0, 52.0, 43.0, 30.0, 27.0, 10.0, 8.0, 18.0, 4.0, 9.0, 5.0, 6.0, 2.0, 4.0, 4.0, 2.0], "bins": [-0.77880859375, -0.7576370239257812, -0.7364654541015625, -0.7152938842773438, -0.694122314453125, -0.6729507446289062, -0.6517791748046875, -0.6306076049804688, -0.60943603515625, -0.5882644653320312, -0.5670928955078125, -0.5459213256835938, -0.524749755859375, -0.5035781860351562, -0.4824066162109375, -0.46123504638671875, -0.4400634765625, -0.41889190673828125, -0.3977203369140625, -0.37654876708984375, -0.355377197265625, -0.33420562744140625, -0.3130340576171875, -0.29186248779296875, -0.27069091796875, -0.24951934814453125, -0.2283477783203125, -0.20717620849609375, -0.186004638671875, -0.16483306884765625, -0.1436614990234375, -0.12248992919921875, -0.101318359375, -0.08014678955078125, -0.0589752197265625, -0.03780364990234375, -0.016632080078125, 0.00453948974609375, 0.0257110595703125, 0.04688262939453125, 0.06805419921875, 0.08922576904296875, 0.1103973388671875, 0.13156890869140625, 0.152740478515625, 0.17391204833984375, 0.1950836181640625, 0.21625518798828125, 0.2374267578125, 0.25859832763671875, 0.2797698974609375, 0.30094146728515625, 0.322113037109375, 0.34328460693359375, 0.3644561767578125, 0.38562774658203125, 0.40679931640625, 0.42797088623046875, 0.4491424560546875, 0.47031402587890625, 0.491485595703125, 0.5126571655273438, 0.5338287353515625, 0.5550003051757812, 0.576171875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 7.0, 10.0, 16.0, 21.0, 19.0, 18.0, 23.0, 26.0, 34.0, 25.0, 33.0, 41.0, 41.0, 40.0, 43.0, 39.0, 43.0, 40.0, 32.0, 41.0, 45.0, 43.0, 41.0, 34.0, 22.0, 24.0, 27.0, 31.0, 10.0, 11.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 7.0, 6.0, 4.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.48583221435546875, -0.4692230224609375, -0.45261383056640625, -0.436004638671875, -0.41939544677734375, -0.4027862548828125, -0.38617706298828125, -0.36956787109375, -0.35295867919921875, -0.3363494873046875, -0.31974029541015625, -0.303131103515625, -0.28652191162109375, -0.2699127197265625, -0.25330352783203125, -0.2366943359375, -0.22008514404296875, -0.2034759521484375, -0.18686676025390625, -0.170257568359375, -0.15364837646484375, -0.1370391845703125, -0.12042999267578125, -0.10382080078125, -0.08721160888671875, -0.0706024169921875, -0.05399322509765625, -0.037384033203125, -0.02077484130859375, -0.0041656494140625, 0.01244354248046875, 0.029052734375, 0.04566192626953125, 0.0622711181640625, 0.07888031005859375, 0.095489501953125, 0.11209869384765625, 0.1287078857421875, 0.14531707763671875, 0.16192626953125, 0.17853546142578125, 0.1951446533203125, 0.21175384521484375, 0.228363037109375, 0.24497222900390625, 0.2615814208984375, 0.27819061279296875, 0.2947998046875, 0.31140899658203125, 0.3280181884765625, 0.34462738037109375, 0.361236572265625, 0.37784576416015625, 0.3944549560546875, 0.41106414794921875, 0.42767333984375, 0.44428253173828125, 0.4608917236328125, 0.47750091552734375, 0.494110107421875, 0.5107192993164062, 0.5273284912109375, 0.5439376831054688, 0.560546875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 6.0, 2.0, 5.0, 7.0, 11.0, 14.0, 20.0, 24.0, 38.0, 95.0, 247.0, 887.0, 11384.0, 3667564.0, 508921.0, 4136.0, 553.0, 173.0, 77.0, 43.0, 26.0, 18.0, 7.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.881195068359375, -2.78778076171875, -2.694366455078125, -2.6009521484375, -2.507537841796875, -2.41412353515625, -2.320709228515625, -2.227294921875, -2.133880615234375, -2.04046630859375, -1.947052001953125, -1.8536376953125, -1.760223388671875, -1.66680908203125, -1.573394775390625, -1.47998046875, -1.386566162109375, -1.29315185546875, -1.199737548828125, -1.1063232421875, -1.012908935546875, -0.91949462890625, -0.826080322265625, -0.732666015625, -0.639251708984375, -0.54583740234375, -0.452423095703125, -0.3590087890625, -0.265594482421875, -0.17218017578125, -0.078765869140625, 0.0146484375, 0.108062744140625, 0.20147705078125, 0.294891357421875, 0.3883056640625, 0.481719970703125, 0.57513427734375, 0.668548583984375, 0.761962890625, 0.855377197265625, 0.94879150390625, 1.042205810546875, 1.1356201171875, 1.229034423828125, 1.32244873046875, 1.415863037109375, 1.50927734375, 1.602691650390625, 1.69610595703125, 1.789520263671875, 1.8829345703125, 1.976348876953125, 2.06976318359375, 2.163177490234375, 2.256591796875, 2.350006103515625, 2.44342041015625, 2.536834716796875, 2.6302490234375, 2.723663330078125, 2.81707763671875, 2.910491943359375, 3.00390625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 14.0, 14.0, 17.0, 32.0, 48.0, 62.0, 99.0, 150.0, 243.0, 348.0, 529.0, 624.0, 582.0, 435.0, 318.0, 187.0, 128.0, 79.0, 63.0, 33.0, 18.0, 10.0, 8.0, 8.0, 5.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.28562164306640625, -0.2753448486328125, -0.26506805419921875, -0.254791259765625, -0.24451446533203125, -0.2342376708984375, -0.22396087646484375, -0.21368408203125, -0.20340728759765625, -0.1931304931640625, -0.18285369873046875, -0.172576904296875, -0.16230010986328125, -0.1520233154296875, -0.14174652099609375, -0.1314697265625, -0.12119293212890625, -0.1109161376953125, -0.10063934326171875, -0.090362548828125, -0.08008575439453125, -0.0698089599609375, -0.05953216552734375, -0.04925537109375, -0.03897857666015625, -0.0287017822265625, -0.01842498779296875, -0.008148193359375, 0.00212860107421875, 0.0124053955078125, 0.02268218994140625, 0.032958984375, 0.04323577880859375, 0.0535125732421875, 0.06378936767578125, 0.074066162109375, 0.08434295654296875, 0.0946197509765625, 0.10489654541015625, 0.11517333984375, 0.12545013427734375, 0.1357269287109375, 0.14600372314453125, 0.156280517578125, 0.16655731201171875, 0.1768341064453125, 0.18711090087890625, 0.1973876953125, 0.20766448974609375, 0.2179412841796875, 0.22821807861328125, 0.238494873046875, 0.24877166748046875, 0.2590484619140625, 0.26932525634765625, 0.27960205078125, 0.28987884521484375, 0.3001556396484375, 0.31043243408203125, 0.320709228515625, 0.33098602294921875, 0.3412628173828125, 0.35153961181640625, 0.36181640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 8.0, 6.0, 8.0, 17.0, 10.0, 30.0, 46.0, 48.0, 55.0, 79.0, 79.0, 83.0, 92.0, 76.0, 81.0, 75.0, 49.0, 39.0, 34.0, 14.0, 23.0, 10.0, 7.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8511802554130554, -0.8184229731559753, -0.7856656312942505, -0.7529083490371704, -0.7201510071754456, -0.6873937249183655, -0.6546363830566406, -0.6218791007995605, -0.5891218185424805, -0.5563645362854004, -0.5236071944236755, -0.49084991216659546, -0.4580925703048706, -0.4253352880477905, -0.39257797598838806, -0.3598206639289856, -0.32706332206726074, -0.2943060100078583, -0.2615486979484558, -0.22879140079021454, -0.19603408873081207, -0.1632767766714096, -0.13051947951316833, -0.09776216745376587, -0.0650048553943634, -0.032247547060251236, 0.0005097612738609314, 0.0332670658826828, 0.06602437794208527, 0.09878169000148773, 0.131538987159729, 0.16429629921913147, 0.1970536708831787, 0.22981098294258118, 0.26256829500198364, 0.2953255772590637, 0.3280829191207886, 0.36084020137786865, 0.3935975134372711, 0.4263548254966736, 0.45911213755607605, 0.4918694496154785, 0.5246267318725586, 0.5573840737342834, 0.5901413559913635, 0.6228986978530884, 0.6556559801101685, 0.6884132623672485, 0.7211706042289734, 0.7539278864860535, 0.7866852283477783, 0.8194425106048584, 0.8521998524665833, 0.8849571347236633, 0.9177144765853882, 0.9504717588424683, 0.9832290410995483, 1.0159863233566284, 1.0487436056137085, 1.0815010070800781, 1.1142582893371582, 1.1470155715942383, 1.1797728538513184, 1.2125301361083984, 1.245287537574768]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 5.0, 13.0, 15.0, 14.0, 21.0, 18.0, 18.0, 30.0, 30.0, 20.0, 33.0, 36.0, 42.0, 35.0, 38.0, 29.0, 35.0, 42.0, 30.0, 33.0, 34.0, 31.0, 42.0, 39.0, 27.0, 42.0, 34.0, 28.0, 12.0, 26.0, 20.0, 14.0, 12.0, 10.0, 9.0, 15.0, 4.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.5185228586196899, -0.5017445087432861, -0.4849661886692047, -0.4681878387928009, -0.4514095187187195, -0.4346311688423157, -0.41785281896591187, -0.40107449889183044, -0.384296178817749, -0.3675178289413452, -0.3507395088672638, -0.33396115899086, -0.31718283891677856, -0.30040448904037476, -0.28362613916397095, -0.2668478190898895, -0.2500694692134857, -0.2332911342382431, -0.2165127992630005, -0.19973444938659668, -0.18295612931251526, -0.16617777943611145, -0.14939944446086884, -0.13262110948562622, -0.1158427745103836, -0.09906443953514099, -0.08228610455989838, -0.06550776213407516, -0.04872942715883255, -0.031951092183589935, -0.015172749757766724, 0.0016055852174758911, 0.018383920192718506, 0.03516225516796112, 0.051940593868494034, 0.06871893256902695, 0.08549726754426956, 0.10227560251951218, 0.11905394494533539, 0.135832279920578, 0.15261061489582062, 0.16938894987106323, 0.18616728484630585, 0.20294561982154846, 0.21972396969795227, 0.2365022897720337, 0.2532806396484375, 0.2700589895248413, 0.28683730959892273, 0.30361565947532654, 0.32039397954940796, 0.33717232942581177, 0.3539506494998932, 0.370728999376297, 0.3875073194503784, 0.4042856693267822, 0.42106401920318604, 0.43784236907958984, 0.45462068915367126, 0.4713990390300751, 0.4881773591041565, 0.5049557089805603, 0.5217340588569641, 0.5385123491287231, 0.555290699005127]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 20.0, 21.0, 37.0, 72.0, 97.0, 176.0, 373.0, 735.0, 1642.0, 3897.0, 11171.0, 42439.0, 214452.0, 542285.0, 178330.0, 36270.0, 10069.0, 3461.0, 1475.0, 715.0, 358.0, 169.0, 104.0, 62.0, 43.0, 21.0, 15.0, 13.0, 8.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3232421875, -0.3138580322265625, -0.304473876953125, -0.2950897216796875, -0.28570556640625, -0.2763214111328125, -0.266937255859375, -0.2575531005859375, -0.2481689453125, -0.2387847900390625, -0.229400634765625, -0.2200164794921875, -0.21063232421875, -0.2012481689453125, -0.191864013671875, -0.1824798583984375, -0.173095703125, -0.1637115478515625, -0.154327392578125, -0.1449432373046875, -0.13555908203125, -0.1261749267578125, -0.116790771484375, -0.1074066162109375, -0.0980224609375, -0.0886383056640625, -0.079254150390625, -0.0698699951171875, -0.06048583984375, -0.0511016845703125, -0.041717529296875, -0.0323333740234375, -0.02294921875, -0.0135650634765625, -0.004180908203125, 0.0052032470703125, 0.01458740234375, 0.0239715576171875, 0.033355712890625, 0.0427398681640625, 0.0521240234375, 0.0615081787109375, 0.070892333984375, 0.0802764892578125, 0.08966064453125, 0.0990447998046875, 0.108428955078125, 0.1178131103515625, 0.127197265625, 0.1365814208984375, 0.145965576171875, 0.1553497314453125, 0.16473388671875, 0.1741180419921875, 0.183502197265625, 0.1928863525390625, 0.2022705078125, 0.2116546630859375, 0.221038818359375, 0.2304229736328125, 0.23980712890625, 0.2491912841796875, 0.258575439453125, 0.2679595947265625, 0.27734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 13.0, 16.0, 14.0, 19.0, 14.0, 23.0, 38.0, 46.0, 30.0, 39.0, 32.0, 41.0, 49.0, 46.0, 38.0, 50.0, 37.0, 52.0, 47.0, 43.0, 41.0, 35.0, 29.0, 38.0, 21.0, 24.0, 22.0, 22.0, 13.0, 13.0, 4.0, 10.0, 11.0, 7.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4228515625, -0.4109535217285156, -0.39905548095703125, -0.3871574401855469, -0.3752593994140625, -0.3633613586425781, -0.35146331787109375, -0.3395652770996094, -0.327667236328125, -0.3157691955566406, -0.30387115478515625, -0.2919731140136719, -0.2800750732421875, -0.2681770324707031, -0.25627899169921875, -0.24438095092773438, -0.23248291015625, -0.22058486938476562, -0.20868682861328125, -0.19678878784179688, -0.1848907470703125, -0.17299270629882812, -0.16109466552734375, -0.14919662475585938, -0.137298583984375, -0.12540054321289062, -0.11350250244140625, -0.10160446166992188, -0.0897064208984375, -0.07780838012695312, -0.06591033935546875, -0.054012298583984375, -0.0421142578125, -0.030216217041015625, -0.01831817626953125, -0.006420135498046875, 0.0054779052734375, 0.017375946044921875, 0.02927398681640625, 0.041172027587890625, 0.053070068359375, 0.06496810913085938, 0.07686614990234375, 0.08876419067382812, 0.1006622314453125, 0.11256027221679688, 0.12445831298828125, 0.13635635375976562, 0.14825439453125, 0.16015243530273438, 0.17205047607421875, 0.18394851684570312, 0.1958465576171875, 0.20774459838867188, 0.21964263916015625, 0.23154067993164062, 0.243438720703125, 0.2553367614746094, 0.26723480224609375, 0.2791328430175781, 0.2910308837890625, 0.3029289245605469, 0.31482696533203125, 0.3267250061035156, 0.338623046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 8.0, 15.0, 11.0, 20.0, 37.0, 39.0, 54.0, 82.0, 104.0, 127.0, 198.0, 258.0, 443.0, 659.0, 1146.0, 1939.0, 3555.0, 6500.0, 12991.0, 26670.0, 57439.0, 121500.0, 225691.0, 263449.0, 167863.0, 82192.0, 37751.0, 18020.0, 8790.0, 4565.0, 2548.0, 1410.0, 800.0, 524.0, 306.0, 243.0, 171.0, 112.0, 70.0, 46.0, 45.0, 34.0, 19.0, 22.0, 14.0, 16.0, 12.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.126953125, -0.12301445007324219, -0.11907577514648438, -0.11513710021972656, -0.11119842529296875, -0.10725975036621094, -0.10332107543945312, -0.09938240051269531, -0.0954437255859375, -0.09150505065917969, -0.08756637573242188, -0.08362770080566406, -0.07968902587890625, -0.07575035095214844, -0.07181167602539062, -0.06787300109863281, -0.063934326171875, -0.05999565124511719, -0.056056976318359375, -0.05211830139160156, -0.04817962646484375, -0.04424095153808594, -0.040302276611328125, -0.03636360168457031, -0.0324249267578125, -0.028486251831054688, -0.024547576904296875, -0.020608901977539062, -0.01667022705078125, -0.012731552124023438, -0.008792877197265625, -0.0048542022705078125, -0.00091552734375, 0.0030231475830078125, 0.006961822509765625, 0.010900497436523438, 0.01483917236328125, 0.018777847290039062, 0.022716522216796875, 0.026655197143554688, 0.0305938720703125, 0.03453254699707031, 0.038471221923828125, 0.04240989685058594, 0.04634857177734375, 0.05028724670410156, 0.054225921630859375, 0.05816459655761719, 0.062103271484375, 0.06604194641113281, 0.06998062133789062, 0.07391929626464844, 0.07785797119140625, 0.08179664611816406, 0.08573532104492188, 0.08967399597167969, 0.0936126708984375, 0.09755134582519531, 0.10149002075195312, 0.10542869567871094, 0.10936737060546875, 0.11330604553222656, 0.11724472045898438, 0.12118339538574219, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 4.0, 8.0, 12.0, 12.0, 18.0, 18.0, 18.0, 23.0, 34.0, 33.0, 33.0, 42.0, 41.0, 47.0, 46.0, 52.0, 52.0, 50.0, 50.0, 60.0, 49.0, 37.0, 37.0, 33.0, 27.0, 25.0, 28.0, 28.0, 17.0, 20.0, 17.0, 7.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8594894409179688, -0.8337249755859375, -0.8079605102539062, -0.782196044921875, -0.7564315795898438, -0.7306671142578125, -0.7049026489257812, -0.67913818359375, -0.6533737182617188, -0.6276092529296875, -0.6018447875976562, -0.576080322265625, -0.5503158569335938, -0.5245513916015625, -0.49878692626953125, -0.4730224609375, -0.44725799560546875, -0.4214935302734375, -0.39572906494140625, -0.369964599609375, -0.34420013427734375, -0.3184356689453125, -0.29267120361328125, -0.26690673828125, -0.24114227294921875, -0.2153778076171875, -0.18961334228515625, -0.163848876953125, -0.13808441162109375, -0.1123199462890625, -0.08655548095703125, -0.060791015625, -0.03502655029296875, -0.0092620849609375, 0.01650238037109375, 0.042266845703125, 0.06803131103515625, 0.0937957763671875, 0.11956024169921875, 0.14532470703125, 0.17108917236328125, 0.1968536376953125, 0.22261810302734375, 0.248382568359375, 0.27414703369140625, 0.2999114990234375, 0.32567596435546875, 0.3514404296875, 0.37720489501953125, 0.4029693603515625, 0.42873382568359375, 0.454498291015625, 0.48026275634765625, 0.5060272216796875, 0.5317916870117188, 0.55755615234375, 0.5833206176757812, 0.6090850830078125, 0.6348495483398438, 0.660614013671875, 0.6863784790039062, 0.7121429443359375, 0.7379074096679688, 0.763671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 10.0, 6.0, 6.0, 9.0, 18.0, 22.0, 49.0, 64.0, 100.0, 158.0, 232.0, 464.0, 773.0, 1458.0, 2794.0, 6185.0, 15956.0, 52279.0, 251472.0, 527223.0, 135476.0, 32943.0, 11193.0, 4710.0, 2247.0, 1118.0, 625.0, 366.0, 202.0, 124.0, 80.0, 65.0, 43.0, 28.0, 15.0, 11.0, 9.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09442138671875, -0.09130668640136719, -0.08819198608398438, -0.08507728576660156, -0.08196258544921875, -0.07884788513183594, -0.07573318481445312, -0.07261848449707031, -0.0695037841796875, -0.06638908386230469, -0.06327438354492188, -0.06015968322753906, -0.05704498291015625, -0.05393028259277344, -0.050815582275390625, -0.04770088195800781, -0.044586181640625, -0.04147148132324219, -0.038356781005859375, -0.03524208068847656, -0.03212738037109375, -0.029012680053710938, -0.025897979736328125, -0.022783279418945312, -0.0196685791015625, -0.016553878784179688, -0.013439178466796875, -0.010324478149414062, -0.00720977783203125, -0.0040950775146484375, -0.000980377197265625, 0.0021343231201171875, 0.0052490234375, 0.008363723754882812, 0.011478424072265625, 0.014593124389648438, 0.01770782470703125, 0.020822525024414062, 0.023937225341796875, 0.027051925659179688, 0.0301666259765625, 0.03328132629394531, 0.036396026611328125, 0.03951072692871094, 0.04262542724609375, 0.04574012756347656, 0.048854827880859375, 0.05196952819824219, 0.055084228515625, 0.05819892883300781, 0.061313629150390625, 0.06442832946777344, 0.06754302978515625, 0.07065773010253906, 0.07377243041992188, 0.07688713073730469, 0.0800018310546875, 0.08311653137207031, 0.08623123168945312, 0.08934593200683594, 0.09246063232421875, 0.09557533264160156, 0.09869003295898438, 0.10180473327636719, 0.10491943359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 8.0, 7.0, 2.0, 6.0, 10.0, 15.0, 17.0, 26.0, 32.0, 36.0, 52.0, 76.0, 88.0, 101.0, 116.0, 88.0, 66.0, 71.0, 33.0, 36.0, 29.0, 25.0, 17.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.9070844650268555e-05, -3.784894943237305e-05, -3.662705421447754e-05, -3.540515899658203e-05, -3.4183263778686523e-05, -3.2961368560791016e-05, -3.173947334289551e-05, -3.0517578125e-05, -2.9295682907104492e-05, -2.8073787689208984e-05, -2.6851892471313477e-05, -2.562999725341797e-05, -2.440810203552246e-05, -2.3186206817626953e-05, -2.1964311599731445e-05, -2.0742416381835938e-05, -1.952052116394043e-05, -1.8298625946044922e-05, -1.7076730728149414e-05, -1.5854835510253906e-05, -1.4632940292358398e-05, -1.341104507446289e-05, -1.2189149856567383e-05, -1.0967254638671875e-05, -9.745359420776367e-06, -8.52346420288086e-06, -7.3015689849853516e-06, -6.079673767089844e-06, -4.857778549194336e-06, -3.635883331298828e-06, -2.4139881134033203e-06, -1.1920928955078125e-06, 2.9802322387695312e-08, 1.2516975402832031e-06, 2.473592758178711e-06, 3.6954879760742188e-06, 4.9173831939697266e-06, 6.139278411865234e-06, 7.361173629760742e-06, 8.58306884765625e-06, 9.804964065551758e-06, 1.1026859283447266e-05, 1.2248754501342773e-05, 1.3470649719238281e-05, 1.4692544937133789e-05, 1.5914440155029297e-05, 1.7136335372924805e-05, 1.8358230590820312e-05, 1.958012580871582e-05, 2.0802021026611328e-05, 2.2023916244506836e-05, 2.3245811462402344e-05, 2.446770668029785e-05, 2.568960189819336e-05, 2.6911497116088867e-05, 2.8133392333984375e-05, 2.9355287551879883e-05, 3.057718276977539e-05, 3.17990779876709e-05, 3.3020973205566406e-05, 3.4242868423461914e-05, 3.546476364135742e-05, 3.668665885925293e-05, 3.790855407714844e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 8.0, 15.0, 24.0, 16.0, 31.0, 27.0, 61.0, 71.0, 125.0, 205.0, 367.0, 831.0, 1722.0, 3892.0, 10159.0, 32736.0, 142787.0, 540271.0, 241091.0, 49782.0, 14516.0, 5313.0, 2228.0, 1051.0, 496.0, 261.0, 119.0, 102.0, 65.0, 27.0, 27.0, 23.0, 16.0, 14.0, 11.0, 6.0, 12.0, 7.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1136474609375, -0.1101675033569336, -0.10668754577636719, -0.10320758819580078, -0.09972763061523438, -0.09624767303466797, -0.09276771545410156, -0.08928775787353516, -0.08580780029296875, -0.08232784271240234, -0.07884788513183594, -0.07536792755126953, -0.07188796997070312, -0.06840801239013672, -0.06492805480957031, -0.061448097229003906, -0.0579681396484375, -0.054488182067871094, -0.05100822448730469, -0.04752826690673828, -0.044048309326171875, -0.04056835174560547, -0.03708839416503906, -0.033608436584472656, -0.03012847900390625, -0.026648521423339844, -0.023168563842773438, -0.01968860626220703, -0.016208648681640625, -0.012728691101074219, -0.009248733520507812, -0.005768775939941406, -0.002288818359375, 0.0011911392211914062, 0.0046710968017578125, 0.008151054382324219, 0.011631011962890625, 0.015110969543457031, 0.018590927124023438, 0.022070884704589844, 0.02555084228515625, 0.029030799865722656, 0.03251075744628906, 0.03599071502685547, 0.039470672607421875, 0.04295063018798828, 0.04643058776855469, 0.049910545349121094, 0.0533905029296875, 0.056870460510253906, 0.06035041809082031, 0.06383037567138672, 0.06731033325195312, 0.07079029083251953, 0.07427024841308594, 0.07775020599365234, 0.08123016357421875, 0.08471012115478516, 0.08819007873535156, 0.09167003631591797, 0.09514999389648438, 0.09862995147705078, 0.10210990905761719, 0.1055898666381836, 0.10906982421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 10.0, 18.0, 24.0, 24.0, 44.0, 52.0, 60.0, 89.0, 90.0, 103.0, 109.0, 88.0, 69.0, 56.0, 33.0, 26.0, 19.0, 7.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02734375, -0.026418685913085938, -0.025493621826171875, -0.024568557739257812, -0.02364349365234375, -0.022718429565429688, -0.021793365478515625, -0.020868301391601562, -0.0199432373046875, -0.019018173217773438, -0.018093109130859375, -0.017168045043945312, -0.01624298095703125, -0.015317916870117188, -0.014392852783203125, -0.013467788696289062, -0.012542724609375, -0.011617660522460938, -0.010692596435546875, -0.009767532348632812, -0.00884246826171875, -0.007917404174804688, -0.006992340087890625, -0.0060672760009765625, -0.0051422119140625, -0.0042171478271484375, -0.003292083740234375, -0.0023670196533203125, -0.00144195556640625, -0.0005168914794921875, 0.000408172607421875, 0.0013332366943359375, 0.00225830078125, 0.0031833648681640625, 0.004108428955078125, 0.0050334930419921875, 0.00595855712890625, 0.0068836212158203125, 0.007808685302734375, 0.008733749389648438, 0.0096588134765625, 0.010583877563476562, 0.011508941650390625, 0.012434005737304688, 0.01335906982421875, 0.014284133911132812, 0.015209197998046875, 0.016134262084960938, 0.017059326171875, 0.017984390258789062, 0.018909454345703125, 0.019834518432617188, 0.02075958251953125, 0.021684646606445312, 0.022609710693359375, 0.023534774780273438, 0.0244598388671875, 0.025384902954101562, 0.026309967041015625, 0.027235031127929688, 0.02816009521484375, 0.029085159301757812, 0.030010223388671875, 0.030935287475585938, 0.0318603515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 8.0, 7.0, 7.0, 11.0, 11.0, 19.0, 30.0, 51.0, 62.0, 101.0, 107.0, 121.0, 100.0, 99.0, 86.0, 68.0, 32.0, 28.0, 25.0, 9.0, 5.0, 2.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.640224277973175, -0.6162078976631165, -0.5921915173530579, -0.5681751370429993, -0.5441587567329407, -0.5201423764228821, -0.4961259663105011, -0.4721095860004425, -0.4480932056903839, -0.4240768253803253, -0.4000604450702667, -0.37604403495788574, -0.35202765464782715, -0.32801127433776855, -0.30399489402770996, -0.27997851371765137, -0.2559621334075928, -0.23194575309753418, -0.20792937278747559, -0.1839129775762558, -0.1598965972661972, -0.1358802169561386, -0.11186382174491882, -0.08784744143486023, -0.06383106112480164, -0.039814677089452744, -0.01579829305410385, 0.00821809470653534, 0.03223447501659393, 0.05625085532665253, 0.08026725053787231, 0.10428363084793091, 0.1283000111579895, 0.1523163914680481, 0.1763327717781067, 0.20034916698932648, 0.22436554729938507, 0.24838192760944366, 0.27239832282066345, 0.29641470313072205, 0.32043108344078064, 0.34444746375083923, 0.3684638440608978, 0.3924802541732788, 0.4164966344833374, 0.440513014793396, 0.4645293951034546, 0.4885457754135132, 0.5125621557235718, 0.5365785360336304, 0.560594916343689, 0.5846112966537476, 0.6086276769638062, 0.6326440572738647, 0.6566604375839233, 0.6806768178939819, 0.7046931982040405, 0.7287095785140991, 0.7527259588241577, 0.7767423391342163, 0.8007587194442749, 0.8247750997543335, 0.8487914800643921, 0.8728078603744507, 0.896824300289154]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 9.0, 8.0, 4.0, 15.0, 11.0, 24.0, 15.0, 26.0, 30.0, 31.0, 29.0, 41.0, 33.0, 48.0, 38.0, 37.0, 47.0, 45.0, 38.0, 35.0, 38.0, 40.0, 46.0, 50.0, 40.0, 38.0, 21.0, 20.0, 25.0, 12.0, 23.0, 14.0, 11.0, 11.0, 11.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.3793233633041382, -0.36853253841400146, -0.35774171352386475, -0.346950888633728, -0.3361600637435913, -0.3253692388534546, -0.31457841396331787, -0.30378758907318115, -0.29299676418304443, -0.2822059392929077, -0.271415114402771, -0.2606242895126343, -0.24983346462249756, -0.23904263973236084, -0.22825182974338531, -0.2174610048532486, -0.20667019486427307, -0.19587936997413635, -0.18508854508399963, -0.17429772019386292, -0.1635068953037262, -0.15271607041358948, -0.14192526042461395, -0.13113443553447723, -0.12034361064434052, -0.1095527857542038, -0.09876196086406708, -0.08797114342451096, -0.07718031853437424, -0.06638949364423752, -0.055598676204681396, -0.04480785131454468, -0.03401699662208557, -0.023226173594594002, -0.012435350567102432, -0.001644529402256012, 0.009146295487880707, 0.019937120378017426, 0.030727937817573547, 0.041518762707710266, 0.052309587597846985, 0.0631004124879837, 0.07389123737812042, 0.08468205481767654, 0.09547287970781326, 0.10626370459794998, 0.1170545220375061, 0.12784534692764282, 0.13863617181777954, 0.14942699670791626, 0.16021782159805298, 0.1710086464881897, 0.18179947137832642, 0.19259029626846313, 0.20338110625743866, 0.21417193114757538, 0.2249627560377121, 0.23575358092784882, 0.24654440581798553, 0.25733521580696106, 0.2681260406970978, 0.2789168655872345, 0.2897076904773712, 0.30049851536750793, 0.31128934025764465]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 11.0, 13.0, 17.0, 31.0, 44.0, 89.0, 148.0, 291.0, 543.0, 1118.0, 2534.0, 6316.0, 18711.0, 74946.0, 360513.0, 443783.0, 102408.0, 23876.0, 7557.0, 2940.0, 1283.0, 648.0, 298.0, 148.0, 92.0, 57.0, 36.0, 30.0, 17.0, 8.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.64697265625, -0.6299896240234375, -0.613006591796875, -0.5960235595703125, -0.57904052734375, -0.5620574951171875, -0.545074462890625, -0.5280914306640625, -0.5111083984375, -0.4941253662109375, -0.477142333984375, -0.4601593017578125, -0.44317626953125, -0.4261932373046875, -0.409210205078125, -0.3922271728515625, -0.375244140625, -0.3582611083984375, -0.341278076171875, -0.3242950439453125, -0.30731201171875, -0.2903289794921875, -0.273345947265625, -0.2563629150390625, -0.2393798828125, -0.2223968505859375, -0.205413818359375, -0.1884307861328125, -0.17144775390625, -0.1544647216796875, -0.137481689453125, -0.1204986572265625, -0.103515625, -0.0865325927734375, -0.069549560546875, -0.0525665283203125, -0.03558349609375, -0.0186004638671875, -0.001617431640625, 0.0153656005859375, 0.0323486328125, 0.0493316650390625, 0.066314697265625, 0.0832977294921875, 0.10028076171875, 0.1172637939453125, 0.134246826171875, 0.1512298583984375, 0.168212890625, 0.1851959228515625, 0.202178955078125, 0.2191619873046875, 0.23614501953125, 0.2531280517578125, 0.270111083984375, 0.2870941162109375, 0.3040771484375, 0.3210601806640625, 0.338043212890625, 0.3550262451171875, 0.37200927734375, 0.3889923095703125, 0.405975341796875, 0.4229583740234375, 0.43994140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 14.0, 14.0, 24.0, 25.0, 28.0, 31.0, 36.0, 40.0, 44.0, 49.0, 38.0, 46.0, 44.0, 58.0, 45.0, 54.0, 53.0, 44.0, 50.0, 42.0, 38.0, 42.0, 14.0, 18.0, 18.0, 15.0, 9.0, 5.0, 12.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.98828125, -0.9619369506835938, -0.9355926513671875, -0.9092483520507812, -0.882904052734375, -0.8565597534179688, -0.8302154541015625, -0.8038711547851562, -0.77752685546875, -0.7511825561523438, -0.7248382568359375, -0.6984939575195312, -0.672149658203125, -0.6458053588867188, -0.6194610595703125, -0.5931167602539062, -0.5667724609375, -0.5404281616210938, -0.5140838623046875, -0.48773956298828125, -0.461395263671875, -0.43505096435546875, -0.4087066650390625, -0.38236236572265625, -0.35601806640625, -0.32967376708984375, -0.3033294677734375, -0.27698516845703125, -0.250640869140625, -0.22429656982421875, -0.1979522705078125, -0.17160797119140625, -0.145263671875, -0.11891937255859375, -0.0925750732421875, -0.06623077392578125, -0.039886474609375, -0.01354217529296875, 0.0128021240234375, 0.03914642333984375, 0.06549072265625, 0.09183502197265625, 0.1181793212890625, 0.14452362060546875, 0.170867919921875, 0.19721221923828125, 0.2235565185546875, 0.24990081787109375, 0.2762451171875, 0.30258941650390625, 0.3289337158203125, 0.35527801513671875, 0.381622314453125, 0.40796661376953125, 0.4343109130859375, 0.46065521240234375, 0.48699951171875, 0.5133438110351562, 0.5396881103515625, 0.5660324096679688, 0.592376708984375, 0.6187210083007812, 0.6450653076171875, 0.6714096069335938, 0.69775390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 8.0, 13.0, 21.0, 22.0, 16.0, 20.0, 42.0, 39.0, 48.0, 72.0, 102.0, 175.0, 412.0, 2527.0, 436067.0, 604778.0, 3116.0, 393.0, 195.0, 117.0, 67.0, 42.0, 34.0, 27.0, 26.0, 26.0, 18.0, 15.0, 18.0, 15.0, 8.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7832489013671875, -1.712005615234375, -1.6407623291015625, -1.56951904296875, -1.4982757568359375, -1.427032470703125, -1.3557891845703125, -1.2845458984375, -1.2133026123046875, -1.142059326171875, -1.0708160400390625, -0.99957275390625, -0.9283294677734375, -0.857086181640625, -0.7858428955078125, -0.714599609375, -0.6433563232421875, -0.572113037109375, -0.5008697509765625, -0.42962646484375, -0.3583831787109375, -0.287139892578125, -0.2158966064453125, -0.1446533203125, -0.0734100341796875, -0.002166748046875, 0.0690765380859375, 0.14031982421875, 0.2115631103515625, 0.282806396484375, 0.3540496826171875, 0.42529296875, 0.4965362548828125, 0.567779541015625, 0.6390228271484375, 0.71026611328125, 0.7815093994140625, 0.852752685546875, 0.9239959716796875, 0.9952392578125, 1.0664825439453125, 1.137725830078125, 1.2089691162109375, 1.28021240234375, 1.3514556884765625, 1.422698974609375, 1.4939422607421875, 1.565185546875, 1.6364288330078125, 1.707672119140625, 1.7789154052734375, 1.85015869140625, 1.9214019775390625, 1.992645263671875, 2.0638885498046875, 2.1351318359375, 2.2063751220703125, 2.277618408203125, 2.3488616943359375, 2.42010498046875, 2.4913482666015625, 2.562591552734375, 2.6338348388671875, 2.705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 4.0, 9.0, 6.0, 10.0, 13.0, 14.0, 12.0, 21.0, 22.0, 19.0, 25.0, 36.0, 28.0, 35.0, 33.0, 34.0, 37.0, 43.0, 38.0, 36.0, 45.0, 42.0, 56.0, 49.0, 41.0, 33.0, 29.0, 29.0, 30.0, 27.0, 23.0, 22.0, 19.0, 8.0, 17.0, 11.0, 10.0, 8.0, 4.0, 5.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5878219604492188, -0.5652923583984375, -0.5427627563476562, -0.520233154296875, -0.49770355224609375, -0.4751739501953125, -0.45264434814453125, -0.43011474609375, -0.40758514404296875, -0.3850555419921875, -0.36252593994140625, -0.339996337890625, -0.31746673583984375, -0.2949371337890625, -0.27240753173828125, -0.2498779296875, -0.22734832763671875, -0.2048187255859375, -0.18228912353515625, -0.159759521484375, -0.13722991943359375, -0.1147003173828125, -0.09217071533203125, -0.06964111328125, -0.04711151123046875, -0.0245819091796875, -0.00205230712890625, 0.020477294921875, 0.04300689697265625, 0.0655364990234375, 0.08806610107421875, 0.110595703125, 0.13312530517578125, 0.1556549072265625, 0.17818450927734375, 0.200714111328125, 0.22324371337890625, 0.2457733154296875, 0.26830291748046875, 0.29083251953125, 0.31336212158203125, 0.3358917236328125, 0.35842132568359375, 0.380950927734375, 0.40348052978515625, 0.4260101318359375, 0.44853973388671875, 0.4710693359375, 0.49359893798828125, 0.5161285400390625, 0.5386581420898438, 0.561187744140625, 0.5837173461914062, 0.6062469482421875, 0.6287765502929688, 0.65130615234375, 0.6738357543945312, 0.6963653564453125, 0.7188949584960938, 0.741424560546875, 0.7639541625976562, 0.7864837646484375, 0.8090133666992188, 0.83154296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 14.0, 16.0, 18.0, 20.0, 48.0, 64.0, 115.0, 185.0, 363.0, 978.0, 3424.0, 20922.0, 227741.0, 688270.0, 92504.0, 10286.0, 2137.0, 659.0, 304.0, 157.0, 98.0, 59.0, 51.0, 29.0, 23.0, 13.0, 8.0, 3.0, 0.0, 6.0, 4.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.23551177978515625, -0.2282257080078125, -0.22093963623046875, -0.213653564453125, -0.20636749267578125, -0.1990814208984375, -0.19179534912109375, -0.18450927734375, -0.17722320556640625, -0.1699371337890625, -0.16265106201171875, -0.155364990234375, -0.14807891845703125, -0.1407928466796875, -0.13350677490234375, -0.126220703125, -0.11893463134765625, -0.1116485595703125, -0.10436248779296875, -0.097076416015625, -0.08979034423828125, -0.0825042724609375, -0.07521820068359375, -0.06793212890625, -0.06064605712890625, -0.0533599853515625, -0.04607391357421875, -0.038787841796875, -0.03150177001953125, -0.0242156982421875, -0.01692962646484375, -0.0096435546875, -0.00235748291015625, 0.0049285888671875, 0.01221466064453125, 0.019500732421875, 0.02678680419921875, 0.0340728759765625, 0.04135894775390625, 0.04864501953125, 0.05593109130859375, 0.0632171630859375, 0.07050323486328125, 0.077789306640625, 0.08507537841796875, 0.0923614501953125, 0.09964752197265625, 0.10693359375, 0.11421966552734375, 0.1215057373046875, 0.12879180908203125, 0.136077880859375, 0.14336395263671875, 0.1506500244140625, 0.15793609619140625, 0.16522216796875, 0.17250823974609375, 0.1797943115234375, 0.18708038330078125, 0.194366455078125, 0.20165252685546875, 0.2089385986328125, 0.21622467041015625, 0.2235107421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 6.0, 11.0, 11.0, 18.0, 23.0, 28.0, 33.0, 41.0, 66.0, 68.0, 85.0, 73.0, 87.0, 85.0, 55.0, 59.0, 50.0, 39.0, 32.0, 21.0, 18.0, 22.0, 13.0, 11.0, 8.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0384788513183594e-05, -1.9783154129981995e-05, -1.9181519746780396e-05, -1.8579885363578796e-05, -1.7978250980377197e-05, -1.7376616597175598e-05, -1.6774982213974e-05, -1.61733478307724e-05, -1.55717134475708e-05, -1.4970079064369202e-05, -1.4368444681167603e-05, -1.3766810297966003e-05, -1.3165175914764404e-05, -1.2563541531562805e-05, -1.1961907148361206e-05, -1.1360272765159607e-05, -1.0758638381958008e-05, -1.0157003998756409e-05, -9.55536961555481e-06, -8.95373523235321e-06, -8.352100849151611e-06, -7.750466465950012e-06, -7.148832082748413e-06, -6.547197699546814e-06, -5.945563316345215e-06, -5.343928933143616e-06, -4.742294549942017e-06, -4.1406601667404175e-06, -3.5390257835388184e-06, -2.9373914003372192e-06, -2.33575701713562e-06, -1.734122633934021e-06, -1.1324882507324219e-06, -5.308538675308228e-07, 7.078051567077637e-08, 6.724148988723755e-07, 1.2740492820739746e-06, 1.8756836652755737e-06, 2.477318048477173e-06, 3.078952431678772e-06, 3.680586814880371e-06, 4.28222119808197e-06, 4.883855581283569e-06, 5.4854899644851685e-06, 6.087124347686768e-06, 6.688758730888367e-06, 7.290393114089966e-06, 7.892027497291565e-06, 8.493661880493164e-06, 9.095296263694763e-06, 9.696930646896362e-06, 1.0298565030097961e-05, 1.090019941329956e-05, 1.150183379650116e-05, 1.2103468179702759e-05, 1.2705102562904358e-05, 1.3306736946105957e-05, 1.3908371329307556e-05, 1.4510005712509155e-05, 1.5111640095710754e-05, 1.5713274478912354e-05, 1.6314908862113953e-05, 1.6916543245315552e-05, 1.751817762851715e-05, 1.811981201171875e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 8.0, 17.0, 17.0, 28.0, 39.0, 90.0, 121.0, 244.0, 507.0, 1457.0, 5766.0, 38865.0, 432503.0, 510913.0, 48250.0, 6854.0, 1678.0, 608.0, 244.0, 135.0, 68.0, 39.0, 34.0, 19.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24290847778320312, -0.23532867431640625, -0.22774887084960938, -0.2201690673828125, -0.21258926391601562, -0.20500946044921875, -0.19742965698242188, -0.189849853515625, -0.18227005004882812, -0.17469024658203125, -0.16711044311523438, -0.1595306396484375, -0.15195083618164062, -0.14437103271484375, -0.13679122924804688, -0.12921142578125, -0.12163162231445312, -0.11405181884765625, -0.10647201538085938, -0.0988922119140625, -0.09131240844726562, -0.08373260498046875, -0.07615280151367188, -0.068572998046875, -0.060993194580078125, -0.05341339111328125, -0.045833587646484375, -0.0382537841796875, -0.030673980712890625, -0.02309417724609375, -0.015514373779296875, -0.0079345703125, -0.000354766845703125, 0.00722503662109375, 0.014804840087890625, 0.0223846435546875, 0.029964447021484375, 0.03754425048828125, 0.045124053955078125, 0.052703857421875, 0.060283660888671875, 0.06786346435546875, 0.07544326782226562, 0.0830230712890625, 0.09060287475585938, 0.09818267822265625, 0.10576248168945312, 0.11334228515625, 0.12092208862304688, 0.12850189208984375, 0.13608169555664062, 0.1436614990234375, 0.15124130249023438, 0.15882110595703125, 0.16640090942382812, 0.173980712890625, 0.18156051635742188, 0.18914031982421875, 0.19672012329101562, 0.2042999267578125, 0.21187973022460938, 0.21945953369140625, 0.22703933715820312, 0.234619140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 9.0, 11.0, 16.0, 15.0, 31.0, 32.0, 60.0, 69.0, 96.0, 95.0, 103.0, 94.0, 90.0, 74.0, 41.0, 41.0, 23.0, 23.0, 19.0, 14.0, 7.0, 5.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.095947265625, -0.09324359893798828, -0.09053993225097656, -0.08783626556396484, -0.08513259887695312, -0.0824289321899414, -0.07972526550292969, -0.07702159881591797, -0.07431793212890625, -0.07161426544189453, -0.06891059875488281, -0.0662069320678711, -0.06350326538085938, -0.060799598693847656, -0.05809593200683594, -0.05539226531982422, -0.0526885986328125, -0.04998493194580078, -0.04728126525878906, -0.044577598571777344, -0.041873931884765625, -0.039170265197753906, -0.03646659851074219, -0.03376293182373047, -0.03105926513671875, -0.02835559844970703, -0.025651931762695312, -0.022948265075683594, -0.020244598388671875, -0.017540931701660156, -0.014837265014648438, -0.012133598327636719, -0.009429931640625, -0.006726264953613281, -0.0040225982666015625, -0.0013189315795898438, 0.001384735107421875, 0.004088401794433594, 0.0067920684814453125, 0.009495735168457031, 0.01219940185546875, 0.014903068542480469, 0.017606735229492188, 0.020310401916503906, 0.023014068603515625, 0.025717735290527344, 0.028421401977539062, 0.03112506866455078, 0.0338287353515625, 0.03653240203857422, 0.03923606872558594, 0.041939735412597656, 0.044643402099609375, 0.047347068786621094, 0.05005073547363281, 0.05275440216064453, 0.05545806884765625, 0.05816173553466797, 0.06086540222167969, 0.0635690689086914, 0.06627273559570312, 0.06897640228271484, 0.07168006896972656, 0.07438373565673828, 0.07708740234375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 9.0, 12.0, 21.0, 39.0, 59.0, 97.0, 124.0, 155.0, 136.0, 119.0, 86.0, 56.0, 33.0, 20.0, 10.0, 6.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.120443820953369, -2.0594565868377686, -1.998469352722168, -1.9374819993972778, -1.8764947652816772, -1.8155075311660767, -1.7545201778411865, -1.693532943725586, -1.6325457096099854, -1.5715584754943848, -1.5105712413787842, -1.449583888053894, -1.3885966539382935, -1.3276094198226929, -1.2666220664978027, -1.2056348323822021, -1.1446475982666016, -1.083660364151001, -1.0226731300354004, -0.9616857767105103, -0.9006985425949097, -0.8397113084793091, -0.7787240147590637, -0.7177367210388184, -0.6567494869232178, -0.5957622528076172, -0.5347749590873718, -0.47378769516944885, -0.4128004312515259, -0.3518131673336029, -0.29082590341567993, -0.22983863949775696, -0.16885149478912354, -0.10786423087120056, -0.04687696695327759, 0.014110296964645386, 0.07509756088256836, 0.13608482480049133, 0.1970720887184143, 0.2580593526363373, 0.31904661655426025, 0.3800338804721832, 0.4410211443901062, 0.5020084381103516, 0.5629956722259521, 0.6239829063415527, 0.6849702000617981, 0.7459574937820435, 0.806944727897644, 0.8679319620132446, 0.92891925573349, 0.9899065494537354, 1.050893783569336, 1.1118810176849365, 1.172868251800537, 1.2338556051254272, 1.2948428392410278, 1.3558300733566284, 1.4168174266815186, 1.4778046607971191, 1.5387918949127197, 1.5997791290283203, 1.660766363143921, 1.721753716468811, 1.7827409505844116]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 10.0, 14.0, 15.0, 19.0, 18.0, 20.0, 24.0, 26.0, 33.0, 29.0, 22.0, 43.0, 41.0, 34.0, 38.0, 34.0, 43.0, 40.0, 45.0, 38.0, 33.0, 34.0, 38.0, 34.0, 33.0, 23.0, 30.0, 22.0, 21.0, 19.0, 16.0, 16.0, 8.0, 10.0, 8.0, 5.0, 8.0, 7.0, 9.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0975044965744019, -1.0619765520095825, -1.0264486074447632, -0.9909206628799438, -0.9553927183151245, -0.9198647737503052, -0.8843368291854858, -0.8488088846206665, -0.8132809400558472, -0.7777529954910278, -0.7422250509262085, -0.7066971063613892, -0.6711691617965698, -0.6356412172317505, -0.6001132726669312, -0.5645853281021118, -0.5290573835372925, -0.49352943897247314, -0.4580014944076538, -0.4224735498428345, -0.38694560527801514, -0.3514176607131958, -0.31588971614837646, -0.28036177158355713, -0.2448338270187378, -0.20930588245391846, -0.17377793788909912, -0.13824999332427979, -0.10272204875946045, -0.06719410419464111, -0.03166615962982178, 0.0038617849349975586, 0.039389848709106445, 0.07491779327392578, 0.11044573783874512, 0.14597368240356445, 0.1815016269683838, 0.21702957153320312, 0.25255751609802246, 0.2880854606628418, 0.32361340522766113, 0.35914134979248047, 0.3946692943572998, 0.43019723892211914, 0.4657251834869385, 0.5012531280517578, 0.5367810726165771, 0.5723090171813965, 0.6078369617462158, 0.6433649063110352, 0.6788928508758545, 0.7144207954406738, 0.7499487400054932, 0.7854766845703125, 0.8210046291351318, 0.8565325736999512, 0.8920605182647705, 0.9275884628295898, 0.9631164073944092, 0.9986443519592285, 1.0341722965240479, 1.0697002410888672, 1.1052281856536865, 1.1407561302185059, 1.1762840747833252]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 9.0, 11.0, 10.0, 21.0, 20.0, 36.0, 38.0, 47.0, 82.0, 111.0, 169.0, 333.0, 658.0, 1611.0, 4309.0, 15341.0, 79019.0, 492022.0, 1958639.0, 1346955.0, 240984.0, 39026.0, 9359.0, 3025.0, 1161.0, 523.0, 281.0, 144.0, 93.0, 59.0, 38.0, 29.0, 17.0, 15.0, 12.0, 17.0, 9.0, 10.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7798614501953125, -0.754547119140625, -0.7292327880859375, -0.70391845703125, -0.6786041259765625, -0.653289794921875, -0.6279754638671875, -0.6026611328125, -0.5773468017578125, -0.552032470703125, -0.5267181396484375, -0.50140380859375, -0.4760894775390625, -0.450775146484375, -0.4254608154296875, -0.400146484375, -0.3748321533203125, -0.349517822265625, -0.3242034912109375, -0.29888916015625, -0.2735748291015625, -0.248260498046875, -0.2229461669921875, -0.1976318359375, -0.1723175048828125, -0.147003173828125, -0.1216888427734375, -0.09637451171875, -0.0710601806640625, -0.045745849609375, -0.0204315185546875, 0.0048828125, 0.0301971435546875, 0.055511474609375, 0.0808258056640625, 0.10614013671875, 0.1314544677734375, 0.156768798828125, 0.1820831298828125, 0.2073974609375, 0.2327117919921875, 0.258026123046875, 0.2833404541015625, 0.30865478515625, 0.3339691162109375, 0.359283447265625, 0.3845977783203125, 0.409912109375, 0.4352264404296875, 0.460540771484375, 0.4858551025390625, 0.51116943359375, 0.5364837646484375, 0.561798095703125, 0.5871124267578125, 0.6124267578125, 0.6377410888671875, 0.663055419921875, 0.6883697509765625, 0.71368408203125, 0.7389984130859375, 0.764312744140625, 0.7896270751953125, 0.81494140625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 5.0, 16.0, 11.0, 15.0, 15.0, 20.0, 19.0, 35.0, 31.0, 40.0, 46.0, 36.0, 44.0, 54.0, 36.0, 35.0, 40.0, 52.0, 42.0, 53.0, 46.0, 39.0, 29.0, 37.0, 21.0, 28.0, 20.0, 23.0, 14.0, 12.0, 10.0, 12.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.60986328125, -0.5925750732421875, -0.575286865234375, -0.5579986572265625, -0.54071044921875, -0.5234222412109375, -0.506134033203125, -0.4888458251953125, -0.4715576171875, -0.4542694091796875, -0.436981201171875, -0.4196929931640625, -0.40240478515625, -0.3851165771484375, -0.367828369140625, -0.3505401611328125, -0.333251953125, -0.3159637451171875, -0.298675537109375, -0.2813873291015625, -0.26409912109375, -0.2468109130859375, -0.229522705078125, -0.2122344970703125, -0.1949462890625, -0.1776580810546875, -0.160369873046875, -0.1430816650390625, -0.12579345703125, -0.1085052490234375, -0.091217041015625, -0.0739288330078125, -0.056640625, -0.0393524169921875, -0.022064208984375, -0.0047760009765625, 0.01251220703125, 0.0298004150390625, 0.047088623046875, 0.0643768310546875, 0.0816650390625, 0.0989532470703125, 0.116241455078125, 0.1335296630859375, 0.15081787109375, 0.1681060791015625, 0.185394287109375, 0.2026824951171875, 0.219970703125, 0.2372589111328125, 0.254547119140625, 0.2718353271484375, 0.28912353515625, 0.3064117431640625, 0.323699951171875, 0.3409881591796875, 0.3582763671875, 0.3755645751953125, 0.392852783203125, 0.4101409912109375, 0.42742919921875, 0.4447174072265625, 0.462005615234375, 0.4792938232421875, 0.49658203125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 13.0, 6.0, 8.0, 16.0, 14.0, 23.0, 24.0, 35.0, 61.0, 89.0, 139.0, 296.0, 802.0, 5189.0, 243191.0, 3897024.0, 43932.0, 2277.0, 510.0, 219.0, 114.0, 77.0, 66.0, 38.0, 28.0, 21.0, 7.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.7950286865234375, -1.731658935546875, -1.6682891845703125, -1.60491943359375, -1.5415496826171875, -1.478179931640625, -1.4148101806640625, -1.3514404296875, -1.2880706787109375, -1.224700927734375, -1.1613311767578125, -1.09796142578125, -1.0345916748046875, -0.971221923828125, -0.9078521728515625, -0.844482421875, -0.7811126708984375, -0.717742919921875, -0.6543731689453125, -0.59100341796875, -0.5276336669921875, -0.464263916015625, -0.4008941650390625, -0.3375244140625, -0.2741546630859375, -0.210784912109375, -0.1474151611328125, -0.08404541015625, -0.0206756591796875, 0.042694091796875, 0.1060638427734375, 0.16943359375, 0.2328033447265625, 0.296173095703125, 0.3595428466796875, 0.42291259765625, 0.4862823486328125, 0.549652099609375, 0.6130218505859375, 0.6763916015625, 0.7397613525390625, 0.803131103515625, 0.8665008544921875, 0.92987060546875, 0.9932403564453125, 1.056610107421875, 1.1199798583984375, 1.183349609375, 1.2467193603515625, 1.310089111328125, 1.3734588623046875, 1.43682861328125, 1.5001983642578125, 1.563568115234375, 1.6269378662109375, 1.6903076171875, 1.7536773681640625, 1.817047119140625, 1.8804168701171875, 1.94378662109375, 2.0071563720703125, 2.070526123046875, 2.1338958740234375, 2.197265625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 13.0, 17.0, 19.0, 23.0, 35.0, 45.0, 45.0, 73.0, 122.0, 154.0, 226.0, 297.0, 428.0, 535.0, 510.0, 404.0, 321.0, 234.0, 165.0, 112.0, 91.0, 56.0, 35.0, 23.0, 26.0, 17.0, 7.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.17945289611816406, -0.17226028442382812, -0.1650676727294922, -0.15787506103515625, -0.1506824493408203, -0.14348983764648438, -0.13629722595214844, -0.1291046142578125, -0.12191200256347656, -0.11471939086914062, -0.10752677917480469, -0.10033416748046875, -0.09314155578613281, -0.08594894409179688, -0.07875633239746094, -0.071563720703125, -0.06437110900878906, -0.057178497314453125, -0.04998588562011719, -0.04279327392578125, -0.03560066223144531, -0.028408050537109375, -0.021215438842773438, -0.0140228271484375, -0.0068302154541015625, 0.000362396240234375, 0.0075550079345703125, 0.01474761962890625, 0.021940231323242188, 0.029132843017578125, 0.03632545471191406, 0.04351806640625, 0.05071067810058594, 0.057903289794921875, 0.06509590148925781, 0.07228851318359375, 0.07948112487792969, 0.08667373657226562, 0.09386634826660156, 0.1010589599609375, 0.10825157165527344, 0.11544418334960938, 0.12263679504394531, 0.12982940673828125, 0.1370220184326172, 0.14421463012695312, 0.15140724182128906, 0.158599853515625, 0.16579246520996094, 0.17298507690429688, 0.1801776885986328, 0.18737030029296875, 0.1945629119873047, 0.20175552368164062, 0.20894813537597656, 0.2161407470703125, 0.22333335876464844, 0.23052597045898438, 0.2377185821533203, 0.24491119384765625, 0.2521038055419922, 0.2592964172363281, 0.26648902893066406, 0.273681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 3.0, 7.0, 11.0, 8.0, 24.0, 34.0, 38.0, 67.0, 93.0, 98.0, 125.0, 134.0, 95.0, 70.0, 53.0, 45.0, 39.0, 15.0, 17.0, 6.0, 4.0, 6.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9110559225082397, -0.8727821111679077, -0.8345083594322205, -0.7962346076965332, -0.7579607963562012, -0.7196869850158691, -0.6814132332801819, -0.6431394815444946, -0.6048656702041626, -0.5665918588638306, -0.5283181071281433, -0.49004432559013367, -0.451770544052124, -0.4134967625141144, -0.37522298097610474, -0.3369491994380951, -0.29867541790008545, -0.2604016363620758, -0.22212785482406616, -0.18385407328605652, -0.14558029174804688, -0.10730651021003723, -0.06903272867202759, -0.030758947134017944, 0.007514834403991699, 0.04578861594200134, 0.08406239748001099, 0.12233617901802063, 0.16060996055603027, 0.19888374209403992, 0.23715752363204956, 0.2754313051700592, 0.3137049674987793, 0.35197874903678894, 0.3902525305747986, 0.4285263121128082, 0.46680009365081787, 0.5050739049911499, 0.5433476567268372, 0.5816214084625244, 0.6198952198028564, 0.6581690311431885, 0.6964427828788757, 0.734716534614563, 0.772990345954895, 0.811264157295227, 0.8495379090309143, 0.8878116607666016, 0.9260854721069336, 0.9643592834472656, 1.0026330947875977, 1.0409067869186401, 1.0791805982589722, 1.1174544095993042, 1.1557281017303467, 1.1940019130706787, 1.2322757244110107, 1.2705495357513428, 1.3088233470916748, 1.3470970392227173, 1.3853708505630493, 1.4236446619033813, 1.4619183540344238, 1.5001921653747559, 1.538465976715088]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 6.0, 8.0, 17.0, 21.0, 24.0, 16.0, 14.0, 21.0, 31.0, 25.0, 22.0, 31.0, 28.0, 36.0, 35.0, 41.0, 39.0, 32.0, 40.0, 30.0, 48.0, 30.0, 32.0, 31.0, 23.0, 21.0, 26.0, 37.0, 28.0, 27.0, 21.0, 14.0, 20.0, 9.0, 17.0, 8.0, 8.0, 10.0, 4.0, 6.0, 5.0, 7.0, 5.0, 3.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.45690181851387024, -0.4425037205219269, -0.4281056523323059, -0.41370755434036255, -0.3993094861507416, -0.3849113881587982, -0.37051331996917725, -0.3561152219772339, -0.3417171239852905, -0.32731902599334717, -0.3129209578037262, -0.29852285981178284, -0.28412479162216187, -0.2697266936302185, -0.25532859563827515, -0.24093052744865417, -0.226532444357872, -0.21213436126708984, -0.19773627817630768, -0.1833381950855255, -0.16894009709358215, -0.1545420140028, -0.14014393091201782, -0.12574583292007446, -0.1113477572798729, -0.09694967418909073, -0.08255158364772797, -0.0681535005569458, -0.05375541374087334, -0.03935732692480087, -0.024959243834018707, -0.010561153292655945, 0.0038369297981262207, 0.018235016614198685, 0.03263310343027115, 0.047031186521053314, 0.06142927333712578, 0.07582736015319824, 0.09022544324398041, 0.10462353378534317, 0.11902161687612534, 0.1334197074174881, 0.14781779050827026, 0.16221587359905243, 0.1766139566898346, 0.19101205468177795, 0.20541012287139893, 0.21980822086334229, 0.23420630395412445, 0.24860438704490662, 0.26300248503685, 0.27740055322647095, 0.2917986512184143, 0.30619674921035767, 0.32059481739997864, 0.334992915391922, 0.34939098358154297, 0.36378908157348633, 0.3781871497631073, 0.39258524775505066, 0.40698331594467163, 0.421381413936615, 0.43577951192855835, 0.4501775801181793, 0.4645756781101227]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 11.0, 19.0, 20.0, 40.0, 85.0, 189.0, 426.0, 1794.0, 11772.0, 134190.0, 736437.0, 147911.0, 12897.0, 1887.0, 473.0, 184.0, 93.0, 49.0, 29.0, 19.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35302734375, -0.3424949645996094, -0.33196258544921875, -0.3214302062988281, -0.3108978271484375, -0.3003654479980469, -0.28983306884765625, -0.2793006896972656, -0.268768310546875, -0.2582359313964844, -0.24770355224609375, -0.23717117309570312, -0.2266387939453125, -0.21610641479492188, -0.20557403564453125, -0.19504165649414062, -0.18450927734375, -0.17397689819335938, -0.16344451904296875, -0.15291213989257812, -0.1423797607421875, -0.13184738159179688, -0.12131500244140625, -0.11078262329101562, -0.100250244140625, -0.08971786499023438, -0.07918548583984375, -0.06865310668945312, -0.0581207275390625, -0.047588348388671875, -0.03705596923828125, -0.026523590087890625, -0.0159912109375, -0.005458831787109375, 0.00507354736328125, 0.015605926513671875, 0.0261383056640625, 0.036670684814453125, 0.04720306396484375, 0.057735443115234375, 0.068267822265625, 0.07880020141601562, 0.08933258056640625, 0.09986495971679688, 0.1103973388671875, 0.12092971801757812, 0.13146209716796875, 0.14199447631835938, 0.15252685546875, 0.16305923461914062, 0.17359161376953125, 0.18412399291992188, 0.1946563720703125, 0.20518875122070312, 0.21572113037109375, 0.22625350952148438, 0.236785888671875, 0.24731826782226562, 0.25785064697265625, 0.2683830261230469, 0.2789154052734375, 0.2894477844238281, 0.29998016357421875, 0.3105125427246094, 0.321044921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 7.0, 10.0, 9.0, 11.0, 23.0, 17.0, 22.0, 28.0, 33.0, 39.0, 45.0, 47.0, 54.0, 58.0, 45.0, 59.0, 58.0, 45.0, 47.0, 42.0, 44.0, 41.0, 40.0, 29.0, 31.0, 23.0, 19.0, 15.0, 10.0, 7.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4765625, -0.4632568359375, -0.449951171875, -0.4366455078125, -0.42333984375, -0.4100341796875, -0.396728515625, -0.3834228515625, -0.3701171875, -0.3568115234375, -0.343505859375, -0.3302001953125, -0.31689453125, -0.3035888671875, -0.290283203125, -0.2769775390625, -0.263671875, -0.2503662109375, -0.237060546875, -0.2237548828125, -0.21044921875, -0.1971435546875, -0.183837890625, -0.1705322265625, -0.1572265625, -0.1439208984375, -0.130615234375, -0.1173095703125, -0.10400390625, -0.0906982421875, -0.077392578125, -0.0640869140625, -0.05078125, -0.0374755859375, -0.024169921875, -0.0108642578125, 0.00244140625, 0.0157470703125, 0.029052734375, 0.0423583984375, 0.0556640625, 0.0689697265625, 0.082275390625, 0.0955810546875, 0.10888671875, 0.1221923828125, 0.135498046875, 0.1488037109375, 0.162109375, 0.1754150390625, 0.188720703125, 0.2020263671875, 0.21533203125, 0.2286376953125, 0.241943359375, 0.2552490234375, 0.2685546875, 0.2818603515625, 0.295166015625, 0.3084716796875, 0.32177734375, 0.3350830078125, 0.348388671875, 0.3616943359375, 0.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 13.0, 9.0, 6.0, 8.0, 22.0, 24.0, 32.0, 56.0, 73.0, 110.0, 182.0, 242.0, 428.0, 694.0, 1366.0, 2864.0, 6578.0, 16814.0, 46302.0, 127870.0, 287929.0, 313299.0, 153183.0, 55964.0, 20068.0, 7533.0, 3237.0, 1529.0, 839.0, 440.0, 280.0, 169.0, 104.0, 77.0, 57.0, 45.0, 23.0, 25.0, 15.0, 10.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11260986328125, -0.10860157012939453, -0.10459327697753906, -0.1005849838256836, -0.09657669067382812, -0.09256839752197266, -0.08856010437011719, -0.08455181121826172, -0.08054351806640625, -0.07653522491455078, -0.07252693176269531, -0.06851863861083984, -0.06451034545898438, -0.060502052307128906, -0.05649375915527344, -0.05248546600341797, -0.0484771728515625, -0.04446887969970703, -0.04046058654785156, -0.036452293395996094, -0.032444000244140625, -0.028435707092285156, -0.024427413940429688, -0.02041912078857422, -0.01641082763671875, -0.012402534484863281, -0.008394241333007812, -0.004385948181152344, -0.000377655029296875, 0.0036306381225585938, 0.0076389312744140625, 0.011647224426269531, 0.015655517578125, 0.01966381072998047, 0.023672103881835938, 0.027680397033691406, 0.031688690185546875, 0.035696983337402344, 0.03970527648925781, 0.04371356964111328, 0.04772186279296875, 0.05173015594482422, 0.05573844909667969, 0.059746742248535156, 0.06375503540039062, 0.0677633285522461, 0.07177162170410156, 0.07577991485595703, 0.0797882080078125, 0.08379650115966797, 0.08780479431152344, 0.0918130874633789, 0.09582138061523438, 0.09982967376708984, 0.10383796691894531, 0.10784626007080078, 0.11185455322265625, 0.11586284637451172, 0.11987113952636719, 0.12387943267822266, 0.12788772583007812, 0.1318960189819336, 0.13590431213378906, 0.13991260528564453, 0.1439208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 5.0, 5.0, 11.0, 11.0, 12.0, 20.0, 9.0, 23.0, 17.0, 22.0, 22.0, 30.0, 31.0, 23.0, 38.0, 45.0, 51.0, 28.0, 47.0, 46.0, 50.0, 43.0, 42.0, 59.0, 41.0, 33.0, 36.0, 22.0, 28.0, 32.0, 25.0, 16.0, 15.0, 16.0, 8.0, 12.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.619781494140625, -0.59747314453125, -0.575164794921875, -0.5528564453125, -0.530548095703125, -0.50823974609375, -0.485931396484375, -0.463623046875, -0.441314697265625, -0.41900634765625, -0.396697998046875, -0.3743896484375, -0.352081298828125, -0.32977294921875, -0.307464599609375, -0.28515625, -0.262847900390625, -0.24053955078125, -0.218231201171875, -0.1959228515625, -0.173614501953125, -0.15130615234375, -0.128997802734375, -0.106689453125, -0.084381103515625, -0.06207275390625, -0.039764404296875, -0.0174560546875, 0.004852294921875, 0.02716064453125, 0.049468994140625, 0.07177734375, 0.094085693359375, 0.11639404296875, 0.138702392578125, 0.1610107421875, 0.183319091796875, 0.20562744140625, 0.227935791015625, 0.250244140625, 0.272552490234375, 0.29486083984375, 0.317169189453125, 0.3394775390625, 0.361785888671875, 0.38409423828125, 0.406402587890625, 0.4287109375, 0.451019287109375, 0.47332763671875, 0.495635986328125, 0.5179443359375, 0.540252685546875, 0.56256103515625, 0.584869384765625, 0.607177734375, 0.629486083984375, 0.65179443359375, 0.674102783203125, 0.6964111328125, 0.718719482421875, 0.74102783203125, 0.763336181640625, 0.78564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 10.0, 19.0, 35.0, 47.0, 85.0, 142.0, 233.0, 403.0, 846.0, 1865.0, 4684.0, 14723.0, 58215.0, 274625.0, 496409.0, 149104.0, 32217.0, 9032.0, 3133.0, 1304.0, 646.0, 318.0, 164.0, 113.0, 66.0, 39.0, 16.0, 10.0, 6.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0615234375, -0.059493064880371094, -0.05746269226074219, -0.05543231964111328, -0.053401947021484375, -0.05137157440185547, -0.04934120178222656, -0.047310829162597656, -0.04528045654296875, -0.043250083923339844, -0.04121971130371094, -0.03918933868408203, -0.037158966064453125, -0.03512859344482422, -0.03309822082519531, -0.031067848205566406, -0.0290374755859375, -0.027007102966308594, -0.024976730346679688, -0.02294635772705078, -0.020915985107421875, -0.01888561248779297, -0.016855239868164062, -0.014824867248535156, -0.01279449462890625, -0.010764122009277344, -0.008733749389648438, -0.006703376770019531, -0.004673004150390625, -0.0026426315307617188, -0.0006122589111328125, 0.0014181137084960938, 0.003448486328125, 0.005478858947753906, 0.0075092315673828125, 0.009539604187011719, 0.011569976806640625, 0.013600349426269531, 0.015630722045898438, 0.017661094665527344, 0.01969146728515625, 0.021721839904785156, 0.023752212524414062, 0.02578258514404297, 0.027812957763671875, 0.02984333038330078, 0.03187370300292969, 0.033904075622558594, 0.0359344482421875, 0.037964820861816406, 0.03999519348144531, 0.04202556610107422, 0.044055938720703125, 0.04608631134033203, 0.04811668395996094, 0.050147056579589844, 0.05217742919921875, 0.054207801818847656, 0.05623817443847656, 0.05826854705810547, 0.060298919677734375, 0.06232929229736328, 0.06435966491699219, 0.0663900375366211, 0.06842041015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 3.0, 8.0, 3.0, 15.0, 10.0, 19.0, 39.0, 34.0, 37.0, 51.0, 47.0, 82.0, 82.0, 71.0, 89.0, 85.0, 89.0, 53.0, 41.0, 33.0, 23.0, 20.0, 16.0, 10.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8431805074214935e-05, -1.773051917552948e-05, -1.7029233276844025e-05, -1.632794737815857e-05, -1.5626661479473114e-05, -1.4925375580787659e-05, -1.4224089682102203e-05, -1.3522803783416748e-05, -1.2821517884731293e-05, -1.2120231986045837e-05, -1.1418946087360382e-05, -1.0717660188674927e-05, -1.0016374289989471e-05, -9.315088391304016e-06, -8.61380249261856e-06, -7.912516593933105e-06, -7.21123069524765e-06, -6.509944796562195e-06, -5.8086588978767395e-06, -5.107372999191284e-06, -4.406087100505829e-06, -3.7048012018203735e-06, -3.0035153031349182e-06, -2.302229404449463e-06, -1.6009435057640076e-06, -8.996576070785522e-07, -1.9837170839309692e-07, 5.029141902923584e-07, 1.2042000889778137e-06, 1.905485987663269e-06, 2.6067718863487244e-06, 3.3080577850341797e-06, 4.009343683719635e-06, 4.71062958240509e-06, 5.411915481090546e-06, 6.113201379776001e-06, 6.814487278461456e-06, 7.515773177146912e-06, 8.217059075832367e-06, 8.918344974517822e-06, 9.619630873203278e-06, 1.0320916771888733e-05, 1.1022202670574188e-05, 1.1723488569259644e-05, 1.2424774467945099e-05, 1.3126060366630554e-05, 1.382734626531601e-05, 1.4528632164001465e-05, 1.522991806268692e-05, 1.5931203961372375e-05, 1.663248986005783e-05, 1.7333775758743286e-05, 1.803506165742874e-05, 1.8736347556114197e-05, 1.9437633454799652e-05, 2.0138919353485107e-05, 2.0840205252170563e-05, 2.1541491150856018e-05, 2.2242777049541473e-05, 2.294406294822693e-05, 2.3645348846912384e-05, 2.434663474559784e-05, 2.5047920644283295e-05, 2.574920654296875e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 30.0, 45.0, 59.0, 81.0, 123.0, 203.0, 423.0, 894.0, 2348.0, 6912.0, 23209.0, 88493.0, 323779.0, 415026.0, 136397.0, 34999.0, 9858.0, 3155.0, 1190.0, 502.0, 263.0, 148.0, 85.0, 64.0, 45.0, 25.0, 22.0, 22.0, 16.0, 7.0, 7.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.060089111328125, -0.05827665328979492, -0.056464195251464844, -0.054651737213134766, -0.05283927917480469, -0.05102682113647461, -0.04921436309814453, -0.04740190505981445, -0.045589447021484375, -0.0437769889831543, -0.04196453094482422, -0.04015207290649414, -0.03833961486816406, -0.036527156829833984, -0.034714698791503906, -0.03290224075317383, -0.03108978271484375, -0.029277324676513672, -0.027464866638183594, -0.025652408599853516, -0.023839950561523438, -0.02202749252319336, -0.02021503448486328, -0.018402576446533203, -0.016590118408203125, -0.014777660369873047, -0.012965202331542969, -0.01115274429321289, -0.009340286254882812, -0.007527828216552734, -0.005715370178222656, -0.003902912139892578, -0.0020904541015625, -0.0002779960632324219, 0.0015344619750976562, 0.0033469200134277344, 0.0051593780517578125, 0.006971836090087891, 0.008784294128417969, 0.010596752166748047, 0.012409210205078125, 0.014221668243408203, 0.01603412628173828, 0.01784658432006836, 0.019659042358398438, 0.021471500396728516, 0.023283958435058594, 0.025096416473388672, 0.02690887451171875, 0.028721332550048828, 0.030533790588378906, 0.032346248626708984, 0.03415870666503906, 0.03597116470336914, 0.03778362274169922, 0.0395960807800293, 0.041408538818359375, 0.04322099685668945, 0.04503345489501953, 0.04684591293334961, 0.04865837097167969, 0.050470829010009766, 0.052283287048339844, 0.05409574508666992, 0.055908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 22.0, 14.0, 17.0, 20.0, 19.0, 35.0, 36.0, 43.0, 58.0, 79.0, 64.0, 65.0, 76.0, 63.0, 56.0, 50.0, 31.0, 40.0, 25.0, 28.0, 20.0, 27.0, 11.0, 13.0, 11.0, 6.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013987421989440918, -0.013570547103881836, -0.013153672218322754, -0.012736797332763672, -0.01231992244720459, -0.011903047561645508, -0.011486172676086426, -0.011069297790527344, -0.010652422904968262, -0.01023554801940918, -0.009818673133850098, -0.009401798248291016, -0.008984923362731934, -0.008568048477172852, -0.00815117359161377, -0.0077342987060546875, -0.0073174238204956055, -0.0069005489349365234, -0.006483674049377441, -0.006066799163818359, -0.005649924278259277, -0.005233049392700195, -0.004816174507141113, -0.004399299621582031, -0.003982424736022949, -0.003565549850463867, -0.003148674964904785, -0.002731800079345703, -0.002314925193786621, -0.001898050308227539, -0.001481175422668457, -0.001064300537109375, -0.000647425651550293, -0.00023055076599121094, 0.0001863241195678711, 0.0006031990051269531, 0.0010200738906860352, 0.0014369487762451172, 0.0018538236618041992, 0.0022706985473632812, 0.0026875734329223633, 0.0031044483184814453, 0.0035213232040405273, 0.003938198089599609, 0.004355072975158691, 0.0047719478607177734, 0.0051888227462768555, 0.0056056976318359375, 0.0060225725173950195, 0.0064394474029541016, 0.006856322288513184, 0.007273197174072266, 0.007690072059631348, 0.00810694694519043, 0.008523821830749512, 0.008940696716308594, 0.009357571601867676, 0.009774446487426758, 0.01019132137298584, 0.010608196258544922, 0.011025071144104004, 0.011441946029663086, 0.011858820915222168, 0.01227569580078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 10.0, 10.0, 17.0, 42.0, 70.0, 118.0, 171.0, 201.0, 141.0, 85.0, 59.0, 30.0, 16.0, 13.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970798134803772, -0.9376470446586609, -0.904495894908905, -0.871344804763794, -0.8381936550140381, -0.805042564868927, -0.7718914747238159, -0.7387403249740601, -0.705589234828949, -0.6724381446838379, -0.639286994934082, -0.606135904788971, -0.5729848146438599, -0.539833664894104, -0.5066825747489929, -0.47353145480155945, -0.440380334854126, -0.4072292149066925, -0.37407809495925903, -0.34092700481414795, -0.3077758848667145, -0.274624764919281, -0.24147365987300873, -0.20832255482673645, -0.17517143487930298, -0.1420203149318695, -0.10886920988559723, -0.07571809738874435, -0.04256698489189148, -0.009415864944458008, 0.02373524010181427, 0.05688634514808655, 0.09003746509552002, 0.1231885775923729, 0.15633969008922577, 0.18949079513549805, 0.22264191508293152, 0.255793035030365, 0.2889441251754761, 0.32209524512290955, 0.355246365070343, 0.3883974850177765, 0.42154860496520996, 0.45469969511032104, 0.4878508150577545, 0.521001935005188, 0.5541530251502991, 0.5873041152954102, 0.620455265045166, 0.6536063551902771, 0.686757504940033, 0.719908595085144, 0.7530597448348999, 0.786210834980011, 0.8193619251251221, 0.8525130748748779, 0.885664165019989, 0.9188152551651001, 0.951966404914856, 0.985117495059967, 1.0182685852050781, 1.051419734954834, 1.0845708847045898, 1.1177219152450562, 1.150873064994812]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 7.0, 8.0, 5.0, 17.0, 18.0, 27.0, 30.0, 25.0, 35.0, 41.0, 42.0, 42.0, 60.0, 56.0, 60.0, 46.0, 50.0, 61.0, 50.0, 33.0, 41.0, 40.0, 46.0, 24.0, 27.0, 19.0, 14.0, 11.0, 10.0, 5.0, 10.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4869082570075989, -0.4742285907268524, -0.46154892444610596, -0.4488692283630371, -0.43618956208229065, -0.4235098958015442, -0.41083022952079773, -0.39815056324005127, -0.3854708671569824, -0.37279120087623596, -0.3601115345954895, -0.34743183851242065, -0.3347521722316742, -0.32207250595092773, -0.3093928396701813, -0.2967131733894348, -0.28403347730636597, -0.2713538110256195, -0.25867414474487305, -0.2459944635629654, -0.23331478238105774, -0.22063511610031128, -0.20795544981956482, -0.19527576863765717, -0.1825961172580719, -0.16991645097732544, -0.15723676979541779, -0.14455710351467133, -0.13187742233276367, -0.11919775605201721, -0.10651808232069016, -0.0938384085893631, -0.08115872740745544, -0.06847905367612839, -0.05579937994480133, -0.04311970993876457, -0.030440036207437515, -0.017760366201400757, -0.0050806924700737, 0.007598981261253357, 0.020278654992580414, 0.03295832872390747, 0.04563800245523453, 0.058317672461271286, 0.07099734246730804, 0.0836770161986351, 0.09635668992996216, 0.10903636366128922, 0.12171603739261627, 0.13439570367336273, 0.14707538485527039, 0.15975505113601685, 0.1724347323179245, 0.18511439859867096, 0.1977940797805786, 0.21047374606132507, 0.22315341234207153, 0.235833078622818, 0.24851275980472565, 0.2611924409866333, 0.27387210726737976, 0.2865517735481262, 0.2992314398288727, 0.31191110610961914, 0.324590802192688]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 16.0, 19.0, 35.0, 39.0, 86.0, 370.0, 3843.0, 470761.0, 568387.0, 4371.0, 383.0, 98.0, 49.0, 22.0, 18.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.0644378662109375, -1.999969482421875, -1.9355010986328125, -1.87103271484375, -1.8065643310546875, -1.742095947265625, -1.6776275634765625, -1.6131591796875, -1.5486907958984375, -1.484222412109375, -1.4197540283203125, -1.35528564453125, -1.2908172607421875, -1.226348876953125, -1.1618804931640625, -1.097412109375, -1.0329437255859375, -0.968475341796875, -0.9040069580078125, -0.83953857421875, -0.7750701904296875, -0.710601806640625, -0.6461334228515625, -0.5816650390625, -0.5171966552734375, -0.452728271484375, -0.3882598876953125, -0.32379150390625, -0.2593231201171875, -0.194854736328125, -0.1303863525390625, -0.06591796875, -0.0014495849609375, 0.063018798828125, 0.1274871826171875, 0.19195556640625, 0.2564239501953125, 0.320892333984375, 0.3853607177734375, 0.4498291015625, 0.5142974853515625, 0.578765869140625, 0.6432342529296875, 0.70770263671875, 0.7721710205078125, 0.836639404296875, 0.9011077880859375, 0.965576171875, 1.0300445556640625, 1.094512939453125, 1.1589813232421875, 1.22344970703125, 1.2879180908203125, 1.352386474609375, 1.4168548583984375, 1.4813232421875, 1.5457916259765625, 1.610260009765625, 1.6747283935546875, 1.73919677734375, 1.8036651611328125, 1.868133544921875, 1.9326019287109375, 1.9970703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 16.0, 25.0, 30.0, 43.0, 76.0, 102.0, 124.0, 133.0, 115.0, 102.0, 86.0, 60.0, 36.0, 25.0, 22.0, 10.0, 8.0, 2.0, 2.0], "bins": [-3.03125, -2.9737701416015625, -2.916290283203125, -2.8588104248046875, -2.80133056640625, -2.7438507080078125, -2.686370849609375, -2.6288909912109375, -2.5714111328125, -2.5139312744140625, -2.456451416015625, -2.3989715576171875, -2.34149169921875, -2.2840118408203125, -2.226531982421875, -2.1690521240234375, -2.111572265625, -2.0540924072265625, -1.996612548828125, -1.9391326904296875, -1.88165283203125, -1.8241729736328125, -1.766693115234375, -1.7092132568359375, -1.6517333984375, -1.5942535400390625, -1.536773681640625, -1.4792938232421875, -1.42181396484375, -1.3643341064453125, -1.306854248046875, -1.2493743896484375, -1.19189453125, -1.1344146728515625, -1.076934814453125, -1.0194549560546875, -0.96197509765625, -0.9044952392578125, -0.847015380859375, -0.7895355224609375, -0.7320556640625, -0.6745758056640625, -0.617095947265625, -0.5596160888671875, -0.50213623046875, -0.4446563720703125, -0.387176513671875, -0.3296966552734375, -0.272216796875, -0.2147369384765625, -0.157257080078125, -0.0997772216796875, -0.04229736328125, 0.0151824951171875, 0.072662353515625, 0.1301422119140625, 0.1876220703125, 0.2451019287109375, 0.302581787109375, 0.3600616455078125, 0.41754150390625, 0.4750213623046875, 0.532501220703125, 0.5899810791015625, 0.6474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 7.0, 13.0, 7.0, 18.0, 15.0, 22.0, 42.0, 59.0, 70.0, 106.0, 117.0, 127.0, 216.0, 291.0, 555.0, 2601.0, 33212.0, 734423.0, 264754.0, 9416.0, 1126.0, 385.0, 243.0, 180.0, 122.0, 96.0, 79.0, 66.0, 49.0, 45.0, 14.0, 22.0, 13.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.2431640625, -1.2093734741210938, -1.1755828857421875, -1.1417922973632812, -1.108001708984375, -1.0742111206054688, -1.0404205322265625, -1.0066299438476562, -0.97283935546875, -0.9390487670898438, -0.9052581787109375, -0.8714675903320312, -0.837677001953125, -0.8038864135742188, -0.7700958251953125, -0.7363052368164062, -0.7025146484375, -0.6687240600585938, -0.6349334716796875, -0.6011428833007812, -0.567352294921875, -0.5335617065429688, -0.4997711181640625, -0.46598052978515625, -0.43218994140625, -0.39839935302734375, -0.3646087646484375, -0.33081817626953125, -0.297027587890625, -0.26323699951171875, -0.2294464111328125, -0.19565582275390625, -0.161865234375, -0.12807464599609375, -0.0942840576171875, -0.06049346923828125, -0.026702880859375, 0.00708770751953125, 0.0408782958984375, 0.07466888427734375, 0.10845947265625, 0.14225006103515625, 0.1760406494140625, 0.20983123779296875, 0.243621826171875, 0.27741241455078125, 0.3112030029296875, 0.34499359130859375, 0.3787841796875, 0.41257476806640625, 0.4463653564453125, 0.48015594482421875, 0.513946533203125, 0.5477371215820312, 0.5815277099609375, 0.6153182983398438, 0.64910888671875, 0.6828994750976562, 0.7166900634765625, 0.7504806518554688, 0.784271240234375, 0.8180618286132812, 0.8518524169921875, 0.8856430053710938, 0.91943359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 10.0, 16.0, 13.0, 17.0, 20.0, 16.0, 22.0, 25.0, 22.0, 30.0, 25.0, 39.0, 38.0, 38.0, 38.0, 40.0, 36.0, 31.0, 34.0, 45.0, 35.0, 42.0, 41.0, 33.0, 31.0, 35.0, 26.0, 31.0, 19.0, 17.0, 17.0, 15.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 5.0, 4.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6005859375, -0.5823593139648438, -0.5641326904296875, -0.5459060668945312, -0.527679443359375, -0.5094528198242188, -0.4912261962890625, -0.47299957275390625, -0.45477294921875, -0.43654632568359375, -0.4183197021484375, -0.40009307861328125, -0.381866455078125, -0.36363983154296875, -0.3454132080078125, -0.32718658447265625, -0.3089599609375, -0.29073333740234375, -0.2725067138671875, -0.25428009033203125, -0.236053466796875, -0.21782684326171875, -0.1996002197265625, -0.18137359619140625, -0.16314697265625, -0.14492034912109375, -0.1266937255859375, -0.10846710205078125, -0.090240478515625, -0.07201385498046875, -0.0537872314453125, -0.03556060791015625, -0.017333984375, 0.00089263916015625, 0.0191192626953125, 0.03734588623046875, 0.055572509765625, 0.07379913330078125, 0.0920257568359375, 0.11025238037109375, 0.12847900390625, 0.14670562744140625, 0.1649322509765625, 0.18315887451171875, 0.201385498046875, 0.21961212158203125, 0.2378387451171875, 0.25606536865234375, 0.2742919921875, 0.29251861572265625, 0.3107452392578125, 0.32897186279296875, 0.347198486328125, 0.36542510986328125, 0.3836517333984375, 0.40187835693359375, 0.42010498046875, 0.43833160400390625, 0.4565582275390625, 0.47478485107421875, 0.493011474609375, 0.5112380981445312, 0.5294647216796875, 0.5476913452148438, 0.56591796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 11.0, 8.0, 18.0, 27.0, 36.0, 42.0, 63.0, 100.0, 161.0, 304.0, 665.0, 1864.0, 7142.0, 36723.0, 244075.0, 572795.0, 153429.0, 23449.0, 4904.0, 1453.0, 515.0, 253.0, 138.0, 114.0, 62.0, 49.0, 28.0, 18.0, 17.0, 14.0, 8.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.162109375, -0.15677261352539062, -0.15143585205078125, -0.14609909057617188, -0.1407623291015625, -0.13542556762695312, -0.13008880615234375, -0.12475204467773438, -0.119415283203125, -0.11407852172851562, -0.10874176025390625, -0.10340499877929688, -0.0980682373046875, -0.09273147583007812, -0.08739471435546875, -0.08205795288085938, -0.07672119140625, -0.07138442993164062, -0.06604766845703125, -0.060710906982421875, -0.0553741455078125, -0.050037384033203125, -0.04470062255859375, -0.039363861083984375, -0.034027099609375, -0.028690338134765625, -0.02335357666015625, -0.018016815185546875, -0.0126800537109375, -0.007343292236328125, -0.00200653076171875, 0.003330230712890625, 0.0086669921875, 0.014003753662109375, 0.01934051513671875, 0.024677276611328125, 0.0300140380859375, 0.035350799560546875, 0.04068756103515625, 0.046024322509765625, 0.051361083984375, 0.056697845458984375, 0.06203460693359375, 0.06737136840820312, 0.0727081298828125, 0.07804489135742188, 0.08338165283203125, 0.08871841430664062, 0.09405517578125, 0.09939193725585938, 0.10472869873046875, 0.11006546020507812, 0.1154022216796875, 0.12073898315429688, 0.12607574462890625, 0.13141250610351562, 0.136749267578125, 0.14208602905273438, 0.14742279052734375, 0.15275955200195312, 0.1580963134765625, 0.16343307495117188, 0.16876983642578125, 0.17410659790039062, 0.179443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 11.0, 14.0, 19.0, 21.0, 42.0, 43.0, 68.0, 80.0, 98.0, 115.0, 103.0, 82.0, 95.0, 53.0, 46.0, 45.0, 18.0, 13.0, 4.0, 2.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.528594970703125e-05, -3.437511622905731e-05, -3.3464282751083374e-05, -3.2553449273109436e-05, -3.16426157951355e-05, -3.073178231716156e-05, -2.9820948839187622e-05, -2.8910115361213684e-05, -2.7999281883239746e-05, -2.7088448405265808e-05, -2.617761492729187e-05, -2.5266781449317932e-05, -2.4355947971343994e-05, -2.3445114493370056e-05, -2.2534281015396118e-05, -2.162344753742218e-05, -2.0712614059448242e-05, -1.9801780581474304e-05, -1.8890947103500366e-05, -1.7980113625526428e-05, -1.706928014755249e-05, -1.6158446669578552e-05, -1.5247613191604614e-05, -1.4336779713630676e-05, -1.3425946235656738e-05, -1.25151127576828e-05, -1.1604279279708862e-05, -1.0693445801734924e-05, -9.782612323760986e-06, -8.871778845787048e-06, -7.96094536781311e-06, -7.050111889839172e-06, -6.139278411865234e-06, -5.228444933891296e-06, -4.317611455917358e-06, -3.4067779779434204e-06, -2.4959444999694824e-06, -1.5851110219955444e-06, -6.742775440216064e-07, 2.3655593395233154e-07, 1.1473894119262695e-06, 2.0582228899002075e-06, 2.9690563678741455e-06, 3.8798898458480835e-06, 4.7907233238220215e-06, 5.7015568017959595e-06, 6.6123902797698975e-06, 7.5232237577438354e-06, 8.434057235717773e-06, 9.344890713691711e-06, 1.025572419166565e-05, 1.1166557669639587e-05, 1.2077391147613525e-05, 1.2988224625587463e-05, 1.3899058103561401e-05, 1.480989158153534e-05, 1.5720725059509277e-05, 1.6631558537483215e-05, 1.7542392015457153e-05, 1.845322549343109e-05, 1.936405897140503e-05, 2.0274892449378967e-05, 2.1185725927352905e-05, 2.2096559405326843e-05, 2.300739288330078e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 12.0, 7.0, 14.0, 16.0, 28.0, 51.0, 67.0, 110.0, 251.0, 516.0, 1706.0, 8177.0, 83566.0, 729317.0, 204609.0, 15988.0, 2730.0, 729.0, 293.0, 137.0, 89.0, 46.0, 24.0, 22.0, 14.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2811851501464844, -0.27257537841796875, -0.2639656066894531, -0.2553558349609375, -0.24674606323242188, -0.23813629150390625, -0.22952651977539062, -0.220916748046875, -0.21230697631835938, -0.20369720458984375, -0.19508743286132812, -0.1864776611328125, -0.17786788940429688, -0.16925811767578125, -0.16064834594726562, -0.15203857421875, -0.14342880249023438, -0.13481903076171875, -0.12620925903320312, -0.1175994873046875, -0.10898971557617188, -0.10037994384765625, -0.09177017211914062, -0.083160400390625, -0.07455062866210938, -0.06594085693359375, -0.057331085205078125, -0.0487213134765625, -0.040111541748046875, -0.03150177001953125, -0.022891998291015625, -0.0142822265625, -0.005672454833984375, 0.00293731689453125, 0.011547088623046875, 0.0201568603515625, 0.028766632080078125, 0.03737640380859375, 0.045986175537109375, 0.054595947265625, 0.06320571899414062, 0.07181549072265625, 0.08042526245117188, 0.0890350341796875, 0.09764480590820312, 0.10625457763671875, 0.11486434936523438, 0.12347412109375, 0.13208389282226562, 0.14069366455078125, 0.14930343627929688, 0.1579132080078125, 0.16652297973632812, 0.17513275146484375, 0.18374252319335938, 0.192352294921875, 0.20096206665039062, 0.20957183837890625, 0.21818161010742188, 0.2267913818359375, 0.23540115356445312, 0.24401092529296875, 0.2526206970214844, 0.26123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 9.0, 17.0, 27.0, 33.0, 45.0, 44.0, 46.0, 61.0, 65.0, 63.0, 84.0, 88.0, 67.0, 45.0, 47.0, 47.0, 41.0, 34.0, 23.0, 18.0, 18.0, 17.0, 11.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07257080078125, -0.07035064697265625, -0.0681304931640625, -0.06591033935546875, -0.063690185546875, -0.06147003173828125, -0.0592498779296875, -0.05702972412109375, -0.0548095703125, -0.05258941650390625, -0.0503692626953125, -0.04814910888671875, -0.045928955078125, -0.04370880126953125, -0.0414886474609375, -0.03926849365234375, -0.03704833984375, -0.03482818603515625, -0.0326080322265625, -0.03038787841796875, -0.028167724609375, -0.02594757080078125, -0.0237274169921875, -0.02150726318359375, -0.019287109375, -0.01706695556640625, -0.0148468017578125, -0.01262664794921875, -0.010406494140625, -0.00818634033203125, -0.0059661865234375, -0.00374603271484375, -0.00152587890625, 0.00069427490234375, 0.0029144287109375, 0.00513458251953125, 0.007354736328125, 0.00957489013671875, 0.0117950439453125, 0.01401519775390625, 0.0162353515625, 0.01845550537109375, 0.0206756591796875, 0.02289581298828125, 0.025115966796875, 0.02733612060546875, 0.0295562744140625, 0.03177642822265625, 0.03399658203125, 0.03621673583984375, 0.0384368896484375, 0.04065704345703125, 0.042877197265625, 0.04509735107421875, 0.0473175048828125, 0.04953765869140625, 0.0517578125, 0.05397796630859375, 0.0561981201171875, 0.05841827392578125, 0.060638427734375, 0.06285858154296875, 0.0650787353515625, 0.06729888916015625, 0.06951904296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 14.0, 49.0, 254.0, 436.0, 194.0, 49.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.422909736633301, -4.248702049255371, -4.074494361877441, -3.9002864360809326, -3.726078510284424, -3.551870822906494, -3.3776631355285645, -3.2034554481506348, -3.029247522354126, -2.8550398349761963, -2.6808319091796875, -2.506624221801758, -2.332416534423828, -2.1582086086273193, -1.9840009212493896, -1.8097931146621704, -1.6355853080749512, -1.461377501487732, -1.2871696949005127, -1.112962007522583, -0.9387542009353638, -0.7645463943481445, -0.5903387069702148, -0.4161309003829956, -0.24192309379577637, -0.06771531701087952, 0.10649245977401733, 0.2807002067565918, 0.45490801334381104, 0.6291158199310303, 0.80332350730896, 0.9775313138961792, 1.1517391204833984, 1.3259469270706177, 1.500154733657837, 1.6743624210357666, 1.8485702276229858, 2.022778034210205, 2.1969857215881348, 2.3711934089660645, 2.5454013347625732, 2.719609022140503, 2.8938169479370117, 3.0680246353149414, 3.242232322692871, 3.41644024848938, 3.5906479358673096, 3.7648558616638184, 3.939063549041748, 4.113271236419678, 4.287478923797607, 4.461687088012695, 4.635894775390625, 4.810102462768555, 4.984310150146484, 5.158517837524414, 5.332725524902344, 5.506933212280273, 5.681140899658203, 5.855348587036133, 6.029556751251221, 6.20376443862915, 6.37797212600708, 6.55217981338501, 6.726387977600098]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 12.0, 12.0, 16.0, 30.0, 36.0, 33.0, 26.0, 43.0, 45.0, 52.0, 51.0, 70.0, 63.0, 58.0, 61.0, 47.0, 59.0, 41.0, 45.0, 42.0, 33.0, 26.0, 30.0, 16.0, 10.0, 15.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.1548409461975098, -2.104698896408081, -2.0545566082000732, -2.0044145584106445, -1.9542725086212158, -1.9041303396224976, -1.8539881706237793, -1.8038461208343506, -1.7537039518356323, -1.703561782836914, -1.6534197330474854, -1.603277564048767, -1.5531355142593384, -1.5029933452606201, -1.4528512954711914, -1.4027091264724731, -1.3525669574737549, -1.3024247884750366, -1.252282738685608, -1.2021405696868896, -1.151998519897461, -1.1018563508987427, -1.0517141819000244, -1.0015721321105957, -0.951430082321167, -0.9012879729270935, -0.85114586353302, -0.8010036945343018, -0.7508615851402283, -0.7007194757461548, -0.6505773663520813, -0.6004352569580078, -0.5502930879592896, -0.5001509785652161, -0.4500088393688202, -0.3998667299747467, -0.34972459077835083, -0.29958248138427734, -0.24944037199020386, -0.19929823279380798, -0.1491561233997345, -0.09901399910449982, -0.048871882259845734, 0.0012702345848083496, 0.05141235888004303, 0.10155448317527771, 0.1516965925693512, 0.20183873176574707, 0.25198084115982056, 0.30212295055389404, 0.3522650897502899, 0.4024071991443634, 0.4525493383407593, 0.5026914477348328, 0.5528335571289062, 0.6029757261276245, 0.6531177759170532, 0.7032598853111267, 0.7534019947052002, 0.8035441637039185, 0.8536862730979919, 0.9038283824920654, 0.9539704918861389, 1.0041126012802124, 1.0542547702789307]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 8.0, 18.0, 17.0, 22.0, 49.0, 57.0, 95.0, 161.0, 258.0, 451.0, 856.0, 1619.0, 3725.0, 8922.0, 26944.0, 103671.0, 436046.0, 1433083.0, 1533489.0, 486195.0, 111491.0, 29328.0, 9631.0, 3793.0, 1919.0, 992.0, 539.0, 329.0, 184.0, 126.0, 70.0, 52.0, 41.0, 20.0, 26.0, 12.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5667800903320312, -0.5490875244140625, -0.5313949584960938, -0.513702392578125, -0.49600982666015625, -0.4783172607421875, -0.46062469482421875, -0.44293212890625, -0.42523956298828125, -0.4075469970703125, -0.38985443115234375, -0.372161865234375, -0.35446929931640625, -0.3367767333984375, -0.31908416748046875, -0.3013916015625, -0.28369903564453125, -0.2660064697265625, -0.24831390380859375, -0.230621337890625, -0.21292877197265625, -0.1952362060546875, -0.17754364013671875, -0.15985107421875, -0.14215850830078125, -0.1244659423828125, -0.10677337646484375, -0.089080810546875, -0.07138824462890625, -0.0536956787109375, -0.03600311279296875, -0.018310546875, -0.00061798095703125, 0.0170745849609375, 0.03476715087890625, 0.052459716796875, 0.07015228271484375, 0.0878448486328125, 0.10553741455078125, 0.12322998046875, 0.14092254638671875, 0.1586151123046875, 0.17630767822265625, 0.194000244140625, 0.21169281005859375, 0.2293853759765625, 0.24707794189453125, 0.2647705078125, 0.28246307373046875, 0.3001556396484375, 0.31784820556640625, 0.335540771484375, 0.35323333740234375, 0.3709259033203125, 0.38861846923828125, 0.40631103515625, 0.42400360107421875, 0.4416961669921875, 0.45938873291015625, 0.477081298828125, 0.49477386474609375, 0.5124664306640625, 0.5301589965820312, 0.5478515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 12.0, 9.0, 16.0, 14.0, 17.0, 24.0, 22.0, 44.0, 26.0, 36.0, 40.0, 44.0, 52.0, 39.0, 51.0, 55.0, 41.0, 46.0, 54.0, 49.0, 44.0, 33.0, 37.0, 29.0, 26.0, 28.0, 26.0, 14.0, 15.0, 8.0, 16.0, 5.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6513671875, -0.633209228515625, -0.61505126953125, -0.596893310546875, -0.5787353515625, -0.560577392578125, -0.54241943359375, -0.524261474609375, -0.506103515625, -0.487945556640625, -0.46978759765625, -0.451629638671875, -0.4334716796875, -0.415313720703125, -0.39715576171875, -0.378997802734375, -0.36083984375, -0.342681884765625, -0.32452392578125, -0.306365966796875, -0.2882080078125, -0.270050048828125, -0.25189208984375, -0.233734130859375, -0.215576171875, -0.197418212890625, -0.17926025390625, -0.161102294921875, -0.1429443359375, -0.124786376953125, -0.10662841796875, -0.088470458984375, -0.0703125, -0.052154541015625, -0.03399658203125, -0.015838623046875, 0.0023193359375, 0.020477294921875, 0.03863525390625, 0.056793212890625, 0.074951171875, 0.093109130859375, 0.11126708984375, 0.129425048828125, 0.1475830078125, 0.165740966796875, 0.18389892578125, 0.202056884765625, 0.22021484375, 0.238372802734375, 0.25653076171875, 0.274688720703125, 0.2928466796875, 0.311004638671875, 0.32916259765625, 0.347320556640625, 0.365478515625, 0.383636474609375, 0.40179443359375, 0.419952392578125, 0.4381103515625, 0.456268310546875, 0.47442626953125, 0.492584228515625, 0.5107421875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 12.0, 17.0, 29.0, 68.0, 139.0, 271.0, 615.0, 2707.0, 40349.0, 3943700.0, 199586.0, 5217.0, 920.0, 315.0, 157.0, 78.0, 27.0, 26.0, 15.0, 4.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.3656768798828125, -1.302642822265625, -1.2396087646484375, -1.17657470703125, -1.1135406494140625, -1.050506591796875, -0.9874725341796875, -0.9244384765625, -0.8614044189453125, -0.798370361328125, -0.7353363037109375, -0.67230224609375, -0.6092681884765625, -0.546234130859375, -0.4832000732421875, -0.420166015625, -0.3571319580078125, -0.294097900390625, -0.2310638427734375, -0.16802978515625, -0.1049957275390625, -0.041961669921875, 0.0210723876953125, 0.0841064453125, 0.1471405029296875, 0.210174560546875, 0.2732086181640625, 0.33624267578125, 0.3992767333984375, 0.462310791015625, 0.5253448486328125, 0.58837890625, 0.6514129638671875, 0.714447021484375, 0.7774810791015625, 0.84051513671875, 0.9035491943359375, 0.966583251953125, 1.0296173095703125, 1.0926513671875, 1.1556854248046875, 1.218719482421875, 1.2817535400390625, 1.34478759765625, 1.4078216552734375, 1.470855712890625, 1.5338897705078125, 1.596923828125, 1.6599578857421875, 1.722991943359375, 1.7860260009765625, 1.84906005859375, 1.9120941162109375, 1.975128173828125, 2.0381622314453125, 2.1011962890625, 2.1642303466796875, 2.227264404296875, 2.2902984619140625, 2.35333251953125, 2.4163665771484375, 2.479400634765625, 2.5424346923828125, 2.60546875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 12.0, 4.0, 11.0, 15.0, 23.0, 38.0, 45.0, 65.0, 116.0, 152.0, 268.0, 424.0, 522.0, 591.0, 534.0, 396.0, 278.0, 181.0, 129.0, 93.0, 52.0, 37.0, 22.0, 19.0, 11.0, 12.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.26291847229003906, -0.2550849914550781, -0.2472515106201172, -0.23941802978515625, -0.2315845489501953, -0.22375106811523438, -0.21591758728027344, -0.2080841064453125, -0.20025062561035156, -0.19241714477539062, -0.1845836639404297, -0.17675018310546875, -0.1689167022705078, -0.16108322143554688, -0.15324974060058594, -0.145416259765625, -0.13758277893066406, -0.12974929809570312, -0.12191581726074219, -0.11408233642578125, -0.10624885559082031, -0.09841537475585938, -0.09058189392089844, -0.0827484130859375, -0.07491493225097656, -0.06708145141601562, -0.05924797058105469, -0.05141448974609375, -0.04358100891113281, -0.035747528076171875, -0.027914047241210938, -0.02008056640625, -0.012247085571289062, -0.004413604736328125, 0.0034198760986328125, 0.01125335693359375, 0.019086837768554688, 0.026920318603515625, 0.03475379943847656, 0.0425872802734375, 0.05042076110839844, 0.058254241943359375, 0.06608772277832031, 0.07392120361328125, 0.08175468444824219, 0.08958816528320312, 0.09742164611816406, 0.105255126953125, 0.11308860778808594, 0.12092208862304688, 0.1287555694580078, 0.13658905029296875, 0.1444225311279297, 0.15225601196289062, 0.16008949279785156, 0.1679229736328125, 0.17575645446777344, 0.18358993530273438, 0.1914234161376953, 0.19925689697265625, 0.2070903778076172, 0.21492385864257812, 0.22275733947753906, 0.2305908203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 16.0, 30.0, 48.0, 68.0, 80.0, 132.0, 129.0, 157.0, 87.0, 86.0, 57.0, 52.0, 21.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0451819896697998, -1.0011907815933228, -0.9571995735168457, -0.9132083654403687, -0.8692171573638916, -0.8252259492874146, -0.7812348008155823, -0.7372435927391052, -0.6932523846626282, -0.6492611765861511, -0.6052699685096741, -0.5612788200378418, -0.5172876119613647, -0.4732963740825653, -0.42930519580841064, -0.3853139877319336, -0.34132277965545654, -0.2973315715789795, -0.25334036350250244, -0.20934918522834778, -0.16535797715187073, -0.12136676907539368, -0.07737559080123901, -0.03338438272476196, 0.010606825351715088, 0.05459802597761154, 0.098589226603508, 0.14258041977882385, 0.1865716278553009, 0.23056283593177795, 0.2745540142059326, 0.31854522228240967, 0.36253654956817627, 0.4065277576446533, 0.45051896572113037, 0.49451014399528503, 0.5385013818740845, 0.5824925899505615, 0.6264837384223938, 0.6704749464988708, 0.7144661545753479, 0.758457362651825, 0.802448570728302, 0.8464397192001343, 0.8904309272766113, 0.9344221353530884, 0.9784133434295654, 1.0224045515060425, 1.0663957595825195, 1.1103869676589966, 1.1543781757354736, 1.1983693838119507, 1.2423605918884277, 1.2863517999649048, 1.3303430080413818, 1.3743340969085693, 1.418325424194336, 1.462316632270813, 1.50630784034729, 1.550299048423767, 1.5942902565002441, 1.6382814645767212, 1.6822726726531982, 1.7262637615203857, 1.7702549695968628]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 7.0, 17.0, 8.0, 12.0, 15.0, 19.0, 22.0, 27.0, 21.0, 21.0, 31.0, 40.0, 33.0, 38.0, 39.0, 36.0, 37.0, 52.0, 41.0, 45.0, 35.0, 37.0, 52.0, 33.0, 23.0, 30.0, 36.0, 20.0, 16.0, 35.0, 12.0, 16.0, 12.0, 7.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5159679055213928, -0.49996817111968994, -0.48396843671798706, -0.46796873211860657, -0.4519689977169037, -0.4359692633152008, -0.4199695587158203, -0.40396982431411743, -0.38797008991241455, -0.37197035551071167, -0.3559706211090088, -0.3399709165096283, -0.3239711821079254, -0.30797144770622253, -0.29197174310684204, -0.27597200870513916, -0.2599722743034363, -0.2439725399017334, -0.2279728204011917, -0.21197310090065002, -0.19597336649894714, -0.17997363209724426, -0.16397391259670258, -0.1479741930961609, -0.131974458694458, -0.11597473174333572, -0.09997500479221344, -0.08397527784109116, -0.06797555088996887, -0.05197582393884659, -0.035976096987724304, -0.01997637003660202, -0.003976583480834961, 0.012023143470287323, 0.028022870421409607, 0.04402259737253189, 0.060022324323654175, 0.07602205127477646, 0.09202177822589874, 0.10802150517702103, 0.12402123212814331, 0.1400209665298462, 0.15602068603038788, 0.17202040553092957, 0.18802013993263245, 0.20401987433433533, 0.22001959383487701, 0.2360193133354187, 0.2520190477371216, 0.26801878213882446, 0.28401851654052734, 0.30001822113990784, 0.3160179555416107, 0.3320176899433136, 0.3480173945426941, 0.364017128944397, 0.38001686334609985, 0.39601659774780273, 0.4120163321495056, 0.4280160367488861, 0.444015771150589, 0.46001550555229187, 0.47601521015167236, 0.49201494455337524, 0.5080146789550781]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 9.0, 10.0, 7.0, 11.0, 10.0, 21.0, 39.0, 76.0, 182.0, 566.0, 1834.0, 7969.0, 43595.0, 529377.0, 419081.0, 36288.0, 6944.0, 1698.0, 507.0, 142.0, 79.0, 34.0, 20.0, 13.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.320556640625, -0.3101997375488281, -0.29984283447265625, -0.2894859313964844, -0.2791290283203125, -0.2687721252441406, -0.25841522216796875, -0.24805831909179688, -0.237701416015625, -0.22734451293945312, -0.21698760986328125, -0.20663070678710938, -0.1962738037109375, -0.18591690063476562, -0.17555999755859375, -0.16520309448242188, -0.15484619140625, -0.14448928833007812, -0.13413238525390625, -0.12377548217773438, -0.1134185791015625, -0.10306167602539062, -0.09270477294921875, -0.08234786987304688, -0.071990966796875, -0.061634063720703125, -0.05127716064453125, -0.040920257568359375, -0.0305633544921875, -0.020206451416015625, -0.00984954833984375, 0.000507354736328125, 0.0108642578125, 0.021221160888671875, 0.03157806396484375, 0.041934967041015625, 0.0522918701171875, 0.06264877319335938, 0.07300567626953125, 0.08336257934570312, 0.093719482421875, 0.10407638549804688, 0.11443328857421875, 0.12479019165039062, 0.1351470947265625, 0.14550399780273438, 0.15586090087890625, 0.16621780395507812, 0.17657470703125, 0.18693161010742188, 0.19728851318359375, 0.20764541625976562, 0.2180023193359375, 0.22835922241210938, 0.23871612548828125, 0.24907302856445312, 0.259429931640625, 0.2697868347167969, 0.28014373779296875, 0.2905006408691406, 0.3008575439453125, 0.3112144470214844, 0.32157135009765625, 0.3319282531738281, 0.34228515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 9.0, 4.0, 16.0, 16.0, 21.0, 15.0, 27.0, 22.0, 30.0, 30.0, 35.0, 43.0, 43.0, 40.0, 51.0, 34.0, 52.0, 50.0, 50.0, 42.0, 43.0, 37.0, 39.0, 36.0, 36.0, 27.0, 16.0, 17.0, 20.0, 12.0, 22.0, 7.0, 12.0, 9.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4013671875, -0.3894157409667969, -0.37746429443359375, -0.3655128479003906, -0.3535614013671875, -0.3416099548339844, -0.32965850830078125, -0.3177070617675781, -0.305755615234375, -0.2938041687011719, -0.28185272216796875, -0.2699012756347656, -0.2579498291015625, -0.24599838256835938, -0.23404693603515625, -0.22209548950195312, -0.21014404296875, -0.19819259643554688, -0.18624114990234375, -0.17428970336914062, -0.1623382568359375, -0.15038681030273438, -0.13843536376953125, -0.12648391723632812, -0.114532470703125, -0.10258102416992188, -0.09062957763671875, -0.07867813110351562, -0.0667266845703125, -0.054775238037109375, -0.04282379150390625, -0.030872344970703125, -0.0189208984375, -0.006969451904296875, 0.00498199462890625, 0.016933441162109375, 0.0288848876953125, 0.040836334228515625, 0.05278778076171875, 0.06473922729492188, 0.076690673828125, 0.08864212036132812, 0.10059356689453125, 0.11254501342773438, 0.1244964599609375, 0.13644790649414062, 0.14839935302734375, 0.16035079956054688, 0.17230224609375, 0.18425369262695312, 0.19620513916015625, 0.20815658569335938, 0.2201080322265625, 0.23205947875976562, 0.24401092529296875, 0.2559623718261719, 0.267913818359375, 0.2798652648925781, 0.29181671142578125, 0.3037681579589844, 0.3157196044921875, 0.3276710510253906, 0.33962249755859375, 0.3515739440917969, 0.363525390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 11.0, 23.0, 29.0, 40.0, 53.0, 88.0, 119.0, 211.0, 362.0, 769.0, 1511.0, 3481.0, 8365.0, 22948.0, 75238.0, 307181.0, 441503.0, 129968.0, 35254.0, 12231.0, 4956.0, 2027.0, 917.0, 481.0, 268.0, 162.0, 97.0, 66.0, 39.0, 34.0, 20.0, 17.0, 18.0, 6.0, 3.0, 8.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.149169921875, -0.14438819885253906, -0.13960647583007812, -0.1348247528076172, -0.13004302978515625, -0.1252613067626953, -0.12047958374023438, -0.11569786071777344, -0.1109161376953125, -0.10613441467285156, -0.10135269165039062, -0.09657096862792969, -0.09178924560546875, -0.08700752258300781, -0.08222579956054688, -0.07744407653808594, -0.072662353515625, -0.06788063049316406, -0.06309890747070312, -0.05831718444824219, -0.05353546142578125, -0.04875373840332031, -0.043972015380859375, -0.03919029235839844, -0.0344085693359375, -0.029626846313476562, -0.024845123291015625, -0.020063400268554688, -0.01528167724609375, -0.010499954223632812, -0.005718231201171875, -0.0009365081787109375, 0.00384521484375, 0.008626937866210938, 0.013408660888671875, 0.018190383911132812, 0.02297210693359375, 0.027753829956054688, 0.032535552978515625, 0.03731727600097656, 0.0420989990234375, 0.04688072204589844, 0.051662445068359375, 0.05644416809082031, 0.06122589111328125, 0.06600761413574219, 0.07078933715820312, 0.07557106018066406, 0.080352783203125, 0.08513450622558594, 0.08991622924804688, 0.09469795227050781, 0.09947967529296875, 0.10426139831542969, 0.10904312133789062, 0.11382484436035156, 0.1186065673828125, 0.12338829040527344, 0.12817001342773438, 0.1329517364501953, 0.13773345947265625, 0.1425151824951172, 0.14729690551757812, 0.15207862854003906, 0.1568603515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 8.0, 7.0, 7.0, 15.0, 11.0, 17.0, 9.0, 17.0, 21.0, 19.0, 32.0, 26.0, 34.0, 28.0, 40.0, 35.0, 33.0, 54.0, 38.0, 32.0, 50.0, 55.0, 37.0, 43.0, 35.0, 28.0, 34.0, 21.0, 31.0, 19.0, 21.0, 16.0, 22.0, 18.0, 17.0, 7.0, 12.0, 10.0, 8.0, 6.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.73974609375, -0.718994140625, -0.6982421875, -0.677490234375, -0.65673828125, -0.635986328125, -0.615234375, -0.594482421875, -0.57373046875, -0.552978515625, -0.5322265625, -0.511474609375, -0.49072265625, -0.469970703125, -0.44921875, -0.428466796875, -0.40771484375, -0.386962890625, -0.3662109375, -0.345458984375, -0.32470703125, -0.303955078125, -0.283203125, -0.262451171875, -0.24169921875, -0.220947265625, -0.2001953125, -0.179443359375, -0.15869140625, -0.137939453125, -0.1171875, -0.096435546875, -0.07568359375, -0.054931640625, -0.0341796875, -0.013427734375, 0.00732421875, 0.028076171875, 0.048828125, 0.069580078125, 0.09033203125, 0.111083984375, 0.1318359375, 0.152587890625, 0.17333984375, 0.194091796875, 0.21484375, 0.235595703125, 0.25634765625, 0.277099609375, 0.2978515625, 0.318603515625, 0.33935546875, 0.360107421875, 0.380859375, 0.401611328125, 0.42236328125, 0.443115234375, 0.4638671875, 0.484619140625, 0.50537109375, 0.526123046875, 0.546875, 0.567626953125, 0.58837890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 9.0, 8.0, 14.0, 15.0, 21.0, 44.0, 52.0, 96.0, 169.0, 282.0, 524.0, 1029.0, 2141.0, 5028.0, 13299.0, 45940.0, 238273.0, 549462.0, 143729.0, 30834.0, 9811.0, 4024.0, 1793.0, 861.0, 421.0, 270.0, 150.0, 82.0, 54.0, 27.0, 23.0, 9.0, 18.0, 9.0, 13.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.05965137481689453, -0.05774879455566406, -0.055846214294433594, -0.053943634033203125, -0.052041053771972656, -0.05013847351074219, -0.04823589324951172, -0.04633331298828125, -0.04443073272705078, -0.04252815246582031, -0.040625572204589844, -0.038722991943359375, -0.036820411682128906, -0.03491783142089844, -0.03301525115966797, -0.0311126708984375, -0.02921009063720703, -0.027307510375976562, -0.025404930114746094, -0.023502349853515625, -0.021599769592285156, -0.019697189331054688, -0.01779460906982422, -0.01589202880859375, -0.013989448547363281, -0.012086868286132812, -0.010184288024902344, -0.008281707763671875, -0.006379127502441406, -0.0044765472412109375, -0.0025739669799804688, -0.00067138671875, 0.0012311935424804688, 0.0031337738037109375, 0.005036354064941406, 0.006938934326171875, 0.008841514587402344, 0.010744094848632812, 0.012646675109863281, 0.01454925537109375, 0.01645183563232422, 0.018354415893554688, 0.020256996154785156, 0.022159576416015625, 0.024062156677246094, 0.025964736938476562, 0.02786731719970703, 0.0297698974609375, 0.03167247772216797, 0.03357505798339844, 0.035477638244628906, 0.037380218505859375, 0.039282798767089844, 0.04118537902832031, 0.04308795928955078, 0.04499053955078125, 0.04689311981201172, 0.04879570007324219, 0.050698280334472656, 0.052600860595703125, 0.054503440856933594, 0.05640602111816406, 0.05830860137939453, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 15.0, 11.0, 16.0, 24.0, 39.0, 41.0, 58.0, 64.0, 88.0, 100.0, 97.0, 95.0, 85.0, 68.0, 57.0, 28.0, 31.0, 20.0, 17.0, 14.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.199411392211914e-05, -2.1243467926979065e-05, -2.049282193183899e-05, -1.9742175936698914e-05, -1.8991529941558838e-05, -1.8240883946418762e-05, -1.7490237951278687e-05, -1.673959195613861e-05, -1.5988945960998535e-05, -1.523829996585846e-05, -1.4487653970718384e-05, -1.3737007975578308e-05, -1.2986361980438232e-05, -1.2235715985298157e-05, -1.1485069990158081e-05, -1.0734423995018005e-05, -9.98377799987793e-06, -9.233132004737854e-06, -8.482486009597778e-06, -7.731840014457703e-06, -6.981194019317627e-06, -6.230548024177551e-06, -5.479902029037476e-06, -4.7292560338974e-06, -3.978610038757324e-06, -3.2279640436172485e-06, -2.477318048477173e-06, -1.7266720533370972e-06, -9.760260581970215e-07, -2.253800630569458e-07, 5.252659320831299e-07, 1.2759119272232056e-06, 2.0265579223632812e-06, 2.777203917503357e-06, 3.5278499126434326e-06, 4.278495907783508e-06, 5.029141902923584e-06, 5.77978789806366e-06, 6.530433893203735e-06, 7.281079888343811e-06, 8.031725883483887e-06, 8.782371878623962e-06, 9.533017873764038e-06, 1.0283663868904114e-05, 1.103430986404419e-05, 1.1784955859184265e-05, 1.253560185432434e-05, 1.3286247849464417e-05, 1.4036893844604492e-05, 1.4787539839744568e-05, 1.5538185834884644e-05, 1.628883183002472e-05, 1.7039477825164795e-05, 1.779012382030487e-05, 1.8540769815444946e-05, 1.9291415810585022e-05, 2.0042061805725098e-05, 2.0792707800865173e-05, 2.154335379600525e-05, 2.2293999791145325e-05, 2.30446457862854e-05, 2.3795291781425476e-05, 2.4545937776565552e-05, 2.5296583771705627e-05, 2.6047229766845703e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 8.0, 15.0, 17.0, 20.0, 27.0, 56.0, 81.0, 138.0, 304.0, 788.0, 2078.0, 6620.0, 26345.0, 185276.0, 691526.0, 108995.0, 18507.0, 4943.0, 1525.0, 631.0, 280.0, 139.0, 64.0, 29.0, 27.0, 21.0, 16.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09519290924072266, -0.09242439270019531, -0.08965587615966797, -0.08688735961914062, -0.08411884307861328, -0.08135032653808594, -0.0785818099975586, -0.07581329345703125, -0.0730447769165039, -0.07027626037597656, -0.06750774383544922, -0.06473922729492188, -0.06197071075439453, -0.05920219421386719, -0.056433677673339844, -0.0536651611328125, -0.050896644592285156, -0.04812812805175781, -0.04535961151123047, -0.042591094970703125, -0.03982257843017578, -0.03705406188964844, -0.034285545349121094, -0.03151702880859375, -0.028748512268066406, -0.025979995727539062, -0.02321147918701172, -0.020442962646484375, -0.01767444610595703, -0.014905929565429688, -0.012137413024902344, -0.009368896484375, -0.006600379943847656, -0.0038318634033203125, -0.0010633468627929688, 0.001705169677734375, 0.004473686218261719, 0.0072422027587890625, 0.010010719299316406, 0.01277923583984375, 0.015547752380371094, 0.018316268920898438, 0.02108478546142578, 0.023853302001953125, 0.02662181854248047, 0.029390335083007812, 0.032158851623535156, 0.0349273681640625, 0.037695884704589844, 0.04046440124511719, 0.04323291778564453, 0.046001434326171875, 0.04876995086669922, 0.05153846740722656, 0.054306983947753906, 0.05707550048828125, 0.059844017028808594, 0.06261253356933594, 0.06538105010986328, 0.06814956665039062, 0.07091808319091797, 0.07368659973144531, 0.07645511627197266, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 7.0, 8.0, 7.0, 8.0, 21.0, 30.0, 32.0, 45.0, 59.0, 73.0, 94.0, 111.0, 108.0, 89.0, 83.0, 56.0, 40.0, 27.0, 25.0, 17.0, 12.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519775390625, -0.014630556106567383, -0.014063358306884766, -0.013496160507202148, -0.012928962707519531, -0.012361764907836914, -0.011794567108154297, -0.01122736930847168, -0.010660171508789062, -0.010092973709106445, -0.009525775909423828, -0.008958578109741211, -0.008391380310058594, -0.007824182510375977, -0.007256984710693359, -0.006689786911010742, -0.006122589111328125, -0.005555391311645508, -0.004988193511962891, -0.0044209957122802734, -0.0038537979125976562, -0.003286600112915039, -0.002719402313232422, -0.0021522045135498047, -0.0015850067138671875, -0.0010178089141845703, -0.0004506111145019531, 0.00011658668518066406, 0.0006837844848632812, 0.0012509822845458984, 0.0018181800842285156, 0.002385377883911133, 0.00295257568359375, 0.003519773483276367, 0.004086971282958984, 0.0046541690826416016, 0.005221366882324219, 0.005788564682006836, 0.006355762481689453, 0.00692296028137207, 0.0074901580810546875, 0.008057355880737305, 0.008624553680419922, 0.009191751480102539, 0.009758949279785156, 0.010326147079467773, 0.01089334487915039, 0.011460542678833008, 0.012027740478515625, 0.012594938278198242, 0.01316213607788086, 0.013729333877563477, 0.014296531677246094, 0.014863729476928711, 0.015430927276611328, 0.015998125076293945, 0.016565322875976562, 0.01713252067565918, 0.017699718475341797, 0.018266916275024414, 0.01883411407470703, 0.01940131187438965, 0.019968509674072266, 0.020535707473754883, 0.0211029052734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 37.0, 76.0, 111.0, 177.0, 215.0, 166.0, 88.0, 61.0, 25.0, 16.0, 8.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1612666845321655, -1.1230378150939941, -1.0848090648651123, -1.046580195426941, -1.0083513259887695, -0.9701225757598877, -0.9318937063217163, -0.8936648964881897, -0.8554360866546631, -0.8172072768211365, -0.7789784669876099, -0.7407495975494385, -0.7025207877159119, -0.6642919778823853, -0.6260631084442139, -0.5878342986106873, -0.5496054887771606, -0.511376678943634, -0.47314783930778503, -0.43491899967193604, -0.3966901898384094, -0.3584613800048828, -0.3202325403690338, -0.2820037007331848, -0.2437748908996582, -0.2055460661649704, -0.1673172414302826, -0.1290884166955948, -0.09085959196090698, -0.05263076722621918, -0.014401942491531372, 0.023826897144317627, 0.06205570697784424, 0.10028453171253204, 0.13851335644721985, 0.17674218118190765, 0.21497100591659546, 0.25319981575012207, 0.29142865538597107, 0.32965749502182007, 0.3678863048553467, 0.4061151146888733, 0.4443439543247223, 0.4825727939605713, 0.5208016037940979, 0.5590304136276245, 0.5972592830657959, 0.6354880928993225, 0.6737169027328491, 0.7119457125663757, 0.7501745223999023, 0.7884033918380737, 0.8266322016716003, 0.864861011505127, 0.9030898809432983, 0.941318690776825, 0.9795475006103516, 1.017776370048523, 1.0560051202774048, 1.0942339897155762, 1.132462739944458, 1.1706916093826294, 1.2089204788208008, 1.2471492290496826, 1.285378098487854]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 10.0, 11.0, 16.0, 15.0, 18.0, 16.0, 22.0, 22.0, 31.0, 30.0, 24.0, 44.0, 37.0, 36.0, 45.0, 47.0, 46.0, 47.0, 39.0, 36.0, 44.0, 48.0, 41.0, 18.0, 40.0, 25.0, 24.0, 26.0, 17.0, 16.0, 16.0, 11.0, 11.0, 13.0, 9.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.3482048809528351, -0.3377043604850769, -0.3272038400173187, -0.31670331954956055, -0.30620282888412476, -0.2957023084163666, -0.2852017879486084, -0.2747012674808502, -0.26420074701309204, -0.25370022654533386, -0.24319970607757568, -0.2326992005109787, -0.22219868004322052, -0.21169815957546234, -0.20119765400886536, -0.19069713354110718, -0.180196613073349, -0.16969609260559082, -0.15919557213783264, -0.14869506657123566, -0.13819454610347748, -0.1276940256357193, -0.11719351261854172, -0.10669299960136414, -0.09619247913360596, -0.08569195866584778, -0.0751914456486702, -0.06469093263149261, -0.054190412163734436, -0.043689895421266556, -0.033189378678798676, -0.022688865661621094, -0.012188374996185303, -0.0016878582537174225, 0.008812658488750458, 0.019313175231218338, 0.029813691973686218, 0.0403142087161541, 0.05081472545862198, 0.06131523847579956, 0.07181575894355774, 0.08231627941131592, 0.0928167924284935, 0.10331730544567108, 0.11381782591342926, 0.12431834638118744, 0.13481885194778442, 0.1453193724155426, 0.15581989288330078, 0.16632041335105896, 0.17682093381881714, 0.18732143938541412, 0.1978219598531723, 0.20832248032093048, 0.21882298588752747, 0.22932350635528564, 0.23982402682304382, 0.250324547290802, 0.2608250677585602, 0.27132558822631836, 0.28182607889175415, 0.29232659935951233, 0.3028271198272705, 0.3133276402950287, 0.32382816076278687]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 5.0, 5.0, 12.0, 19.0, 26.0, 58.0, 115.0, 646.0, 23300.0, 1011200.0, 12386.0, 535.0, 110.0, 43.0, 30.0, 11.0, 11.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.267913818359375, -2.18817138671875, -2.108428955078125, -2.0286865234375, -1.948944091796875, -1.86920166015625, -1.789459228515625, -1.709716796875, -1.629974365234375, -1.55023193359375, -1.470489501953125, -1.3907470703125, -1.311004638671875, -1.23126220703125, -1.151519775390625, -1.07177734375, -0.992034912109375, -0.91229248046875, -0.832550048828125, -0.7528076171875, -0.673065185546875, -0.59332275390625, -0.513580322265625, -0.433837890625, -0.354095458984375, -0.27435302734375, -0.194610595703125, -0.1148681640625, -0.035125732421875, 0.04461669921875, 0.124359130859375, 0.2041015625, 0.283843994140625, 0.36358642578125, 0.443328857421875, 0.5230712890625, 0.602813720703125, 0.68255615234375, 0.762298583984375, 0.842041015625, 0.921783447265625, 1.00152587890625, 1.081268310546875, 1.1610107421875, 1.240753173828125, 1.32049560546875, 1.400238037109375, 1.47998046875, 1.559722900390625, 1.63946533203125, 1.719207763671875, 1.7989501953125, 1.878692626953125, 1.95843505859375, 2.038177490234375, 2.117919921875, 2.197662353515625, 2.27740478515625, 2.357147216796875, 2.4368896484375, 2.516632080078125, 2.59637451171875, 2.676116943359375, 2.755859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 7.0, 15.0, 17.0, 30.0, 30.0, 50.0, 47.0, 62.0, 61.0, 81.0, 67.0, 86.0, 86.0, 71.0, 54.0, 53.0, 43.0, 32.0, 25.0, 15.0, 15.0, 16.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.583984375, -1.5479888916015625, -1.511993408203125, -1.4759979248046875, -1.44000244140625, -1.4040069580078125, -1.368011474609375, -1.3320159912109375, -1.2960205078125, -1.2600250244140625, -1.224029541015625, -1.1880340576171875, -1.15203857421875, -1.1160430908203125, -1.080047607421875, -1.0440521240234375, -1.008056640625, -0.9720611572265625, -0.936065673828125, -0.9000701904296875, -0.86407470703125, -0.8280792236328125, -0.792083740234375, -0.7560882568359375, -0.7200927734375, -0.6840972900390625, -0.648101806640625, -0.6121063232421875, -0.57611083984375, -0.5401153564453125, -0.504119873046875, -0.4681243896484375, -0.43212890625, -0.3961334228515625, -0.360137939453125, -0.3241424560546875, -0.28814697265625, -0.2521514892578125, -0.216156005859375, -0.1801605224609375, -0.1441650390625, -0.1081695556640625, -0.072174072265625, -0.0361785888671875, -0.00018310546875, 0.0358123779296875, 0.071807861328125, 0.1078033447265625, 0.143798828125, 0.1797943115234375, 0.215789794921875, 0.2517852783203125, 0.28778076171875, 0.3237762451171875, 0.359771728515625, 0.3957672119140625, 0.4317626953125, 0.4677581787109375, 0.503753662109375, 0.5397491455078125, 0.57574462890625, 0.6117401123046875, 0.647735595703125, 0.6837310791015625, 0.7197265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 15.0, 17.0, 29.0, 33.0, 63.0, 73.0, 149.0, 201.0, 398.0, 953.0, 5971.0, 158974.0, 847629.0, 30258.0, 2413.0, 565.0, 280.0, 175.0, 113.0, 60.0, 54.0, 33.0, 33.0, 13.0, 15.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.0954132080078125, -1.058013916015625, -1.0206146240234375, -0.98321533203125, -0.9458160400390625, -0.908416748046875, -0.8710174560546875, -0.8336181640625, -0.7962188720703125, -0.758819580078125, -0.7214202880859375, -0.68402099609375, -0.6466217041015625, -0.609222412109375, -0.5718231201171875, -0.534423828125, -0.4970245361328125, -0.459625244140625, -0.4222259521484375, -0.38482666015625, -0.3474273681640625, -0.310028076171875, -0.2726287841796875, -0.2352294921875, -0.1978302001953125, -0.160430908203125, -0.1230316162109375, -0.08563232421875, -0.0482330322265625, -0.010833740234375, 0.0265655517578125, 0.06396484375, 0.1013641357421875, 0.138763427734375, 0.1761627197265625, 0.21356201171875, 0.2509613037109375, 0.288360595703125, 0.3257598876953125, 0.3631591796875, 0.4005584716796875, 0.437957763671875, 0.4753570556640625, 0.51275634765625, 0.5501556396484375, 0.587554931640625, 0.6249542236328125, 0.662353515625, 0.6997528076171875, 0.737152099609375, 0.7745513916015625, 0.81195068359375, 0.8493499755859375, 0.886749267578125, 0.9241485595703125, 0.9615478515625, 0.9989471435546875, 1.036346435546875, 1.0737457275390625, 1.11114501953125, 1.1485443115234375, 1.185943603515625, 1.2233428955078125, 1.2607421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 6.0, 8.0, 8.0, 8.0, 12.0, 15.0, 20.0, 31.0, 14.0, 20.0, 33.0, 39.0, 30.0, 39.0, 34.0, 48.0, 33.0, 48.0, 45.0, 59.0, 39.0, 44.0, 37.0, 45.0, 27.0, 28.0, 36.0, 29.0, 29.0, 19.0, 13.0, 18.0, 12.0, 13.0, 10.0, 6.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.6344833374023438, -0.6112518310546875, -0.5880203247070312, -0.564788818359375, -0.5415573120117188, -0.5183258056640625, -0.49509429931640625, -0.47186279296875, -0.44863128662109375, -0.4253997802734375, -0.40216827392578125, -0.378936767578125, -0.35570526123046875, -0.3324737548828125, -0.30924224853515625, -0.2860107421875, -0.26277923583984375, -0.2395477294921875, -0.21631622314453125, -0.193084716796875, -0.16985321044921875, -0.1466217041015625, -0.12339019775390625, -0.10015869140625, -0.07692718505859375, -0.0536956787109375, -0.03046417236328125, -0.007232666015625, 0.01599884033203125, 0.0392303466796875, 0.06246185302734375, 0.085693359375, 0.10892486572265625, 0.1321563720703125, 0.15538787841796875, 0.178619384765625, 0.20185089111328125, 0.2250823974609375, 0.24831390380859375, 0.27154541015625, 0.29477691650390625, 0.3180084228515625, 0.34123992919921875, 0.364471435546875, 0.38770294189453125, 0.4109344482421875, 0.43416595458984375, 0.4573974609375, 0.48062896728515625, 0.5038604736328125, 0.5270919799804688, 0.550323486328125, 0.5735549926757812, 0.5967864990234375, 0.6200180053710938, 0.64324951171875, 0.6664810180664062, 0.6897125244140625, 0.7129440307617188, 0.736175537109375, 0.7594070434570312, 0.7826385498046875, 0.8058700561523438, 0.8291015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 22.0, 49.0, 66.0, 140.0, 342.0, 1168.0, 6458.0, 102913.0, 868121.0, 62837.0, 4871.0, 995.0, 302.0, 111.0, 58.0, 27.0, 17.0, 10.0, 8.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.350341796875, -0.33882904052734375, -0.3273162841796875, -0.31580352783203125, -0.304290771484375, -0.29277801513671875, -0.2812652587890625, -0.26975250244140625, -0.25823974609375, -0.24672698974609375, -0.2352142333984375, -0.22370147705078125, -0.212188720703125, -0.20067596435546875, -0.1891632080078125, -0.17765045166015625, -0.1661376953125, -0.15462493896484375, -0.1431121826171875, -0.13159942626953125, -0.120086669921875, -0.10857391357421875, -0.0970611572265625, -0.08554840087890625, -0.07403564453125, -0.06252288818359375, -0.0510101318359375, -0.03949737548828125, -0.027984619140625, -0.01647186279296875, -0.0049591064453125, 0.00655364990234375, 0.01806640625, 0.02957916259765625, 0.0410919189453125, 0.05260467529296875, 0.064117431640625, 0.07563018798828125, 0.0871429443359375, 0.09865570068359375, 0.11016845703125, 0.12168121337890625, 0.1331939697265625, 0.14470672607421875, 0.156219482421875, 0.16773223876953125, 0.1792449951171875, 0.19075775146484375, 0.2022705078125, 0.21378326416015625, 0.2252960205078125, 0.23680877685546875, 0.248321533203125, 0.25983428955078125, 0.2713470458984375, 0.28285980224609375, 0.29437255859375, 0.30588531494140625, 0.3173980712890625, 0.32891082763671875, 0.340423583984375, 0.35193634033203125, 0.3634490966796875, 0.37496185302734375, 0.386474609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 23.0, 20.0, 47.0, 49.0, 58.0, 62.0, 102.0, 93.0, 86.0, 94.0, 77.0, 62.0, 36.0, 36.0, 25.0, 21.0, 19.0, 9.0, 16.0, 3.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8014183044433594e-05, -2.721603959798813e-05, -2.6417896151542664e-05, -2.56197527050972e-05, -2.4821609258651733e-05, -2.402346581220627e-05, -2.3225322365760803e-05, -2.2427178919315338e-05, -2.1629035472869873e-05, -2.0830892026424408e-05, -2.0032748579978943e-05, -1.9234605133533478e-05, -1.8436461687088013e-05, -1.7638318240642548e-05, -1.6840174794197083e-05, -1.6042031347751617e-05, -1.5243887901306152e-05, -1.4445744454860687e-05, -1.3647601008415222e-05, -1.2849457561969757e-05, -1.2051314115524292e-05, -1.1253170669078827e-05, -1.0455027222633362e-05, -9.656883776187897e-06, -8.858740329742432e-06, -8.060596883296967e-06, -7.2624534368515015e-06, -6.464309990406036e-06, -5.666166543960571e-06, -4.868023097515106e-06, -4.069879651069641e-06, -3.271736204624176e-06, -2.473592758178711e-06, -1.6754493117332458e-06, -8.773058652877808e-07, -7.916241884231567e-08, 7.189810276031494e-07, 1.5171244740486145e-06, 2.3152679204940796e-06, 3.1134113669395447e-06, 3.91155481338501e-06, 4.709698259830475e-06, 5.50784170627594e-06, 6.305985152721405e-06, 7.10412859916687e-06, 7.902272045612335e-06, 8.7004154920578e-06, 9.498558938503265e-06, 1.029670238494873e-05, 1.1094845831394196e-05, 1.189298927783966e-05, 1.2691132724285126e-05, 1.348927617073059e-05, 1.4287419617176056e-05, 1.5085563063621521e-05, 1.5883706510066986e-05, 1.668184995651245e-05, 1.7479993402957916e-05, 1.827813684940338e-05, 1.9076280295848846e-05, 1.987442374229431e-05, 2.0672567188739777e-05, 2.1470710635185242e-05, 2.2268854081630707e-05, 2.3066997528076172e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 16.0, 21.0, 53.0, 73.0, 145.0, 378.0, 1572.0, 13677.0, 599576.0, 421089.0, 10002.0, 1263.0, 362.0, 130.0, 84.0, 37.0, 18.0, 21.0, 13.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4405975341796875, -0.426361083984375, -0.4121246337890625, -0.39788818359375, -0.3836517333984375, -0.369415283203125, -0.3551788330078125, -0.3409423828125, -0.3267059326171875, -0.312469482421875, -0.2982330322265625, -0.28399658203125, -0.2697601318359375, -0.255523681640625, -0.2412872314453125, -0.22705078125, -0.2128143310546875, -0.198577880859375, -0.1843414306640625, -0.17010498046875, -0.1558685302734375, -0.141632080078125, -0.1273956298828125, -0.1131591796875, -0.0989227294921875, -0.084686279296875, -0.0704498291015625, -0.05621337890625, -0.0419769287109375, -0.027740478515625, -0.0135040283203125, 0.000732421875, 0.0149688720703125, 0.029205322265625, 0.0434417724609375, 0.05767822265625, 0.0719146728515625, 0.086151123046875, 0.1003875732421875, 0.1146240234375, 0.1288604736328125, 0.143096923828125, 0.1573333740234375, 0.17156982421875, 0.1858062744140625, 0.200042724609375, 0.2142791748046875, 0.228515625, 0.2427520751953125, 0.256988525390625, 0.2712249755859375, 0.28546142578125, 0.2996978759765625, 0.313934326171875, 0.3281707763671875, 0.3424072265625, 0.3566436767578125, 0.370880126953125, 0.3851165771484375, 0.39935302734375, 0.4135894775390625, 0.427825927734375, 0.4420623779296875, 0.456298828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 15.0, 16.0, 26.0, 37.0, 80.0, 111.0, 150.0, 135.0, 137.0, 109.0, 57.0, 35.0, 26.0, 13.0, 9.0, 12.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.13201522827148438, -0.12779998779296875, -0.12358474731445312, -0.1193695068359375, -0.11515426635742188, -0.11093902587890625, -0.10672378540039062, -0.102508544921875, -0.09829330444335938, -0.09407806396484375, -0.08986282348632812, -0.0856475830078125, -0.08143234252929688, -0.07721710205078125, -0.07300186157226562, -0.06878662109375, -0.06457138061523438, -0.06035614013671875, -0.056140899658203125, -0.0519256591796875, -0.047710418701171875, -0.04349517822265625, -0.039279937744140625, -0.035064697265625, -0.030849456787109375, -0.02663421630859375, -0.022418975830078125, -0.0182037353515625, -0.013988494873046875, -0.00977325439453125, -0.005558013916015625, -0.0013427734375, 0.002872467041015625, 0.00708770751953125, 0.011302947998046875, 0.0155181884765625, 0.019733428955078125, 0.02394866943359375, 0.028163909912109375, 0.032379150390625, 0.036594390869140625, 0.04080963134765625, 0.045024871826171875, 0.0492401123046875, 0.053455352783203125, 0.05767059326171875, 0.061885833740234375, 0.06610107421875, 0.07031631469726562, 0.07453155517578125, 0.07874679565429688, 0.0829620361328125, 0.08717727661132812, 0.09139251708984375, 0.09560775756835938, 0.099822998046875, 0.10403823852539062, 0.10825347900390625, 0.11246871948242188, 0.1166839599609375, 0.12089920043945312, 0.12511444091796875, 0.12932968139648438, 0.133544921875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 11.0, 17.0, 59.0, 162.0, 261.0, 250.0, 145.0, 70.0, 18.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296754240989685, -1.188986897468567, -1.0812195539474487, -0.9734522104263306, -0.8656848669052124, -0.757917582988739, -0.6501502394676208, -0.5423828959465027, -0.4346155524253845, -0.32684820890426636, -0.2190808802843094, -0.11131355166435242, -0.003546208143234253, 0.10422110557556152, 0.2119884490966797, 0.31975579261779785, 0.427523136138916, 0.5352904796600342, 0.6430578231811523, 0.7508251667022705, 0.8585925102233887, 0.9663597941398621, 1.074127197265625, 1.1818945407867432, 1.2896618843078613, 1.3974292278289795, 1.5051965713500977, 1.6129639148712158, 1.720731258392334, 1.8284986019134521, 1.9362659454345703, 2.0440332889556885, 2.1518003940582275, 2.2595677375793457, 2.367335081100464, 2.475102424621582, 2.5828697681427, 2.6906371116638184, 2.7984044551849365, 2.9061717987060547, 3.013939142227173, 3.121706485748291, 3.229473829269409, 3.3372411727905273, 3.4450085163116455, 3.5527758598327637, 3.660543203353882, 3.768310546875, 3.876077651977539, 3.9838449954986572, 4.091612339019775, 4.1993794441223145, 4.307147026062012, 4.414914131164551, 4.522681713104248, 4.630448818206787, 4.738216400146484, 4.845983505249023, 4.953751087188721, 5.06151819229126, 5.169285774230957, 5.277052879333496, 5.384820461273193, 5.492587566375732, 5.60035514831543]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 8.0, 8.0, 9.0, 14.0, 18.0, 10.0, 16.0, 17.0, 26.0, 20.0, 33.0, 20.0, 22.0, 35.0, 32.0, 35.0, 29.0, 38.0, 37.0, 42.0, 25.0, 37.0, 31.0, 38.0, 28.0, 33.0, 27.0, 30.0, 28.0, 29.0, 28.0, 22.0, 19.0, 16.0, 23.0, 8.0, 16.0, 13.0, 16.0, 8.0, 8.0, 7.0, 5.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.0631518363952637, -1.030463457107544, -0.997775137424469, -0.965086817741394, -0.9323984980583191, -0.8997101783752441, -0.8670217990875244, -0.8343334794044495, -0.8016451597213745, -0.7689568400382996, -0.7362684607505798, -0.7035801410675049, -0.6708918213844299, -0.638203501701355, -0.6055151224136353, -0.5728268027305603, -0.5401384234428406, -0.5074501037597656, -0.4747617542743683, -0.44207340478897095, -0.409385085105896, -0.37669673562049866, -0.3440083861351013, -0.31132006645202637, -0.27863171696662903, -0.24594338238239288, -0.21325504779815674, -0.1805666983127594, -0.14787836372852325, -0.11519002914428711, -0.08250167965888977, -0.049813345074653625, -0.01712501049041748, 0.015563327819108963, 0.048251666128635406, 0.08094000816345215, 0.1136283427476883, 0.14631667733192444, 0.17900502681732178, 0.21169336140155792, 0.24438169598579407, 0.2770700454711914, 0.30975836515426636, 0.3424467146396637, 0.37513506412506104, 0.407823383808136, 0.4405117332935333, 0.47320008277893066, 0.5058884024620056, 0.5385767221450806, 0.5712651014328003, 0.6039534211158752, 0.6366417407989502, 0.6693301200866699, 0.7020184397697449, 0.7347067594528198, 0.7673951387405396, 0.8000834584236145, 0.8327718377113342, 0.8654601573944092, 0.8981484770774841, 0.9308367967605591, 0.9635251760482788, 0.9962134957313538, 1.0289018154144287]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 23.0, 27.0, 40.0, 50.0, 101.0, 170.0, 342.0, 731.0, 1840.0, 5588.0, 24023.0, 164897.0, 1318892.0, 2248435.0, 370262.0, 44723.0, 9080.0, 2751.0, 1136.0, 530.0, 234.0, 137.0, 90.0, 54.0, 25.0, 27.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.84130859375, -0.8159637451171875, -0.790618896484375, -0.7652740478515625, -0.73992919921875, -0.7145843505859375, -0.689239501953125, -0.6638946533203125, -0.6385498046875, -0.6132049560546875, -0.587860107421875, -0.5625152587890625, -0.53717041015625, -0.5118255615234375, -0.486480712890625, -0.4611358642578125, -0.435791015625, -0.4104461669921875, -0.385101318359375, -0.3597564697265625, -0.33441162109375, -0.3090667724609375, -0.283721923828125, -0.2583770751953125, -0.2330322265625, -0.2076873779296875, -0.182342529296875, -0.1569976806640625, -0.13165283203125, -0.1063079833984375, -0.080963134765625, -0.0556182861328125, -0.0302734375, -0.0049285888671875, 0.020416259765625, 0.0457611083984375, 0.07110595703125, 0.0964508056640625, 0.121795654296875, 0.1471405029296875, 0.1724853515625, 0.1978302001953125, 0.223175048828125, 0.2485198974609375, 0.27386474609375, 0.2992095947265625, 0.324554443359375, 0.3498992919921875, 0.375244140625, 0.4005889892578125, 0.425933837890625, 0.4512786865234375, 0.47662353515625, 0.5019683837890625, 0.527313232421875, 0.5526580810546875, 0.5780029296875, 0.6033477783203125, 0.628692626953125, 0.6540374755859375, 0.67938232421875, 0.7047271728515625, 0.730072021484375, 0.7554168701171875, 0.78076171875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 8.0, 15.0, 8.0, 13.0, 20.0, 28.0, 27.0, 26.0, 29.0, 43.0, 42.0, 36.0, 41.0, 35.0, 48.0, 43.0, 56.0, 51.0, 44.0, 36.0, 37.0, 31.0, 36.0, 24.0, 33.0, 23.0, 26.0, 19.0, 19.0, 19.0, 12.0, 12.0, 15.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.54052734375, -0.5247230529785156, -0.5089187622070312, -0.4931144714355469, -0.4773101806640625, -0.4615058898925781, -0.44570159912109375, -0.4298973083496094, -0.414093017578125, -0.3982887268066406, -0.38248443603515625, -0.3666801452636719, -0.3508758544921875, -0.3350715637207031, -0.31926727294921875, -0.3034629821777344, -0.28765869140625, -0.2718544006347656, -0.25605010986328125, -0.24024581909179688, -0.2244415283203125, -0.20863723754882812, -0.19283294677734375, -0.17702865600585938, -0.161224365234375, -0.14542007446289062, -0.12961578369140625, -0.11381149291992188, -0.0980072021484375, -0.08220291137695312, -0.06639862060546875, -0.050594329833984375, -0.0347900390625, -0.018985748291015625, -0.00318145751953125, 0.012622833251953125, 0.0284271240234375, 0.044231414794921875, 0.06003570556640625, 0.07583999633789062, 0.091644287109375, 0.10744857788085938, 0.12325286865234375, 0.13905715942382812, 0.1548614501953125, 0.17066574096679688, 0.18647003173828125, 0.20227432250976562, 0.21807861328125, 0.23388290405273438, 0.24968719482421875, 0.2654914855957031, 0.2812957763671875, 0.2971000671386719, 0.31290435791015625, 0.3287086486816406, 0.344512939453125, 0.3603172302246094, 0.37612152099609375, 0.3919258117675781, 0.4077301025390625, 0.4235343933105469, 0.43933868408203125, 0.4551429748535156, 0.470947265625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 9.0, 13.0, 17.0, 37.0, 61.0, 92.0, 178.0, 406.0, 1034.0, 3843.0, 29642.0, 1999498.0, 2123261.0, 30626.0, 3761.0, 1019.0, 378.0, 189.0, 74.0, 57.0, 27.0, 20.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.677734375, -1.6335906982421875, -1.589447021484375, -1.5453033447265625, -1.50115966796875, -1.4570159912109375, -1.412872314453125, -1.3687286376953125, -1.3245849609375, -1.2804412841796875, -1.236297607421875, -1.1921539306640625, -1.14801025390625, -1.1038665771484375, -1.059722900390625, -1.0155792236328125, -0.971435546875, -0.9272918701171875, -0.883148193359375, -0.8390045166015625, -0.79486083984375, -0.7507171630859375, -0.706573486328125, -0.6624298095703125, -0.6182861328125, -0.5741424560546875, -0.529998779296875, -0.4858551025390625, -0.44171142578125, -0.3975677490234375, -0.353424072265625, -0.3092803955078125, -0.26513671875, -0.2209930419921875, -0.176849365234375, -0.1327056884765625, -0.08856201171875, -0.0444183349609375, -0.000274658203125, 0.0438690185546875, 0.0880126953125, 0.1321563720703125, 0.176300048828125, 0.2204437255859375, 0.26458740234375, 0.3087310791015625, 0.352874755859375, 0.3970184326171875, 0.441162109375, 0.4853057861328125, 0.529449462890625, 0.5735931396484375, 0.61773681640625, 0.6618804931640625, 0.706024169921875, 0.7501678466796875, 0.7943115234375, 0.8384552001953125, 0.882598876953125, 0.9267425537109375, 0.97088623046875, 1.0150299072265625, 1.059173583984375, 1.1033172607421875, 1.1474609375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 10.0, 8.0, 16.0, 28.0, 38.0, 50.0, 98.0, 180.0, 373.0, 647.0, 868.0, 744.0, 441.0, 257.0, 130.0, 82.0, 34.0, 31.0, 13.0, 17.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24622344970703125, -0.2348785400390625, -0.22353363037109375, -0.212188720703125, -0.20084381103515625, -0.1894989013671875, -0.17815399169921875, -0.16680908203125, -0.15546417236328125, -0.1441192626953125, -0.13277435302734375, -0.121429443359375, -0.11008453369140625, -0.0987396240234375, -0.08739471435546875, -0.0760498046875, -0.06470489501953125, -0.0533599853515625, -0.04201507568359375, -0.030670166015625, -0.01932525634765625, -0.0079803466796875, 0.00336456298828125, 0.01470947265625, 0.02605438232421875, 0.0373992919921875, 0.04874420166015625, 0.060089111328125, 0.07143402099609375, 0.0827789306640625, 0.09412384033203125, 0.10546875, 0.11681365966796875, 0.1281585693359375, 0.13950347900390625, 0.150848388671875, 0.16219329833984375, 0.1735382080078125, 0.18488311767578125, 0.19622802734375, 0.20757293701171875, 0.2189178466796875, 0.23026275634765625, 0.241607666015625, 0.25295257568359375, 0.2642974853515625, 0.27564239501953125, 0.2869873046875, 0.29833221435546875, 0.3096771240234375, 0.32102203369140625, 0.332366943359375, 0.34371185302734375, 0.3550567626953125, 0.36640167236328125, 0.37774658203125, 0.38909149169921875, 0.4004364013671875, 0.41178131103515625, 0.423126220703125, 0.43447113037109375, 0.4458160400390625, 0.45716094970703125, 0.468505859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 6.0, 9.0, 10.0, 22.0, 45.0, 58.0, 79.0, 113.0, 157.0, 121.0, 124.0, 86.0, 65.0, 52.0, 24.0, 12.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.157740831375122, -1.1151161193847656, -1.0724912881851196, -1.0298665761947632, -0.987241804599762, -0.9446170330047607, -0.9019922614097595, -0.8593674898147583, -0.8167427778244019, -0.7741180062294006, -0.7314932346343994, -0.688868522644043, -0.6462437510490417, -0.6036189794540405, -0.5609942078590393, -0.5183694362640381, -0.47574466466903687, -0.43311989307403564, -0.3904951512813568, -0.3478703796863556, -0.30524563789367676, -0.26262086629867554, -0.21999609470367432, -0.17737135291099548, -0.13474658131599426, -0.09212182462215424, -0.04949706047773361, -0.006872296333312988, 0.03575246036052704, 0.07837721705436707, 0.12100198864936829, 0.16362673044204712, 0.20625150203704834, 0.24887625873088837, 0.2915010154247284, 0.3341257870197296, 0.37675052881240845, 0.41937530040740967, 0.4620000720024109, 0.5046248435974121, 0.5472495555877686, 0.5898743271827698, 0.632499098777771, 0.6751238107681274, 0.7177485823631287, 0.7603733539581299, 0.8029981255531311, 0.8456228971481323, 0.8882476687431335, 0.9308724403381348, 0.973497211933136, 1.0161219835281372, 1.0587466955184937, 1.1013715267181396, 1.143996238708496, 1.1866209506988525, 1.2292457818984985, 1.271870493888855, 1.314495325088501, 1.3571200370788574, 1.3997448682785034, 1.4423695802688599, 1.4849944114685059, 1.5276191234588623, 1.5702438354492188]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 18.0, 16.0, 14.0, 15.0, 11.0, 29.0, 25.0, 34.0, 27.0, 25.0, 44.0, 37.0, 49.0, 36.0, 51.0, 37.0, 45.0, 35.0, 36.0, 36.0, 24.0, 39.0, 35.0, 32.0, 32.0, 26.0, 19.0, 14.0, 19.0, 9.0, 16.0, 18.0, 14.0, 10.0, 7.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5457444787025452, -0.5296576619148254, -0.5135709047317505, -0.49748408794403076, -0.48139727115631104, -0.4653104841709137, -0.44922369718551636, -0.43313688039779663, -0.4170500934123993, -0.40096330642700195, -0.3848764896392822, -0.3687897026538849, -0.35270291566848755, -0.3366160988807678, -0.3205293118953705, -0.30444252490997314, -0.2883557081222534, -0.2722689211368561, -0.25618210434913635, -0.240095317363739, -0.22400851547718048, -0.20792171359062195, -0.1918349266052246, -0.17574812471866608, -0.15966132283210754, -0.143574520945549, -0.12748771905899048, -0.11140093207359314, -0.0953141301870346, -0.07922732830047607, -0.06314053386449814, -0.0470537394285202, -0.030966997146606445, -0.014880198985338211, 0.0012065991759300232, 0.017293397337198257, 0.03338019549846649, 0.049466997385025024, 0.06555379182100296, 0.0816405862569809, 0.09772738814353943, 0.11381419003009796, 0.1299009919166565, 0.14598777890205383, 0.16207458078861237, 0.1781613826751709, 0.19424816966056824, 0.21033497154712677, 0.2264217734336853, 0.24250857532024384, 0.25859537720680237, 0.2746821641921997, 0.29076898097991943, 0.3068557679653168, 0.3229425549507141, 0.33902937173843384, 0.3551161587238312, 0.3712029457092285, 0.38728976249694824, 0.4033765494823456, 0.4194633364677429, 0.43555015325546265, 0.45163694024086, 0.4677237272262573, 0.48381054401397705]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 10.0, 16.0, 31.0, 45.0, 75.0, 122.0, 289.0, 765.0, 2631.0, 9783.0, 47223.0, 241313.0, 515732.0, 184080.0, 35484.0, 7617.0, 2140.0, 654.0, 244.0, 100.0, 59.0, 35.0, 18.0, 22.0, 17.0, 8.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.132659912109375, -0.12799072265625, -0.123321533203125, -0.11865234375, -0.113983154296875, -0.10931396484375, -0.104644775390625, -0.0999755859375, -0.095306396484375, -0.09063720703125, -0.085968017578125, -0.081298828125, -0.076629638671875, -0.07196044921875, -0.067291259765625, -0.0626220703125, -0.057952880859375, -0.05328369140625, -0.048614501953125, -0.0439453125, -0.039276123046875, -0.03460693359375, -0.029937744140625, -0.0252685546875, -0.020599365234375, -0.01593017578125, -0.011260986328125, -0.006591796875, -0.001922607421875, 0.00274658203125, 0.007415771484375, 0.0120849609375, 0.016754150390625, 0.02142333984375, 0.026092529296875, 0.03076171875, 0.035430908203125, 0.04010009765625, 0.044769287109375, 0.0494384765625, 0.054107666015625, 0.05877685546875, 0.063446044921875, 0.068115234375, 0.072784423828125, 0.07745361328125, 0.082122802734375, 0.0867919921875, 0.091461181640625, 0.09613037109375, 0.100799560546875, 0.10546875, 0.110137939453125, 0.11480712890625, 0.119476318359375, 0.1241455078125, 0.128814697265625, 0.13348388671875, 0.138153076171875, 0.142822265625, 0.147491455078125, 0.15216064453125, 0.156829833984375, 0.1614990234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 11.0, 24.0, 26.0, 20.0, 24.0, 26.0, 40.0, 35.0, 43.0, 53.0, 65.0, 48.0, 59.0, 61.0, 40.0, 48.0, 41.0, 43.0, 47.0, 31.0, 38.0, 23.0, 19.0, 16.0, 22.0, 21.0, 9.0, 12.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.4308204650878906, -0.41779327392578125, -0.4047660827636719, -0.3917388916015625, -0.3787117004394531, -0.36568450927734375, -0.3526573181152344, -0.339630126953125, -0.3266029357910156, -0.31357574462890625, -0.3005485534667969, -0.2875213623046875, -0.2744941711425781, -0.26146697998046875, -0.24843978881835938, -0.23541259765625, -0.22238540649414062, -0.20935821533203125, -0.19633102416992188, -0.1833038330078125, -0.17027664184570312, -0.15724945068359375, -0.14422225952148438, -0.131195068359375, -0.11816787719726562, -0.10514068603515625, -0.09211349487304688, -0.0790863037109375, -0.06605911254882812, -0.05303192138671875, -0.040004730224609375, -0.0269775390625, -0.013950347900390625, -0.00092315673828125, 0.012104034423828125, 0.0251312255859375, 0.038158416748046875, 0.05118560791015625, 0.06421279907226562, 0.077239990234375, 0.09026718139648438, 0.10329437255859375, 0.11632156372070312, 0.1293487548828125, 0.14237594604492188, 0.15540313720703125, 0.16843032836914062, 0.18145751953125, 0.19448471069335938, 0.20751190185546875, 0.22053909301757812, 0.2335662841796875, 0.24659347534179688, 0.25962066650390625, 0.2726478576660156, 0.285675048828125, 0.2987022399902344, 0.31172943115234375, 0.3247566223144531, 0.3377838134765625, 0.3508110046386719, 0.36383819580078125, 0.3768653869628906, 0.389892578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 11.0, 20.0, 17.0, 15.0, 39.0, 41.0, 61.0, 108.0, 146.0, 211.0, 408.0, 706.0, 1524.0, 3720.0, 9859.0, 29533.0, 92137.0, 246128.0, 350523.0, 205045.0, 71917.0, 22911.0, 7794.0, 2877.0, 1265.0, 569.0, 344.0, 199.0, 127.0, 86.0, 64.0, 48.0, 36.0, 21.0, 15.0, 7.0, 11.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09136962890625, -0.08854866027832031, -0.08572769165039062, -0.08290672302246094, -0.08008575439453125, -0.07726478576660156, -0.07444381713867188, -0.07162284851074219, -0.0688018798828125, -0.06598091125488281, -0.06315994262695312, -0.06033897399902344, -0.05751800537109375, -0.05469703674316406, -0.051876068115234375, -0.04905509948730469, -0.046234130859375, -0.04341316223144531, -0.040592193603515625, -0.03777122497558594, -0.03495025634765625, -0.03212928771972656, -0.029308319091796875, -0.026487350463867188, -0.0236663818359375, -0.020845413208007812, -0.018024444580078125, -0.015203475952148438, -0.01238250732421875, -0.009561538696289062, -0.006740570068359375, -0.0039196014404296875, -0.0010986328125, 0.0017223358154296875, 0.004543304443359375, 0.0073642730712890625, 0.01018524169921875, 0.013006210327148438, 0.015827178955078125, 0.018648147583007812, 0.0214691162109375, 0.024290084838867188, 0.027111053466796875, 0.029932022094726562, 0.03275299072265625, 0.03557395935058594, 0.038394927978515625, 0.04121589660644531, 0.044036865234375, 0.04685783386230469, 0.049678802490234375, 0.05249977111816406, 0.05532073974609375, 0.05814170837402344, 0.060962677001953125, 0.06378364562988281, 0.0666046142578125, 0.06942558288574219, 0.07224655151367188, 0.07506752014160156, 0.07788848876953125, 0.08070945739746094, 0.08353042602539062, 0.08635139465332031, 0.08917236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 6.0, 9.0, 12.0, 14.0, 14.0, 18.0, 15.0, 27.0, 22.0, 29.0, 22.0, 38.0, 52.0, 36.0, 53.0, 47.0, 43.0, 42.0, 54.0, 53.0, 42.0, 38.0, 34.0, 41.0, 34.0, 31.0, 23.0, 20.0, 21.0, 20.0, 19.0, 10.0, 15.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6744918823242188, -0.6522064208984375, -0.6299209594726562, -0.607635498046875, -0.5853500366210938, -0.5630645751953125, -0.5407791137695312, -0.51849365234375, -0.49620819091796875, -0.4739227294921875, -0.45163726806640625, -0.429351806640625, -0.40706634521484375, -0.3847808837890625, -0.36249542236328125, -0.3402099609375, -0.31792449951171875, -0.2956390380859375, -0.27335357666015625, -0.251068115234375, -0.22878265380859375, -0.2064971923828125, -0.18421173095703125, -0.16192626953125, -0.13964080810546875, -0.1173553466796875, -0.09506988525390625, -0.072784423828125, -0.05049896240234375, -0.0282135009765625, -0.00592803955078125, 0.016357421875, 0.03864288330078125, 0.0609283447265625, 0.08321380615234375, 0.105499267578125, 0.12778472900390625, 0.1500701904296875, 0.17235565185546875, 0.19464111328125, 0.21692657470703125, 0.2392120361328125, 0.26149749755859375, 0.283782958984375, 0.30606842041015625, 0.3283538818359375, 0.35063934326171875, 0.3729248046875, 0.39521026611328125, 0.4174957275390625, 0.43978118896484375, 0.462066650390625, 0.48435211181640625, 0.5066375732421875, 0.5289230346679688, 0.55120849609375, 0.5734939575195312, 0.5957794189453125, 0.6180648803710938, 0.640350341796875, 0.6626358032226562, 0.6849212646484375, 0.7072067260742188, 0.7294921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 21.0, 20.0, 34.0, 71.0, 135.0, 171.0, 271.0, 475.0, 957.0, 1896.0, 4547.0, 14045.0, 58106.0, 283479.0, 496991.0, 142935.0, 30054.0, 8158.0, 2990.0, 1377.0, 681.0, 427.0, 275.0, 133.0, 90.0, 56.0, 47.0, 23.0, 15.0, 5.0, 12.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047760009765625, -0.0462803840637207, -0.044800758361816406, -0.04332113265991211, -0.04184150695800781, -0.040361881256103516, -0.03888225555419922, -0.03740262985229492, -0.035923004150390625, -0.03444337844848633, -0.03296375274658203, -0.031484127044677734, -0.030004501342773438, -0.02852487564086914, -0.027045249938964844, -0.025565624237060547, -0.02408599853515625, -0.022606372833251953, -0.021126747131347656, -0.01964712142944336, -0.018167495727539062, -0.016687870025634766, -0.015208244323730469, -0.013728618621826172, -0.012248992919921875, -0.010769367218017578, -0.009289741516113281, -0.007810115814208984, -0.0063304901123046875, -0.004850864410400391, -0.0033712387084960938, -0.0018916130065917969, -0.0004119873046875, 0.0010676383972167969, 0.0025472640991210938, 0.004026889801025391, 0.0055065155029296875, 0.006986141204833984, 0.008465766906738281, 0.009945392608642578, 0.011425018310546875, 0.012904644012451172, 0.014384269714355469, 0.015863895416259766, 0.017343521118164062, 0.01882314682006836, 0.020302772521972656, 0.021782398223876953, 0.02326202392578125, 0.024741649627685547, 0.026221275329589844, 0.02770090103149414, 0.029180526733398438, 0.030660152435302734, 0.03213977813720703, 0.03361940383911133, 0.035099029541015625, 0.03657865524291992, 0.03805828094482422, 0.039537906646728516, 0.04101753234863281, 0.04249715805053711, 0.043976783752441406, 0.0454564094543457, 0.04693603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 15.0, 24.0, 23.0, 26.0, 30.0, 36.0, 59.0, 69.0, 86.0, 85.0, 63.0, 90.0, 80.0, 54.0, 56.0, 39.0, 36.0, 20.0, 21.0, 21.0, 14.0, 11.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4600344002246857e-05, -1.4120712876319885e-05, -1.3641081750392914e-05, -1.3161450624465942e-05, -1.2681819498538971e-05, -1.2202188372612e-05, -1.1722557246685028e-05, -1.1242926120758057e-05, -1.0763294994831085e-05, -1.0283663868904114e-05, -9.804032742977142e-06, -9.324401617050171e-06, -8.8447704911232e-06, -8.365139365196228e-06, -7.885508239269257e-06, -7.405877113342285e-06, -6.926245987415314e-06, -6.446614861488342e-06, -5.966983735561371e-06, -5.487352609634399e-06, -5.007721483707428e-06, -4.5280903577804565e-06, -4.048459231853485e-06, -3.5688281059265137e-06, -3.0891969799995422e-06, -2.609565854072571e-06, -2.1299347281455994e-06, -1.650303602218628e-06, -1.1706724762916565e-06, -6.910413503646851e-07, -2.1141022443771362e-07, 2.682209014892578e-07, 7.478520274162292e-07, 1.2274831533432007e-06, 1.7071142792701721e-06, 2.1867454051971436e-06, 2.666376531124115e-06, 3.1460076570510864e-06, 3.625638782978058e-06, 4.105269908905029e-06, 4.584901034832001e-06, 5.064532160758972e-06, 5.544163286685944e-06, 6.023794412612915e-06, 6.5034255385398865e-06, 6.983056664466858e-06, 7.462687790393829e-06, 7.9423189163208e-06, 8.421950042247772e-06, 8.901581168174744e-06, 9.381212294101715e-06, 9.860843420028687e-06, 1.0340474545955658e-05, 1.082010567188263e-05, 1.12997367978096e-05, 1.1779367923736572e-05, 1.2258999049663544e-05, 1.2738630175590515e-05, 1.3218261301517487e-05, 1.3697892427444458e-05, 1.417752355337143e-05, 1.4657154679298401e-05, 1.5136785805225372e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 3.0, 8.0, 10.0, 13.0, 15.0, 16.0, 27.0, 29.0, 39.0, 69.0, 93.0, 147.0, 282.0, 600.0, 1656.0, 5938.0, 29942.0, 217383.0, 615588.0, 147934.0, 21644.0, 4651.0, 1289.0, 501.0, 254.0, 125.0, 78.0, 53.0, 41.0, 34.0, 29.0, 13.0, 13.0, 9.0, 4.0, 5.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.08038330078125, -0.07823419570922852, -0.07608509063720703, -0.07393598556518555, -0.07178688049316406, -0.06963777542114258, -0.0674886703491211, -0.06533956527709961, -0.06319046020507812, -0.06104135513305664, -0.058892250061035156, -0.05674314498901367, -0.05459403991699219, -0.0524449348449707, -0.05029582977294922, -0.048146724700927734, -0.04599761962890625, -0.043848514556884766, -0.04169940948486328, -0.0395503044128418, -0.03740119934082031, -0.03525209426879883, -0.033102989196777344, -0.03095388412475586, -0.028804779052734375, -0.02665567398071289, -0.024506568908691406, -0.022357463836669922, -0.020208358764648438, -0.018059253692626953, -0.01591014862060547, -0.013761043548583984, -0.0116119384765625, -0.009462833404541016, -0.007313728332519531, -0.005164623260498047, -0.0030155181884765625, -0.0008664131164550781, 0.0012826919555664062, 0.0034317970275878906, 0.005580902099609375, 0.007730007171630859, 0.009879112243652344, 0.012028217315673828, 0.014177322387695312, 0.016326427459716797, 0.01847553253173828, 0.020624637603759766, 0.02277374267578125, 0.024922847747802734, 0.02707195281982422, 0.029221057891845703, 0.03137016296386719, 0.03351926803588867, 0.035668373107910156, 0.03781747817993164, 0.039966583251953125, 0.04211568832397461, 0.044264793395996094, 0.04641389846801758, 0.04856300354003906, 0.05071210861206055, 0.05286121368408203, 0.055010318756103516, 0.057159423828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 4.0, 14.0, 19.0, 11.0, 10.0, 14.0, 30.0, 32.0, 41.0, 65.0, 64.0, 83.0, 99.0, 78.0, 68.0, 59.0, 59.0, 37.0, 47.0, 36.0, 21.0, 29.0, 13.0, 9.0, 7.0, 10.0, 7.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011399984359741211, -0.010959148406982422, -0.010518312454223633, -0.010077476501464844, -0.009636640548706055, -0.009195804595947266, -0.008754968643188477, -0.008314132690429688, -0.007873296737670898, -0.007432460784912109, -0.00699162483215332, -0.006550788879394531, -0.006109952926635742, -0.005669116973876953, -0.005228281021118164, -0.004787445068359375, -0.004346609115600586, -0.003905773162841797, -0.003464937210083008, -0.0030241012573242188, -0.0025832653045654297, -0.0021424293518066406, -0.0017015933990478516, -0.0012607574462890625, -0.0008199214935302734, -0.0003790855407714844, 6.175041198730469e-05, 0.0005025863647460938, 0.0009434223175048828, 0.0013842582702636719, 0.001825094223022461, 0.00226593017578125, 0.002706766128540039, 0.003147602081298828, 0.003588438034057617, 0.004029273986816406, 0.004470109939575195, 0.004910945892333984, 0.0053517818450927734, 0.0057926177978515625, 0.0062334537506103516, 0.006674289703369141, 0.00711512565612793, 0.007555961608886719, 0.007996797561645508, 0.008437633514404297, 0.008878469467163086, 0.009319305419921875, 0.009760141372680664, 0.010200977325439453, 0.010641813278198242, 0.011082649230957031, 0.01152348518371582, 0.01196432113647461, 0.012405157089233398, 0.012845993041992188, 0.013286828994750977, 0.013727664947509766, 0.014168500900268555, 0.014609336853027344, 0.015050172805786133, 0.015491008758544922, 0.01593184471130371, 0.0163726806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 15.0, 36.0, 60.0, 121.0, 177.0, 206.0, 150.0, 119.0, 56.0, 25.0, 17.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1063568592071533, -1.0711039304733276, -1.0358508825302124, -1.0005979537963867, -0.9653449058532715, -0.930091917514801, -0.8948389291763306, -0.8595860004425049, -0.8243329524993896, -0.7890799641609192, -0.7538269758224487, -0.7185739874839783, -0.6833209991455078, -0.6480680108070374, -0.6128150224685669, -0.5775620937347412, -0.5423091053962708, -0.5070561170578003, -0.47180312871932983, -0.4365501403808594, -0.4012971520423889, -0.36604416370391846, -0.3307912051677704, -0.2955382168292999, -0.26028522849082947, -0.225032240152359, -0.18977925181388855, -0.15452627837657928, -0.11927329003810883, -0.08402030169963837, -0.0487673282623291, -0.013514339923858643, 0.021738648414611816, 0.05699163302779198, 0.09224461764097214, 0.127497598528862, 0.16275058686733246, 0.19800357520580292, 0.23325654864311218, 0.26850953698158264, 0.3037625253200531, 0.33901551365852356, 0.374268501996994, 0.4095214605331421, 0.44477444887161255, 0.480027437210083, 0.5152804255485535, 0.5505334138870239, 0.5857864022254944, 0.6210393905639648, 0.6562923789024353, 0.6915453672409058, 0.7267983555793762, 0.7620513439178467, 0.7973042726516724, 0.8325573205947876, 0.8678102493286133, 0.9030632376670837, 0.9383162260055542, 0.9735692143440247, 1.0088222026824951, 1.0440751314163208, 1.079328179359436, 1.1145811080932617, 1.149834156036377]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 17.0, 16.0, 15.0, 21.0, 27.0, 28.0, 35.0, 31.0, 32.0, 45.0, 50.0, 54.0, 49.0, 47.0, 46.0, 62.0, 42.0, 40.0, 42.0, 40.0, 40.0, 30.0, 33.0, 22.0, 13.0, 13.0, 13.0, 29.0, 5.0, 10.0, 8.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4031316637992859, -0.3914082944393158, -0.3796849250793457, -0.367961585521698, -0.3562382161617279, -0.3445148468017578, -0.3327914774417877, -0.3210681080818176, -0.3093447685241699, -0.29762139916419983, -0.28589802980422974, -0.27417469024658203, -0.26245132088661194, -0.25072795152664185, -0.23900458216667175, -0.22728121280670166, -0.21555784344673157, -0.20383447408676147, -0.19211111962795258, -0.18038775026798248, -0.16866439580917358, -0.1569410264492035, -0.1452176570892334, -0.1334942877292633, -0.1217709332704544, -0.11004757136106491, -0.09832420945167542, -0.08660084009170532, -0.07487747818231583, -0.06315411627292633, -0.05143074691295624, -0.03970738500356674, -0.027984023094177246, -0.0162606593221426, -0.004537295550107956, 0.007186070084571838, 0.018909431993961334, 0.03063279390335083, 0.04235616326332092, 0.05407952517271042, 0.06580288708209991, 0.07752624899148941, 0.0892496109008789, 0.100972980260849, 0.1126963421702385, 0.12441970407962799, 0.13614307343959808, 0.14786642789840698, 0.15958979725837708, 0.17131316661834717, 0.18303652107715607, 0.19475989043712616, 0.20648324489593506, 0.21820661425590515, 0.22992998361587524, 0.24165335297584534, 0.25337672233581543, 0.2651000916957855, 0.2768234610557556, 0.2885468006134033, 0.3002701699733734, 0.3119935393333435, 0.3237169086933136, 0.3354402780532837, 0.3471636176109314]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 12.0, 23.0, 40.0, 33.0, 53.0, 76.0, 125.0, 197.0, 338.0, 670.0, 1199.0, 2632.0, 5935.0, 14758.0, 40763.0, 126765.0, 387263.0, 319054.0, 95520.0, 31548.0, 11919.0, 4974.0, 2139.0, 1065.0, 565.0, 318.0, 171.0, 106.0, 80.0, 53.0, 40.0, 30.0, 16.0, 13.0, 14.0, 9.0, 7.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.343994140625, -0.3341331481933594, -0.32427215576171875, -0.3144111633300781, -0.3045501708984375, -0.2946891784667969, -0.28482818603515625, -0.2749671936035156, -0.265106201171875, -0.2552452087402344, -0.24538421630859375, -0.23552322387695312, -0.2256622314453125, -0.21580123901367188, -0.20594024658203125, -0.19607925415039062, -0.18621826171875, -0.17635726928710938, -0.16649627685546875, -0.15663528442382812, -0.1467742919921875, -0.13691329956054688, -0.12705230712890625, -0.11719131469726562, -0.107330322265625, -0.09746932983398438, -0.08760833740234375, -0.07774734497070312, -0.0678863525390625, -0.058025360107421875, -0.04816436767578125, -0.038303375244140625, -0.0284423828125, -0.018581390380859375, -0.00872039794921875, 0.001140594482421875, 0.0110015869140625, 0.020862579345703125, 0.03072357177734375, 0.040584564208984375, 0.050445556640625, 0.060306549072265625, 0.07016754150390625, 0.08002853393554688, 0.0898895263671875, 0.09975051879882812, 0.10961151123046875, 0.11947250366210938, 0.12933349609375, 0.13919448852539062, 0.14905548095703125, 0.15891647338867188, 0.1687774658203125, 0.17863845825195312, 0.18849945068359375, 0.19836044311523438, 0.208221435546875, 0.21808242797851562, 0.22794342041015625, 0.23780441284179688, 0.2476654052734375, 0.2575263977050781, 0.26738739013671875, 0.2772483825683594, 0.287109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 10.0, 10.0, 3.0, 16.0, 20.0, 13.0, 18.0, 27.0, 33.0, 30.0, 27.0, 24.0, 41.0, 47.0, 47.0, 43.0, 39.0, 45.0, 47.0, 54.0, 35.0, 57.0, 32.0, 42.0, 34.0, 37.0, 27.0, 20.0, 16.0, 11.0, 14.0, 6.0, 12.0, 11.0, 8.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7348556518554688, -0.7123870849609375, -0.6899185180664062, -0.667449951171875, -0.6449813842773438, -0.6225128173828125, -0.6000442504882812, -0.57757568359375, -0.5551071166992188, -0.5326385498046875, -0.5101699829101562, -0.487701416015625, -0.46523284912109375, -0.4427642822265625, -0.42029571533203125, -0.3978271484375, -0.37535858154296875, -0.3528900146484375, -0.33042144775390625, -0.307952880859375, -0.28548431396484375, -0.2630157470703125, -0.24054718017578125, -0.21807861328125, -0.19561004638671875, -0.1731414794921875, -0.15067291259765625, -0.128204345703125, -0.10573577880859375, -0.0832672119140625, -0.06079864501953125, -0.038330078125, -0.01586151123046875, 0.0066070556640625, 0.02907562255859375, 0.051544189453125, 0.07401275634765625, 0.0964813232421875, 0.11894989013671875, 0.14141845703125, 0.16388702392578125, 0.1863555908203125, 0.20882415771484375, 0.231292724609375, 0.25376129150390625, 0.2762298583984375, 0.29869842529296875, 0.3211669921875, 0.34363555908203125, 0.3661041259765625, 0.38857269287109375, 0.411041259765625, 0.43350982666015625, 0.4559783935546875, 0.47844696044921875, 0.50091552734375, 0.5233840942382812, 0.5458526611328125, 0.5683212280273438, 0.590789794921875, 0.6132583618164062, 0.6357269287109375, 0.6581954956054688, 0.6806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 0.0, 8.0, 11.0, 13.0, 12.0, 23.0, 15.0, 41.0, 28.0, 54.0, 80.0, 94.0, 140.0, 195.0, 368.0, 652.0, 2524.0, 23424.0, 436296.0, 549268.0, 30359.0, 2958.0, 798.0, 367.0, 248.0, 138.0, 114.0, 85.0, 58.0, 54.0, 32.0, 19.0, 14.0, 9.0, 9.0, 15.0, 8.0, 0.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6923828125, -0.6700820922851562, -0.6477813720703125, -0.6254806518554688, -0.603179931640625, -0.5808792114257812, -0.5585784912109375, -0.5362777709960938, -0.51397705078125, -0.49167633056640625, -0.4693756103515625, -0.44707489013671875, -0.424774169921875, -0.40247344970703125, -0.3801727294921875, -0.35787200927734375, -0.3355712890625, -0.31327056884765625, -0.2909698486328125, -0.26866912841796875, -0.246368408203125, -0.22406768798828125, -0.2017669677734375, -0.17946624755859375, -0.15716552734375, -0.13486480712890625, -0.1125640869140625, -0.09026336669921875, -0.067962646484375, -0.04566192626953125, -0.0233612060546875, -0.00106048583984375, 0.021240234375, 0.04354095458984375, 0.0658416748046875, 0.08814239501953125, 0.110443115234375, 0.13274383544921875, 0.1550445556640625, 0.17734527587890625, 0.19964599609375, 0.22194671630859375, 0.2442474365234375, 0.26654815673828125, 0.288848876953125, 0.31114959716796875, 0.3334503173828125, 0.35575103759765625, 0.3780517578125, 0.40035247802734375, 0.4226531982421875, 0.44495391845703125, 0.467254638671875, 0.48955535888671875, 0.5118560791015625, 0.5341567993164062, 0.55645751953125, 0.5787582397460938, 0.6010589599609375, 0.6233596801757812, 0.645660400390625, 0.6679611206054688, 0.6902618408203125, 0.7125625610351562, 0.73486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 4.0, 19.0, 11.0, 10.0, 15.0, 17.0, 15.0, 25.0, 19.0, 22.0, 26.0, 39.0, 42.0, 44.0, 35.0, 37.0, 51.0, 38.0, 35.0, 44.0, 49.0, 32.0, 38.0, 44.0, 34.0, 31.0, 31.0, 27.0, 31.0, 19.0, 16.0, 16.0, 11.0, 10.0, 12.0, 11.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.79736328125, -0.772491455078125, -0.74761962890625, -0.722747802734375, -0.6978759765625, -0.673004150390625, -0.64813232421875, -0.623260498046875, -0.598388671875, -0.573516845703125, -0.54864501953125, -0.523773193359375, -0.4989013671875, -0.474029541015625, -0.44915771484375, -0.424285888671875, -0.3994140625, -0.374542236328125, -0.34967041015625, -0.324798583984375, -0.2999267578125, -0.275054931640625, -0.25018310546875, -0.225311279296875, -0.200439453125, -0.175567626953125, -0.15069580078125, -0.125823974609375, -0.1009521484375, -0.076080322265625, -0.05120849609375, -0.026336669921875, -0.00146484375, 0.023406982421875, 0.04827880859375, 0.073150634765625, 0.0980224609375, 0.122894287109375, 0.14776611328125, 0.172637939453125, 0.197509765625, 0.222381591796875, 0.24725341796875, 0.272125244140625, 0.2969970703125, 0.321868896484375, 0.34674072265625, 0.371612548828125, 0.396484375, 0.421356201171875, 0.44622802734375, 0.471099853515625, 0.4959716796875, 0.520843505859375, 0.54571533203125, 0.570587158203125, 0.595458984375, 0.620330810546875, 0.64520263671875, 0.670074462890625, 0.6949462890625, 0.719818115234375, 0.74468994140625, 0.769561767578125, 0.79443359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 2.0, 7.0, 12.0, 10.0, 25.0, 31.0, 41.0, 63.0, 95.0, 174.0, 376.0, 929.0, 2940.0, 14993.0, 166586.0, 758063.0, 90472.0, 9887.0, 2325.0, 772.0, 300.0, 161.0, 90.0, 58.0, 39.0, 19.0, 16.0, 13.0, 9.0, 5.0, 4.0, 4.0, 10.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2225341796875, -0.21566390991210938, -0.20879364013671875, -0.20192337036132812, -0.1950531005859375, -0.18818283081054688, -0.18131256103515625, -0.17444229125976562, -0.167572021484375, -0.16070175170898438, -0.15383148193359375, -0.14696121215820312, -0.1400909423828125, -0.13322067260742188, -0.12635040283203125, -0.11948013305664062, -0.11260986328125, -0.10573959350585938, -0.09886932373046875, -0.09199905395507812, -0.0851287841796875, -0.07825851440429688, -0.07138824462890625, -0.06451797485351562, -0.057647705078125, -0.050777435302734375, -0.04390716552734375, -0.037036895751953125, -0.0301666259765625, -0.023296356201171875, -0.01642608642578125, -0.009555816650390625, -0.002685546875, 0.004184722900390625, 0.01105499267578125, 0.017925262451171875, 0.0247955322265625, 0.031665802001953125, 0.03853607177734375, 0.045406341552734375, 0.052276611328125, 0.059146881103515625, 0.06601715087890625, 0.07288742065429688, 0.0797576904296875, 0.08662796020507812, 0.09349822998046875, 0.10036849975585938, 0.10723876953125, 0.11410903930664062, 0.12097930908203125, 0.12784957885742188, 0.1347198486328125, 0.14159011840820312, 0.14846038818359375, 0.15533065795898438, 0.162200927734375, 0.16907119750976562, 0.17594146728515625, 0.18281173706054688, 0.1896820068359375, 0.19655227661132812, 0.20342254638671875, 0.21029281616210938, 0.2171630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 7.0, 9.0, 11.0, 29.0, 35.0, 60.0, 71.0, 97.0, 94.0, 96.0, 99.0, 106.0, 71.0, 55.0, 53.0, 35.0, 13.0, 13.0, 9.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.147125244140625e-05, -3.0734576284885406e-05, -2.9997900128364563e-05, -2.926122397184372e-05, -2.8524547815322876e-05, -2.7787871658802032e-05, -2.705119550228119e-05, -2.6314519345760345e-05, -2.5577843189239502e-05, -2.484116703271866e-05, -2.4104490876197815e-05, -2.336781471967697e-05, -2.2631138563156128e-05, -2.1894462406635284e-05, -2.115778625011444e-05, -2.0421110093593597e-05, -1.9684433937072754e-05, -1.894775778055191e-05, -1.8211081624031067e-05, -1.7474405467510223e-05, -1.673772931098938e-05, -1.6001053154468536e-05, -1.5264376997947693e-05, -1.452770084142685e-05, -1.3791024684906006e-05, -1.3054348528385162e-05, -1.2317672371864319e-05, -1.1580996215343475e-05, -1.0844320058822632e-05, -1.0107643902301788e-05, -9.370967745780945e-06, -8.634291589260101e-06, -7.897615432739258e-06, -7.160939276218414e-06, -6.424263119697571e-06, -5.687586963176727e-06, -4.950910806655884e-06, -4.21423465013504e-06, -3.4775584936141968e-06, -2.7408823370933533e-06, -2.0042061805725098e-06, -1.2675300240516663e-06, -5.308538675308228e-07, 2.0582228899002075e-07, 9.424984455108643e-07, 1.6791746020317078e-06, 2.4158507585525513e-06, 3.1525269150733948e-06, 3.889203071594238e-06, 4.625879228115082e-06, 5.362555384635925e-06, 6.099231541156769e-06, 6.835907697677612e-06, 7.572583854198456e-06, 8.3092600107193e-06, 9.045936167240143e-06, 9.782612323760986e-06, 1.051928848028183e-05, 1.1255964636802673e-05, 1.1992640793323517e-05, 1.272931694984436e-05, 1.3465993106365204e-05, 1.4202669262886047e-05, 1.4939345419406891e-05, 1.5676021575927734e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 16.0, 16.0, 27.0, 34.0, 48.0, 110.0, 181.0, 359.0, 970.0, 2677.0, 12807.0, 240403.0, 750084.0, 33701.0, 4627.0, 1394.0, 510.0, 243.0, 122.0, 75.0, 38.0, 21.0, 24.0, 16.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2856292724609375, -0.275848388671875, -0.2660675048828125, -0.25628662109375, -0.2465057373046875, -0.236724853515625, -0.2269439697265625, -0.2171630859375, -0.2073822021484375, -0.197601318359375, -0.1878204345703125, -0.17803955078125, -0.1682586669921875, -0.158477783203125, -0.1486968994140625, -0.138916015625, -0.1291351318359375, -0.119354248046875, -0.1095733642578125, -0.09979248046875, -0.0900115966796875, -0.080230712890625, -0.0704498291015625, -0.0606689453125, -0.0508880615234375, -0.041107177734375, -0.0313262939453125, -0.02154541015625, -0.0117645263671875, -0.001983642578125, 0.0077972412109375, 0.017578125, 0.0273590087890625, 0.037139892578125, 0.0469207763671875, 0.05670166015625, 0.0664825439453125, 0.076263427734375, 0.0860443115234375, 0.0958251953125, 0.1056060791015625, 0.115386962890625, 0.1251678466796875, 0.13494873046875, 0.1447296142578125, 0.154510498046875, 0.1642913818359375, 0.174072265625, 0.1838531494140625, 0.193634033203125, 0.2034149169921875, 0.21319580078125, 0.2229766845703125, 0.232757568359375, 0.2425384521484375, 0.2523193359375, 0.2621002197265625, 0.271881103515625, 0.2816619873046875, 0.29144287109375, 0.3012237548828125, 0.311004638671875, 0.3207855224609375, 0.33056640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 10.0, 11.0, 27.0, 40.0, 54.0, 78.0, 87.0, 108.0, 130.0, 102.0, 91.0, 68.0, 47.0, 40.0, 23.0, 21.0, 14.0, 12.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09344673156738281, -0.09064102172851562, -0.08783531188964844, -0.08502960205078125, -0.08222389221191406, -0.07941818237304688, -0.07661247253417969, -0.0738067626953125, -0.07100105285644531, -0.06819534301757812, -0.06538963317871094, -0.06258392333984375, -0.05977821350097656, -0.056972503662109375, -0.05416679382324219, -0.051361083984375, -0.04855537414550781, -0.045749664306640625, -0.04294395446777344, -0.04013824462890625, -0.03733253479003906, -0.034526824951171875, -0.03172111511230469, -0.0289154052734375, -0.026109695434570312, -0.023303985595703125, -0.020498275756835938, -0.01769256591796875, -0.014886856079101562, -0.012081146240234375, -0.009275436401367188, -0.0064697265625, -0.0036640167236328125, -0.000858306884765625, 0.0019474029541015625, 0.00475311279296875, 0.0075588226318359375, 0.010364532470703125, 0.013170242309570312, 0.0159759521484375, 0.018781661987304688, 0.021587371826171875, 0.024393081665039062, 0.02719879150390625, 0.030004501342773438, 0.032810211181640625, 0.03561592102050781, 0.038421630859375, 0.04122734069824219, 0.044033050537109375, 0.04683876037597656, 0.04964447021484375, 0.05245018005371094, 0.055255889892578125, 0.05806159973144531, 0.0608673095703125, 0.06367301940917969, 0.06647872924804688, 0.06928443908691406, 0.07209014892578125, 0.07489585876464844, 0.07770156860351562, 0.08050727844238281, 0.08331298828125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 9.0, 32.0, 56.0, 79.0, 113.0, 166.0, 144.0, 106.0, 117.0, 63.0, 47.0, 25.0, 7.0, 10.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8401200771331787, -1.7863998413085938, -1.7326794862747192, -1.6789592504501343, -1.6252390146255493, -1.5715186595916748, -1.5177984237670898, -1.4640781879425049, -1.41035795211792, -1.356637716293335, -1.3029173612594604, -1.2491971254348755, -1.1954768896102905, -1.141756534576416, -1.088036298751831, -1.034316062927246, -0.9805957078933716, -0.9268754124641418, -0.8731551766395569, -0.8194348812103271, -0.7657146453857422, -0.7119943499565125, -0.6582740545272827, -0.6045538187026978, -0.550833523273468, -0.49711325764656067, -0.4433929920196533, -0.3896726965904236, -0.33595243096351624, -0.2822321653366089, -0.22851186990737915, -0.1747916042804718, -0.1210712194442749, -0.06735094636678696, -0.013630673289299011, 0.04008960723876953, 0.09380987286567688, 0.14753013849258423, 0.20125043392181396, 0.2549706995487213, 0.30869096517562866, 0.362411230802536, 0.41613149642944336, 0.4698517918586731, 0.5235720872879028, 0.5772923231124878, 0.6310126185417175, 0.6847329139709473, 0.7384531497955322, 0.792173445224762, 0.8458936810493469, 0.8996139764785767, 0.9533342123031616, 1.0070545673370361, 1.060774803161621, 1.114495038986206, 1.168215274810791, 1.221935510635376, 1.2756558656692505, 1.3293761014938354, 1.3830963373184204, 1.436816692352295, 1.4905369281768799, 1.5442571640014648, 1.5979775190353394]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 5.0, 7.0, 14.0, 12.0, 12.0, 19.0, 21.0, 24.0, 28.0, 30.0, 29.0, 34.0, 44.0, 45.0, 41.0, 43.0, 41.0, 47.0, 43.0, 46.0, 34.0, 36.0, 38.0, 42.0, 20.0, 25.0, 37.0, 24.0, 16.0, 26.0, 17.0, 19.0, 14.0, 8.0, 9.0, 2.0, 4.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.43735933303833, -1.3946735858917236, -1.3519877195358276, -1.3093019723892212, -1.2666162252426147, -1.2239303588867188, -1.1812446117401123, -1.1385588645935059, -1.0958729982376099, -1.0531872510910034, -1.0105013847351074, -0.967815637588501, -0.9251298308372498, -0.8824440240859985, -0.8397582769393921, -0.7970724701881409, -0.7543867230415344, -0.7117009162902832, -0.6690151691436768, -0.6263293623924255, -0.5836435556411743, -0.5409578084945679, -0.49827200174331665, -0.45558619499206543, -0.4129004180431366, -0.37021464109420776, -0.32752883434295654, -0.2848430573940277, -0.24215726554393768, -0.19947147369384766, -0.15678569674491882, -0.1140998899936676, -0.07141411304473877, -0.02872832491993904, 0.013957463204860687, 0.05664324760437012, 0.09932903945446014, 0.14201483130455017, 0.184700608253479, 0.22738641500473022, 0.27007219195365906, 0.3127579689025879, 0.3554437756538391, 0.39812955260276794, 0.4408153295516968, 0.483501136302948, 0.5261869430541992, 0.5688726902008057, 0.6115584969520569, 0.6542443037033081, 0.6969300508499146, 0.7396158576011658, 0.782301664352417, 0.8249874114990234, 0.8676732182502747, 0.9103590250015259, 0.9530447721481323, 0.9957305788993835, 1.0384163856506348, 1.0811021327972412, 1.1237878799438477, 1.1664737462997437, 1.20915949344635, 1.251845359802246, 1.2945311069488525]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 10.0, 24.0, 26.0, 45.0, 99.0, 175.0, 295.0, 600.0, 1449.0, 3827.0, 12624.0, 67879.0, 457585.0, 2209829.0, 1238807.0, 162885.0, 26826.0, 6875.0, 2388.0, 927.0, 470.0, 218.0, 138.0, 96.0, 50.0, 34.0, 15.0, 19.0, 14.0, 11.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5421218872070312, -0.5193023681640625, -0.49648284912109375, -0.473663330078125, -0.45084381103515625, -0.4280242919921875, -0.40520477294921875, -0.38238525390625, -0.35956573486328125, -0.3367462158203125, -0.31392669677734375, -0.291107177734375, -0.26828765869140625, -0.2454681396484375, -0.22264862060546875, -0.1998291015625, -0.17700958251953125, -0.1541900634765625, -0.13137054443359375, -0.108551025390625, -0.08573150634765625, -0.0629119873046875, -0.04009246826171875, -0.01727294921875, 0.00554656982421875, 0.0283660888671875, 0.05118560791015625, 0.074005126953125, 0.09682464599609375, 0.1196441650390625, 0.14246368408203125, 0.165283203125, 0.18810272216796875, 0.2109222412109375, 0.23374176025390625, 0.256561279296875, 0.27938079833984375, 0.3022003173828125, 0.32501983642578125, 0.34783935546875, 0.37065887451171875, 0.3934783935546875, 0.41629791259765625, 0.439117431640625, 0.46193695068359375, 0.4847564697265625, 0.5075759887695312, 0.5303955078125, 0.5532150268554688, 0.5760345458984375, 0.5988540649414062, 0.621673583984375, 0.6444931030273438, 0.6673126220703125, 0.6901321411132812, 0.71295166015625, 0.7357711791992188, 0.7585906982421875, 0.7814102172851562, 0.804229736328125, 0.8270492553710938, 0.8498687744140625, 0.8726882934570312, 0.8955078125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 9.0, 4.0, 14.0, 11.0, 17.0, 19.0, 35.0, 35.0, 35.0, 20.0, 40.0, 30.0, 40.0, 57.0, 46.0, 66.0, 56.0, 43.0, 62.0, 38.0, 43.0, 36.0, 31.0, 26.0, 29.0, 19.0, 19.0, 14.0, 13.0, 14.0, 16.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5066871643066406, -0.49140167236328125, -0.4761161804199219, -0.4608306884765625, -0.4455451965332031, -0.43025970458984375, -0.4149742126464844, -0.399688720703125, -0.3844032287597656, -0.36911773681640625, -0.3538322448730469, -0.3385467529296875, -0.3232612609863281, -0.30797576904296875, -0.2926902770996094, -0.27740478515625, -0.2621192932128906, -0.24683380126953125, -0.23154830932617188, -0.2162628173828125, -0.20097732543945312, -0.18569183349609375, -0.17040634155273438, -0.155120849609375, -0.13983535766601562, -0.12454986572265625, -0.10926437377929688, -0.0939788818359375, -0.07869338989257812, -0.06340789794921875, -0.048122406005859375, -0.0328369140625, -0.017551422119140625, -0.00226593017578125, 0.013019561767578125, 0.0283050537109375, 0.043590545654296875, 0.05887603759765625, 0.07416152954101562, 0.089447021484375, 0.10473251342773438, 0.12001800537109375, 0.13530349731445312, 0.1505889892578125, 0.16587448120117188, 0.18115997314453125, 0.19644546508789062, 0.21173095703125, 0.22701644897460938, 0.24230194091796875, 0.2575874328613281, 0.2728729248046875, 0.2881584167480469, 0.30344390869140625, 0.3187294006347656, 0.334014892578125, 0.3493003845214844, 0.36458587646484375, 0.3798713684082031, 0.3951568603515625, 0.4104423522949219, 0.42572784423828125, 0.4410133361816406, 0.456298828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 6.0, 11.0, 18.0, 39.0, 52.0, 55.0, 96.0, 187.0, 297.0, 667.0, 1284.0, 3738.0, 16474.0, 134279.0, 2860129.0, 1103352.0, 59501.0, 9272.0, 2598.0, 1018.0, 496.0, 267.0, 145.0, 97.0, 55.0, 45.0, 29.0, 21.0, 14.0, 9.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814453125, -0.7862014770507812, -0.7579498291015625, -0.7296981811523438, -0.701446533203125, -0.6731948852539062, -0.6449432373046875, -0.6166915893554688, -0.58843994140625, -0.5601882934570312, -0.5319366455078125, -0.5036849975585938, -0.475433349609375, -0.44718170166015625, -0.4189300537109375, -0.39067840576171875, -0.3624267578125, -0.33417510986328125, -0.3059234619140625, -0.27767181396484375, -0.249420166015625, -0.22116851806640625, -0.1929168701171875, -0.16466522216796875, -0.13641357421875, -0.10816192626953125, -0.0799102783203125, -0.05165863037109375, -0.023406982421875, 0.00484466552734375, 0.0330963134765625, 0.06134796142578125, 0.089599609375, 0.11785125732421875, 0.1461029052734375, 0.17435455322265625, 0.202606201171875, 0.23085784912109375, 0.2591094970703125, 0.28736114501953125, 0.31561279296875, 0.34386444091796875, 0.3721160888671875, 0.40036773681640625, 0.428619384765625, 0.45687103271484375, 0.4851226806640625, 0.5133743286132812, 0.5416259765625, 0.5698776245117188, 0.5981292724609375, 0.6263809204101562, 0.654632568359375, 0.6828842163085938, 0.7111358642578125, 0.7393875122070312, 0.76763916015625, 0.7958908081054688, 0.8241424560546875, 0.8523941040039062, 0.880645751953125, 0.9088973999023438, 0.9371490478515625, 0.9654006958007812, 0.99365234375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 13.0, 8.0, 19.0, 16.0, 26.0, 47.0, 53.0, 66.0, 132.0, 142.0, 247.0, 350.0, 495.0, 542.0, 522.0, 432.0, 315.0, 208.0, 142.0, 78.0, 63.0, 35.0, 33.0, 26.0, 14.0, 13.0, 5.0, 7.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.2329864501953125, -0.225860595703125, -0.2187347412109375, -0.21160888671875, -0.2044830322265625, -0.197357177734375, -0.1902313232421875, -0.18310546875, -0.1759796142578125, -0.168853759765625, -0.1617279052734375, -0.15460205078125, -0.1474761962890625, -0.140350341796875, -0.1332244873046875, -0.1260986328125, -0.1189727783203125, -0.111846923828125, -0.1047210693359375, -0.09759521484375, -0.0904693603515625, -0.083343505859375, -0.0762176513671875, -0.069091796875, -0.0619659423828125, -0.054840087890625, -0.0477142333984375, -0.04058837890625, -0.0334625244140625, -0.026336669921875, -0.0192108154296875, -0.0120849609375, -0.0049591064453125, 0.002166748046875, 0.0092926025390625, 0.01641845703125, 0.0235443115234375, 0.030670166015625, 0.0377960205078125, 0.044921875, 0.0520477294921875, 0.059173583984375, 0.0662994384765625, 0.07342529296875, 0.0805511474609375, 0.087677001953125, 0.0948028564453125, 0.1019287109375, 0.1090545654296875, 0.116180419921875, 0.1233062744140625, 0.13043212890625, 0.1375579833984375, 0.144683837890625, 0.1518096923828125, 0.158935546875, 0.1660614013671875, 0.173187255859375, 0.1803131103515625, 0.18743896484375, 0.1945648193359375, 0.201690673828125, 0.2088165283203125, 0.2159423828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 13.0, 17.0, 22.0, 39.0, 61.0, 112.0, 97.0, 137.0, 131.0, 119.0, 95.0, 46.0, 50.0, 24.0, 9.0, 14.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3122243881225586, -1.2723603248596191, -1.2324962615966797, -1.1926320791244507, -1.1527680158615112, -1.1129039525985718, -1.0730398893356323, -1.0331757068634033, -0.9933116436004639, -0.9534475803375244, -0.9135834574699402, -0.8737193942070007, -0.8338552713394165, -0.793991208076477, -0.7541271448135376, -0.7142630219459534, -0.6743989586830139, -0.6345348954200745, -0.5946707725524902, -0.5548067092895508, -0.5149425864219666, -0.4750785231590271, -0.43521443009376526, -0.3953503370285034, -0.3554862439632416, -0.31562215089797974, -0.2757580578327179, -0.23589397966861725, -0.1960298866033554, -0.15616579353809357, -0.11630171537399292, -0.07643762230873108, -0.03657352924346924, 0.003290560096502304, 0.043154649436473846, 0.08301873505115509, 0.12288282811641693, 0.16274692118167877, 0.20261099934577942, 0.24247509241104126, 0.2823391854763031, 0.32220327854156494, 0.3620673716068268, 0.4019314646720886, 0.4417955279350281, 0.4816596508026123, 0.5215237140655518, 0.5613877773284912, 0.6012519001960754, 0.6411159634590149, 0.6809800863265991, 0.7208441495895386, 0.7607082724571228, 0.8005723357200623, 0.8404364585876465, 0.8803005218505859, 0.9201645851135254, 0.9600286483764648, 0.9998927712440491, 1.0397568941116333, 1.0796209573745728, 1.1194850206375122, 1.1593490839004517, 1.1992132663726807, 1.2390773296356201]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 11.0, 14.0, 12.0, 10.0, 13.0, 16.0, 16.0, 20.0, 20.0, 27.0, 29.0, 27.0, 34.0, 32.0, 32.0, 35.0, 36.0, 37.0, 44.0, 43.0, 42.0, 46.0, 30.0, 38.0, 31.0, 38.0, 32.0, 23.0, 24.0, 22.0, 23.0, 19.0, 17.0, 7.0, 13.0, 14.0, 10.0, 10.0, 5.0, 7.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.41921043395996094, -0.40491753816604614, -0.39062461256980896, -0.3763316869735718, -0.362038791179657, -0.3477458953857422, -0.333452969789505, -0.3191600441932678, -0.304867148399353, -0.29057425260543823, -0.27628132700920105, -0.26198840141296387, -0.24769550561904907, -0.23340259492397308, -0.2191096842288971, -0.2048167735338211, -0.19052386283874512, -0.17623095214366913, -0.16193804144859314, -0.14764513075351715, -0.13335222005844116, -0.11905930936336517, -0.10476639866828918, -0.0904734879732132, -0.07618057727813721, -0.06188766658306122, -0.04759475588798523, -0.03330184519290924, -0.019008934497833252, -0.004716023802757263, 0.009576886892318726, 0.023869797587394714, 0.0381627082824707, 0.05245561897754669, 0.06674852967262268, 0.08104144036769867, 0.09533435106277466, 0.10962726175785065, 0.12392017245292664, 0.13821308314800262, 0.1525059938430786, 0.1667989045381546, 0.1810918152332306, 0.19538472592830658, 0.20967763662338257, 0.22397054731845856, 0.23826345801353455, 0.25255638360977173, 0.2668492794036865, 0.2811421751976013, 0.2954351007938385, 0.3097280263900757, 0.3240209221839905, 0.3383138179779053, 0.35260674357414246, 0.36689966917037964, 0.38119256496429443, 0.39548546075820923, 0.4097783863544464, 0.4240713119506836, 0.4383642077445984, 0.4526571035385132, 0.46695002913475037, 0.48124295473098755, 0.49553585052490234]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 8.0, 16.0, 26.0, 35.0, 51.0, 67.0, 108.0, 214.0, 497.0, 1092.0, 2847.0, 9074.0, 32733.0, 134866.0, 420128.0, 327778.0, 87112.0, 21720.0, 6297.0, 2149.0, 809.0, 367.0, 210.0, 122.0, 65.0, 52.0, 32.0, 16.0, 15.0, 13.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1307373046875, -0.12649917602539062, -0.12226104736328125, -0.11802291870117188, -0.1137847900390625, -0.10954666137695312, -0.10530853271484375, -0.10107040405273438, -0.096832275390625, -0.09259414672851562, -0.08835601806640625, -0.08411788940429688, -0.0798797607421875, -0.07564163208007812, -0.07140350341796875, -0.06716537475585938, -0.06292724609375, -0.058689117431640625, -0.05445098876953125, -0.050212860107421875, -0.0459747314453125, -0.041736602783203125, -0.03749847412109375, -0.033260345458984375, -0.029022216796875, -0.024784088134765625, -0.02054595947265625, -0.016307830810546875, -0.0120697021484375, -0.007831573486328125, -0.00359344482421875, 0.000644683837890625, 0.0048828125, 0.009120941162109375, 0.01335906982421875, 0.017597198486328125, 0.0218353271484375, 0.026073455810546875, 0.03031158447265625, 0.034549713134765625, 0.038787841796875, 0.043025970458984375, 0.04726409912109375, 0.051502227783203125, 0.0557403564453125, 0.059978485107421875, 0.06421661376953125, 0.06845474243164062, 0.07269287109375, 0.07693099975585938, 0.08116912841796875, 0.08540725708007812, 0.0896453857421875, 0.09388351440429688, 0.09812164306640625, 0.10235977172851562, 0.106597900390625, 0.11083602905273438, 0.11507415771484375, 0.11931228637695312, 0.1235504150390625, 0.12778854370117188, 0.13202667236328125, 0.13626480102539062, 0.1405029296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 10.0, 7.0, 14.0, 10.0, 11.0, 14.0, 15.0, 21.0, 25.0, 18.0, 20.0, 25.0, 26.0, 31.0, 31.0, 44.0, 32.0, 39.0, 41.0, 44.0, 42.0, 36.0, 38.0, 37.0, 45.0, 39.0, 29.0, 27.0, 22.0, 32.0, 20.0, 22.0, 25.0, 10.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.30078125, -0.2908782958984375, -0.280975341796875, -0.2710723876953125, -0.26116943359375, -0.2512664794921875, -0.241363525390625, -0.2314605712890625, -0.2215576171875, -0.2116546630859375, -0.201751708984375, -0.1918487548828125, -0.18194580078125, -0.1720428466796875, -0.162139892578125, -0.1522369384765625, -0.142333984375, -0.1324310302734375, -0.122528076171875, -0.1126251220703125, -0.10272216796875, -0.0928192138671875, -0.082916259765625, -0.0730133056640625, -0.0631103515625, -0.0532073974609375, -0.043304443359375, -0.0334014892578125, -0.02349853515625, -0.0135955810546875, -0.003692626953125, 0.0062103271484375, 0.01611328125, 0.0260162353515625, 0.035919189453125, 0.0458221435546875, 0.05572509765625, 0.0656280517578125, 0.075531005859375, 0.0854339599609375, 0.0953369140625, 0.1052398681640625, 0.115142822265625, 0.1250457763671875, 0.13494873046875, 0.1448516845703125, 0.154754638671875, 0.1646575927734375, 0.174560546875, 0.1844635009765625, 0.194366455078125, 0.2042694091796875, 0.21417236328125, 0.2240753173828125, 0.233978271484375, 0.2438812255859375, 0.2537841796875, 0.2636871337890625, 0.273590087890625, 0.2834930419921875, 0.29339599609375, 0.3032989501953125, 0.313201904296875, 0.3231048583984375, 0.3330078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 9.0, 15.0, 16.0, 21.0, 37.0, 45.0, 60.0, 96.0, 107.0, 165.0, 240.0, 346.0, 555.0, 1017.0, 1836.0, 3791.0, 8321.0, 19462.0, 48327.0, 116566.0, 238338.0, 289657.0, 182067.0, 79428.0, 32382.0, 13249.0, 5961.0, 2796.0, 1404.0, 791.0, 450.0, 290.0, 198.0, 144.0, 106.0, 68.0, 43.0, 31.0, 33.0, 18.0, 13.0, 12.0, 13.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0806884765625, -0.07833480834960938, -0.07598114013671875, -0.07362747192382812, -0.0712738037109375, -0.06892013549804688, -0.06656646728515625, -0.06421279907226562, -0.061859130859375, -0.059505462646484375, -0.05715179443359375, -0.054798126220703125, -0.0524444580078125, -0.050090789794921875, -0.04773712158203125, -0.045383453369140625, -0.04302978515625, -0.040676116943359375, -0.03832244873046875, -0.035968780517578125, -0.0336151123046875, -0.031261444091796875, -0.02890777587890625, -0.026554107666015625, -0.024200439453125, -0.021846771240234375, -0.01949310302734375, -0.017139434814453125, -0.0147857666015625, -0.012432098388671875, -0.01007843017578125, -0.007724761962890625, -0.00537109375, -0.003017425537109375, -0.00066375732421875, 0.001689910888671875, 0.0040435791015625, 0.006397247314453125, 0.00875091552734375, 0.011104583740234375, 0.013458251953125, 0.015811920166015625, 0.01816558837890625, 0.020519256591796875, 0.0228729248046875, 0.025226593017578125, 0.02758026123046875, 0.029933929443359375, 0.03228759765625, 0.034641265869140625, 0.03699493408203125, 0.039348602294921875, 0.0417022705078125, 0.044055938720703125, 0.04640960693359375, 0.048763275146484375, 0.051116943359375, 0.053470611572265625, 0.05582427978515625, 0.058177947998046875, 0.0605316162109375, 0.06288528442382812, 0.06523895263671875, 0.06759262084960938, 0.0699462890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 5.0, 6.0, 8.0, 14.0, 14.0, 14.0, 21.0, 21.0, 24.0, 24.0, 30.0, 34.0, 35.0, 49.0, 40.0, 44.0, 40.0, 47.0, 45.0, 61.0, 53.0, 37.0, 39.0, 36.0, 42.0, 28.0, 33.0, 18.0, 25.0, 13.0, 14.0, 16.0, 13.0, 14.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.693145751953125, -0.66949462890625, -0.645843505859375, -0.6221923828125, -0.598541259765625, -0.57489013671875, -0.551239013671875, -0.527587890625, -0.503936767578125, -0.48028564453125, -0.456634521484375, -0.4329833984375, -0.409332275390625, -0.38568115234375, -0.362030029296875, -0.33837890625, -0.314727783203125, -0.29107666015625, -0.267425537109375, -0.2437744140625, -0.220123291015625, -0.19647216796875, -0.172821044921875, -0.149169921875, -0.125518798828125, -0.10186767578125, -0.078216552734375, -0.0545654296875, -0.030914306640625, -0.00726318359375, 0.016387939453125, 0.0400390625, 0.063690185546875, 0.08734130859375, 0.110992431640625, 0.1346435546875, 0.158294677734375, 0.18194580078125, 0.205596923828125, 0.229248046875, 0.252899169921875, 0.27655029296875, 0.300201416015625, 0.3238525390625, 0.347503662109375, 0.37115478515625, 0.394805908203125, 0.41845703125, 0.442108154296875, 0.46575927734375, 0.489410400390625, 0.5130615234375, 0.536712646484375, 0.56036376953125, 0.584014892578125, 0.607666015625, 0.631317138671875, 0.65496826171875, 0.678619384765625, 0.7022705078125, 0.725921630859375, 0.74957275390625, 0.773223876953125, 0.796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 8.0, 7.0, 14.0, 28.0, 45.0, 57.0, 117.0, 205.0, 363.0, 668.0, 1424.0, 3226.0, 8840.0, 29693.0, 122217.0, 401842.0, 348314.0, 95024.0, 23568.0, 7376.0, 2794.0, 1295.0, 616.0, 346.0, 183.0, 109.0, 59.0, 34.0, 24.0, 20.0, 6.0, 14.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04461669921875, -0.043261051177978516, -0.04190540313720703, -0.04054975509643555, -0.03919410705566406, -0.03783845901489258, -0.036482810974121094, -0.03512716293334961, -0.033771514892578125, -0.03241586685180664, -0.031060218811035156, -0.029704570770263672, -0.028348922729492188, -0.026993274688720703, -0.02563762664794922, -0.024281978607177734, -0.02292633056640625, -0.021570682525634766, -0.02021503448486328, -0.018859386444091797, -0.017503738403320312, -0.016148090362548828, -0.014792442321777344, -0.01343679428100586, -0.012081146240234375, -0.01072549819946289, -0.009369850158691406, -0.008014202117919922, -0.0066585540771484375, -0.005302906036376953, -0.003947257995605469, -0.0025916099548339844, -0.0012359619140625, 0.00011968612670898438, 0.0014753341674804688, 0.002830982208251953, 0.0041866302490234375, 0.005542278289794922, 0.006897926330566406, 0.00825357437133789, 0.009609222412109375, 0.01096487045288086, 0.012320518493652344, 0.013676166534423828, 0.015031814575195312, 0.016387462615966797, 0.01774311065673828, 0.019098758697509766, 0.02045440673828125, 0.021810054779052734, 0.02316570281982422, 0.024521350860595703, 0.025876998901367188, 0.027232646942138672, 0.028588294982910156, 0.02994394302368164, 0.031299591064453125, 0.03265523910522461, 0.034010887145996094, 0.03536653518676758, 0.03672218322753906, 0.03807783126831055, 0.03943347930908203, 0.040789127349853516, 0.042144775390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 12.0, 7.0, 9.0, 23.0, 28.0, 30.0, 52.0, 43.0, 67.0, 57.0, 68.0, 77.0, 67.0, 71.0, 75.0, 72.0, 46.0, 34.0, 37.0, 38.0, 27.0, 18.0, 14.0, 9.0, 3.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5533529222011566e-05, -1.5033408999443054e-05, -1.4533288776874542e-05, -1.403316855430603e-05, -1.3533048331737518e-05, -1.3032928109169006e-05, -1.2532807886600494e-05, -1.2032687664031982e-05, -1.153256744146347e-05, -1.1032447218894958e-05, -1.0532326996326447e-05, -1.0032206773757935e-05, -9.532086551189423e-06, -9.03196632862091e-06, -8.531846106052399e-06, -8.031725883483887e-06, -7.531605660915375e-06, -7.031485438346863e-06, -6.531365215778351e-06, -6.031244993209839e-06, -5.531124770641327e-06, -5.031004548072815e-06, -4.530884325504303e-06, -4.030764102935791e-06, -3.530643880367279e-06, -3.030523657798767e-06, -2.530403435230255e-06, -2.030283212661743e-06, -1.5301629900932312e-06, -1.0300427675247192e-06, -5.299225449562073e-07, -2.9802322387695312e-08, 4.7031790018081665e-07, 9.704381227493286e-07, 1.4705583453178406e-06, 1.9706785678863525e-06, 2.4707987904548645e-06, 2.9709190130233765e-06, 3.4710392355918884e-06, 3.9711594581604e-06, 4.471279680728912e-06, 4.971399903297424e-06, 5.471520125865936e-06, 5.971640348434448e-06, 6.47176057100296e-06, 6.971880793571472e-06, 7.472001016139984e-06, 7.972121238708496e-06, 8.472241461277008e-06, 8.97236168384552e-06, 9.472481906414032e-06, 9.972602128982544e-06, 1.0472722351551056e-05, 1.0972842574119568e-05, 1.147296279668808e-05, 1.1973083019256592e-05, 1.2473203241825104e-05, 1.2973323464393616e-05, 1.3473443686962128e-05, 1.397356390953064e-05, 1.4473684132099152e-05, 1.4973804354667664e-05, 1.5473924577236176e-05, 1.5974044799804688e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 13.0, 7.0, 8.0, 10.0, 13.0, 24.0, 27.0, 53.0, 61.0, 75.0, 119.0, 191.0, 265.0, 444.0, 738.0, 1553.0, 3151.0, 7388.0, 20451.0, 63694.0, 205962.0, 402738.0, 230457.0, 72356.0, 23173.0, 8148.0, 3445.0, 1705.0, 828.0, 508.0, 292.0, 189.0, 135.0, 94.0, 58.0, 42.0, 35.0, 28.0, 18.0, 8.0, 12.0, 8.0, 10.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.041107177734375, -0.039844512939453125, -0.03858184814453125, -0.037319183349609375, -0.0360565185546875, -0.034793853759765625, -0.03353118896484375, -0.032268524169921875, -0.031005859375, -0.029743194580078125, -0.02848052978515625, -0.027217864990234375, -0.0259552001953125, -0.024692535400390625, -0.02342987060546875, -0.022167205810546875, -0.020904541015625, -0.019641876220703125, -0.01837921142578125, -0.017116546630859375, -0.0158538818359375, -0.014591217041015625, -0.01332855224609375, -0.012065887451171875, -0.01080322265625, -0.009540557861328125, -0.00827789306640625, -0.007015228271484375, -0.0057525634765625, -0.004489898681640625, -0.00322723388671875, -0.001964569091796875, -0.000701904296875, 0.000560760498046875, 0.00182342529296875, 0.003086090087890625, 0.0043487548828125, 0.005611419677734375, 0.00687408447265625, 0.008136749267578125, 0.0093994140625, 0.010662078857421875, 0.01192474365234375, 0.013187408447265625, 0.0144500732421875, 0.015712738037109375, 0.01697540283203125, 0.018238067626953125, 0.019500732421875, 0.020763397216796875, 0.02202606201171875, 0.023288726806640625, 0.0245513916015625, 0.025814056396484375, 0.02707672119140625, 0.028339385986328125, 0.02960205078125, 0.030864715576171875, 0.03212738037109375, 0.033390045166015625, 0.0346527099609375, 0.035915374755859375, 0.03717803955078125, 0.038440704345703125, 0.039703369140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 8.0, 15.0, 21.0, 22.0, 27.0, 41.0, 46.0, 37.0, 39.0, 61.0, 56.0, 62.0, 68.0, 58.0, 60.0, 61.0, 51.0, 33.0, 50.0, 34.0, 23.0, 25.0, 15.0, 16.0, 10.0, 9.0, 6.0, 4.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00968170166015625, -0.009288549423217773, -0.008895397186279297, -0.00850224494934082, -0.008109092712402344, -0.007715940475463867, -0.007322788238525391, -0.006929636001586914, -0.0065364837646484375, -0.006143331527709961, -0.005750179290771484, -0.005357027053833008, -0.004963874816894531, -0.004570722579956055, -0.004177570343017578, -0.0037844181060791016, -0.003391265869140625, -0.0029981136322021484, -0.002604961395263672, -0.0022118091583251953, -0.0018186569213867188, -0.0014255046844482422, -0.0010323524475097656, -0.0006392002105712891, -0.0002460479736328125, 0.00014710426330566406, 0.0005402565002441406, 0.0009334087371826172, 0.0013265609741210938, 0.0017197132110595703, 0.002112865447998047, 0.0025060176849365234, 0.002899169921875, 0.0032923221588134766, 0.003685474395751953, 0.00407862663269043, 0.004471778869628906, 0.004864931106567383, 0.005258083343505859, 0.005651235580444336, 0.0060443878173828125, 0.006437540054321289, 0.006830692291259766, 0.007223844528198242, 0.007616996765136719, 0.008010149002075195, 0.008403301239013672, 0.008796453475952148, 0.009189605712890625, 0.009582757949829102, 0.009975910186767578, 0.010369062423706055, 0.010762214660644531, 0.011155366897583008, 0.011548519134521484, 0.011941671371459961, 0.012334823608398438, 0.012727975845336914, 0.01312112808227539, 0.013514280319213867, 0.013907432556152344, 0.01430058479309082, 0.014693737030029297, 0.015086889266967773, 0.01548004150390625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 13.0, 18.0, 31.0, 54.0, 80.0, 119.0, 137.0, 166.0, 142.0, 93.0, 67.0, 30.0, 18.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.830352246761322, -0.802791953086853, -0.775231659412384, -0.747671365737915, -0.7201110124588013, -0.692550778388977, -0.6649904251098633, -0.6374301314353943, -0.6098698377609253, -0.5823095440864563, -0.5547492504119873, -0.5271889567375183, -0.49962863326072693, -0.47206833958625793, -0.44450801610946655, -0.41694772243499756, -0.38938742876052856, -0.36182713508605957, -0.3342668414115906, -0.3067065179347992, -0.2791462242603302, -0.2515859305858612, -0.22402562201023102, -0.19646531343460083, -0.16890501976013184, -0.14134472608566284, -0.11378441751003265, -0.08622411638498306, -0.05866381525993347, -0.031103521585464478, -0.0035432130098342896, 0.0240170955657959, 0.05157744884490967, 0.07913774996995926, 0.10669805109500885, 0.13425835967063904, 0.16181865334510803, 0.18937894701957703, 0.21693925559520721, 0.2444995641708374, 0.2720598578453064, 0.2996201515197754, 0.3271804451942444, 0.35474076867103577, 0.38230106234550476, 0.40986135601997375, 0.43742167949676514, 0.46498197317123413, 0.4925422668457031, 0.5201025605201721, 0.5476628541946411, 0.5752231478691101, 0.6027834415435791, 0.6303437948226929, 0.6579040884971619, 0.6854643821716309, 0.7130246758460999, 0.7405849695205688, 0.7681452631950378, 0.7957055568695068, 0.8232659101486206, 0.8508261442184448, 0.8783864974975586, 0.9059467911720276, 0.9335070848464966]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 9.0, 4.0, 6.0, 16.0, 14.0, 7.0, 19.0, 21.0, 15.0, 23.0, 21.0, 29.0, 31.0, 33.0, 37.0, 35.0, 42.0, 46.0, 37.0, 46.0, 51.0, 47.0, 39.0, 39.0, 37.0, 47.0, 36.0, 24.0, 31.0, 24.0, 17.0, 19.0, 12.0, 14.0, 16.0, 12.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30832287669181824, -0.2980031967163086, -0.28768354654312134, -0.2773638963699341, -0.26704421639442444, -0.2567245364189148, -0.24640488624572754, -0.2360852211713791, -0.22576555609703064, -0.2154458910226822, -0.20512622594833374, -0.1948065608739853, -0.18448689579963684, -0.1741672307252884, -0.16384756565093994, -0.1535279005765915, -0.14320823550224304, -0.1328885704278946, -0.12256890535354614, -0.11224924027919769, -0.10192957520484924, -0.0916099101305008, -0.08129024505615234, -0.0709705799818039, -0.060650914907455444, -0.050331249833106995, -0.040011584758758545, -0.029691919684410095, -0.019372254610061646, -0.009052589535713196, 0.001267075538635254, 0.011586740612983704, 0.021906375885009766, 0.032226040959358215, 0.042545706033706665, 0.052865371108055115, 0.06318503618240356, 0.07350470125675201, 0.08382436633110046, 0.09414403140544891, 0.10446369647979736, 0.11478336155414581, 0.12510302662849426, 0.1354226917028427, 0.14574235677719116, 0.1560620218515396, 0.16638168692588806, 0.1767013520002365, 0.18702101707458496, 0.1973406821489334, 0.20766034722328186, 0.2179800122976303, 0.22829967737197876, 0.2386193424463272, 0.24893900752067566, 0.2592586874961853, 0.26957833766937256, 0.2798979878425598, 0.29021766781806946, 0.3005373477935791, 0.31085699796676636, 0.3211766481399536, 0.33149632811546326, 0.3418160080909729, 0.35213565826416016]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 12.0, 15.0, 18.0, 26.0, 59.0, 78.0, 140.0, 197.0, 285.0, 586.0, 1002.0, 1893.0, 3630.0, 7239.0, 14951.0, 34291.0, 87687.0, 287252.0, 403923.0, 122534.0, 44832.0, 19209.0, 9009.0, 4471.0, 2262.0, 1269.0, 697.0, 376.0, 192.0, 141.0, 97.0, 59.0, 38.0, 35.0, 18.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31453895568847656, -0.3055915832519531, -0.2966442108154297, -0.28769683837890625, -0.2787494659423828, -0.2698020935058594, -0.26085472106933594, -0.2519073486328125, -0.24295997619628906, -0.23401260375976562, -0.2250652313232422, -0.21611785888671875, -0.2071704864501953, -0.19822311401367188, -0.18927574157714844, -0.180328369140625, -0.17138099670410156, -0.16243362426757812, -0.1534862518310547, -0.14453887939453125, -0.1355915069580078, -0.12664413452148438, -0.11769676208496094, -0.1087493896484375, -0.09980201721191406, -0.09085464477539062, -0.08190727233886719, -0.07295989990234375, -0.06401252746582031, -0.055065155029296875, -0.04611778259277344, -0.03717041015625, -0.028223037719726562, -0.019275665283203125, -0.010328292846679688, -0.00138092041015625, 0.0075664520263671875, 0.016513824462890625, 0.025461196899414062, 0.0344085693359375, 0.04335594177246094, 0.052303314208984375, 0.06125068664550781, 0.07019805908203125, 0.07914543151855469, 0.08809280395507812, 0.09704017639160156, 0.105987548828125, 0.11493492126464844, 0.12388229370117188, 0.1328296661376953, 0.14177703857421875, 0.1507244110107422, 0.15967178344726562, 0.16861915588378906, 0.1775665283203125, 0.18651390075683594, 0.19546127319335938, 0.2044086456298828, 0.21335601806640625, 0.2223033905029297, 0.23125076293945312, 0.24019813537597656, 0.2491455078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 9.0, 16.0, 7.0, 16.0, 15.0, 21.0, 20.0, 22.0, 19.0, 29.0, 34.0, 37.0, 28.0, 36.0, 35.0, 38.0, 37.0, 38.0, 49.0, 42.0, 44.0, 33.0, 42.0, 34.0, 47.0, 24.0, 27.0, 21.0, 23.0, 23.0, 14.0, 13.0, 21.0, 9.0, 12.0, 5.0, 2.0, 9.0, 7.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57373046875, -0.5545272827148438, -0.5353240966796875, -0.5161209106445312, -0.496917724609375, -0.47771453857421875, -0.4585113525390625, -0.43930816650390625, -0.42010498046875, -0.40090179443359375, -0.3816986083984375, -0.36249542236328125, -0.343292236328125, -0.32408905029296875, -0.3048858642578125, -0.28568267822265625, -0.2664794921875, -0.24727630615234375, -0.2280731201171875, -0.20886993408203125, -0.189666748046875, -0.17046356201171875, -0.1512603759765625, -0.13205718994140625, -0.11285400390625, -0.09365081787109375, -0.0744476318359375, -0.05524444580078125, -0.036041259765625, -0.01683807373046875, 0.0023651123046875, 0.02156829833984375, 0.040771484375, 0.05997467041015625, 0.0791778564453125, 0.09838104248046875, 0.117584228515625, 0.13678741455078125, 0.1559906005859375, 0.17519378662109375, 0.19439697265625, 0.21360015869140625, 0.2328033447265625, 0.25200653076171875, 0.271209716796875, 0.29041290283203125, 0.3096160888671875, 0.32881927490234375, 0.3480224609375, 0.36722564697265625, 0.3864288330078125, 0.40563201904296875, 0.424835205078125, 0.44403839111328125, 0.4632415771484375, 0.48244476318359375, 0.50164794921875, 0.5208511352539062, 0.5400543212890625, 0.5592575073242188, 0.578460693359375, 0.5976638793945312, 0.6168670654296875, 0.6360702514648438, 0.6552734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 10.0, 6.0, 15.0, 18.0, 24.0, 45.0, 68.0, 96.0, 136.0, 267.0, 591.0, 2423.0, 21864.0, 696857.0, 310877.0, 12430.0, 1671.0, 521.0, 241.0, 142.0, 93.0, 43.0, 35.0, 18.0, 18.0, 14.0, 9.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0517578125, -1.0216140747070312, -0.9914703369140625, -0.9613265991210938, -0.931182861328125, -0.9010391235351562, -0.8708953857421875, -0.8407516479492188, -0.81060791015625, -0.7804641723632812, -0.7503204345703125, -0.7201766967773438, -0.690032958984375, -0.6598892211914062, -0.6297454833984375, -0.5996017456054688, -0.5694580078125, -0.5393142700195312, -0.5091705322265625, -0.47902679443359375, -0.448883056640625, -0.41873931884765625, -0.3885955810546875, -0.35845184326171875, -0.32830810546875, -0.29816436767578125, -0.2680206298828125, -0.23787689208984375, -0.207733154296875, -0.17758941650390625, -0.1474456787109375, -0.11730194091796875, -0.087158203125, -0.05701446533203125, -0.0268707275390625, 0.00327301025390625, 0.033416748046875, 0.06356048583984375, 0.0937042236328125, 0.12384796142578125, 0.15399169921875, 0.18413543701171875, 0.2142791748046875, 0.24442291259765625, 0.274566650390625, 0.30471038818359375, 0.3348541259765625, 0.36499786376953125, 0.3951416015625, 0.42528533935546875, 0.4554290771484375, 0.48557281494140625, 0.515716552734375, 0.5458602905273438, 0.5760040283203125, 0.6061477661132812, 0.63629150390625, 0.6664352416992188, 0.6965789794921875, 0.7267227172851562, 0.756866455078125, 0.7870101928710938, 0.8171539306640625, 0.8472976684570312, 0.87744140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 6.0, 6.0, 7.0, 15.0, 12.0, 12.0, 15.0, 13.0, 26.0, 20.0, 30.0, 38.0, 36.0, 43.0, 49.0, 32.0, 52.0, 41.0, 44.0, 39.0, 41.0, 46.0, 55.0, 35.0, 50.0, 34.0, 29.0, 23.0, 21.0, 22.0, 17.0, 22.0, 10.0, 13.0, 4.0, 4.0, 4.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0], "bins": [-0.9736328125, -0.9471435546875, -0.920654296875, -0.8941650390625, -0.86767578125, -0.8411865234375, -0.814697265625, -0.7882080078125, -0.76171875, -0.7352294921875, -0.708740234375, -0.6822509765625, -0.65576171875, -0.6292724609375, -0.602783203125, -0.5762939453125, -0.5498046875, -0.5233154296875, -0.496826171875, -0.4703369140625, -0.44384765625, -0.4173583984375, -0.390869140625, -0.3643798828125, -0.337890625, -0.3114013671875, -0.284912109375, -0.2584228515625, -0.23193359375, -0.2054443359375, -0.178955078125, -0.1524658203125, -0.1259765625, -0.0994873046875, -0.072998046875, -0.0465087890625, -0.02001953125, 0.0064697265625, 0.032958984375, 0.0594482421875, 0.0859375, 0.1124267578125, 0.138916015625, 0.1654052734375, 0.19189453125, 0.2183837890625, 0.244873046875, 0.2713623046875, 0.2978515625, 0.3243408203125, 0.350830078125, 0.3773193359375, 0.40380859375, 0.4302978515625, 0.456787109375, 0.4832763671875, 0.509765625, 0.5362548828125, 0.562744140625, 0.5892333984375, 0.61572265625, 0.6422119140625, 0.668701171875, 0.6951904296875, 0.7216796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 15.0, 24.0, 44.0, 75.0, 154.0, 267.0, 611.0, 2062.0, 11138.0, 268824.0, 737544.0, 23060.0, 3045.0, 838.0, 394.0, 189.0, 84.0, 52.0, 35.0, 21.0, 18.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.330322265625, -0.3197174072265625, -0.309112548828125, -0.2985076904296875, -0.28790283203125, -0.2772979736328125, -0.266693115234375, -0.2560882568359375, -0.2454833984375, -0.2348785400390625, -0.224273681640625, -0.2136688232421875, -0.20306396484375, -0.1924591064453125, -0.181854248046875, -0.1712493896484375, -0.16064453125, -0.1500396728515625, -0.139434814453125, -0.1288299560546875, -0.11822509765625, -0.1076202392578125, -0.097015380859375, -0.0864105224609375, -0.0758056640625, -0.0652008056640625, -0.054595947265625, -0.0439910888671875, -0.03338623046875, -0.0227813720703125, -0.012176513671875, -0.0015716552734375, 0.009033203125, 0.0196380615234375, 0.030242919921875, 0.0408477783203125, 0.05145263671875, 0.0620574951171875, 0.072662353515625, 0.0832672119140625, 0.0938720703125, 0.1044769287109375, 0.115081787109375, 0.1256866455078125, 0.13629150390625, 0.1468963623046875, 0.157501220703125, 0.1681060791015625, 0.1787109375, 0.1893157958984375, 0.199920654296875, 0.2105255126953125, 0.22113037109375, 0.2317352294921875, 0.242340087890625, 0.2529449462890625, 0.2635498046875, 0.2741546630859375, 0.284759521484375, 0.2953643798828125, 0.30596923828125, 0.3165740966796875, 0.327178955078125, 0.3377838134765625, 0.348388671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 2.0, 8.0, 12.0, 4.0, 20.0, 18.0, 28.0, 40.0, 52.0, 83.0, 87.0, 126.0, 125.0, 109.0, 81.0, 43.0, 38.0, 24.0, 19.0, 12.0, 14.0, 10.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.002716064453125e-05, -1.9253231585025787e-05, -1.8479302525520325e-05, -1.7705373466014862e-05, -1.69314444065094e-05, -1.6157515347003937e-05, -1.5383586287498474e-05, -1.4609657227993011e-05, -1.3835728168487549e-05, -1.3061799108982086e-05, -1.2287870049476624e-05, -1.1513940989971161e-05, -1.0740011930465698e-05, -9.966082870960236e-06, -9.192153811454773e-06, -8.41822475194931e-06, -7.644295692443848e-06, -6.870366632938385e-06, -6.096437573432922e-06, -5.32250851392746e-06, -4.548579454421997e-06, -3.7746503949165344e-06, -3.0007213354110718e-06, -2.226792275905609e-06, -1.4528632164001465e-06, -6.789341568946838e-07, 9.499490261077881e-08, 8.689239621162415e-07, 1.642853021621704e-06, 2.4167820811271667e-06, 3.1907111406326294e-06, 3.964640200138092e-06, 4.738569259643555e-06, 5.512498319149017e-06, 6.28642737865448e-06, 7.060356438159943e-06, 7.834285497665405e-06, 8.608214557170868e-06, 9.38214361667633e-06, 1.0156072676181793e-05, 1.0930001735687256e-05, 1.1703930795192719e-05, 1.2477859854698181e-05, 1.3251788914203644e-05, 1.4025717973709106e-05, 1.4799647033214569e-05, 1.5573576092720032e-05, 1.6347505152225494e-05, 1.7121434211730957e-05, 1.789536327123642e-05, 1.8669292330741882e-05, 1.9443221390247345e-05, 2.0217150449752808e-05, 2.099107950925827e-05, 2.1765008568763733e-05, 2.2538937628269196e-05, 2.3312866687774658e-05, 2.408679574728012e-05, 2.4860724806785583e-05, 2.5634653866291046e-05, 2.640858292579651e-05, 2.718251198530197e-05, 2.7956441044807434e-05, 2.8730370104312897e-05, 2.950429916381836e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 8.0, 6.0, 9.0, 16.0, 25.0, 42.0, 57.0, 137.0, 208.0, 368.0, 749.0, 2019.0, 7919.0, 117654.0, 865814.0, 45675.0, 4956.0, 1526.0, 611.0, 301.0, 173.0, 93.0, 68.0, 36.0, 16.0, 17.0, 6.0, 12.0, 5.0, 7.0, 3.0, 0.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2836723327636719, -0.27291107177734375, -0.2621498107910156, -0.2513885498046875, -0.24062728881835938, -0.22986602783203125, -0.21910476684570312, -0.208343505859375, -0.19758224487304688, -0.18682098388671875, -0.17605972290039062, -0.1652984619140625, -0.15453720092773438, -0.14377593994140625, -0.13301467895507812, -0.12225341796875, -0.11149215698242188, -0.10073089599609375, -0.08996963500976562, -0.0792083740234375, -0.06844711303710938, -0.05768585205078125, -0.046924591064453125, -0.036163330078125, -0.025402069091796875, -0.01464080810546875, -0.003879547119140625, 0.0068817138671875, 0.017642974853515625, 0.02840423583984375, 0.039165496826171875, 0.0499267578125, 0.060688018798828125, 0.07144927978515625, 0.08221054077148438, 0.0929718017578125, 0.10373306274414062, 0.11449432373046875, 0.12525558471679688, 0.136016845703125, 0.14677810668945312, 0.15753936767578125, 0.16830062866210938, 0.1790618896484375, 0.18982315063476562, 0.20058441162109375, 0.21134567260742188, 0.22210693359375, 0.23286819458007812, 0.24362945556640625, 0.2543907165527344, 0.2651519775390625, 0.2759132385253906, 0.28667449951171875, 0.2974357604980469, 0.308197021484375, 0.3189582824707031, 0.32971954345703125, 0.3404808044433594, 0.3512420654296875, 0.3620033264160156, 0.37276458740234375, 0.3835258483886719, 0.394287109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 15.0, 13.0, 26.0, 28.0, 43.0, 80.0, 92.0, 128.0, 141.0, 128.0, 78.0, 68.0, 42.0, 44.0, 17.0, 10.0, 11.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.13730716705322266, -0.1337451934814453, -0.13018321990966797, -0.12662124633789062, -0.12305927276611328, -0.11949729919433594, -0.1159353256225586, -0.11237335205078125, -0.1088113784790039, -0.10524940490722656, -0.10168743133544922, -0.09812545776367188, -0.09456348419189453, -0.09100151062011719, -0.08743953704833984, -0.0838775634765625, -0.08031558990478516, -0.07675361633300781, -0.07319164276123047, -0.06962966918945312, -0.06606769561767578, -0.06250572204589844, -0.058943748474121094, -0.05538177490234375, -0.051819801330566406, -0.04825782775878906, -0.04469585418701172, -0.041133880615234375, -0.03757190704345703, -0.03400993347167969, -0.030447959899902344, -0.026885986328125, -0.023324012756347656, -0.019762039184570312, -0.01620006561279297, -0.012638092041015625, -0.009076118469238281, -0.0055141448974609375, -0.0019521713256835938, 0.00160980224609375, 0.005171775817871094, 0.008733749389648438, 0.012295722961425781, 0.015857696533203125, 0.01941967010498047, 0.022981643676757812, 0.026543617248535156, 0.0301055908203125, 0.033667564392089844, 0.03722953796386719, 0.04079151153564453, 0.044353485107421875, 0.04791545867919922, 0.05147743225097656, 0.055039405822753906, 0.05860137939453125, 0.062163352966308594, 0.06572532653808594, 0.06928730010986328, 0.07284927368164062, 0.07641124725341797, 0.07997322082519531, 0.08353519439697266, 0.08709716796875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 10.0, 17.0, 30.0, 52.0, 86.0, 144.0, 194.0, 209.0, 127.0, 73.0, 33.0, 19.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3770989179611206, -1.3074686527252197, -1.2378385066986084, -1.1682082414627075, -1.0985779762268066, -1.0289478302001953, -0.9593175649642944, -0.8896872997283936, -0.8200570940971375, -0.7504268884658813, -0.6807966232299805, -0.6111664175987244, -0.5415362119674683, -0.4719059467315674, -0.4022757411003113, -0.3326455056667328, -0.2630152702331543, -0.1933850347995758, -0.12375481426715851, -0.05412459373474121, 0.01550564169883728, 0.08513587713241577, 0.15476608276367188, 0.22439631819725037, 0.29402655363082886, 0.36365678906440735, 0.43328702449798584, 0.5029172301292419, 0.572547435760498, 0.6421777009963989, 0.711807906627655, 0.7814381122589111, 0.8510684967041016, 0.9206987023353577, 0.9903289675712585, 1.0599591732025146, 1.1295894384384155, 1.1992197036743164, 1.2688498497009277, 1.3384801149368286, 1.4081103801727295, 1.4777406454086304, 1.5473707914352417, 1.6170010566711426, 1.6866313219070435, 1.7562615871429443, 1.8258917331695557, 1.8955219984054565, 1.9651521444320679, 2.0347824096679688, 2.10441255569458, 2.1740427017211914, 2.243673086166382, 2.313303232192993, 2.3829336166381836, 2.452563762664795, 2.5221939086914062, 2.5918240547180176, 2.661454439163208, 2.7310845851898193, 2.8007147312164307, 2.870345115661621, 2.9399752616882324, 3.0096054077148438, 3.079235792160034]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 8.0, 13.0, 17.0, 10.0, 14.0, 19.0, 27.0, 25.0, 20.0, 34.0, 33.0, 37.0, 38.0, 35.0, 38.0, 41.0, 44.0, 43.0, 43.0, 46.0, 39.0, 37.0, 38.0, 41.0, 33.0, 32.0, 23.0, 18.0, 21.0, 12.0, 22.0, 15.0, 15.0, 14.0, 12.0, 7.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.158236026763916, -1.1192200183868408, -1.080203890800476, -1.0411878824234009, -1.0021718740463257, -0.9631558060646057, -0.9241397380828857, -0.8851237297058105, -0.8461077213287354, -0.8070916533470154, -0.7680756449699402, -0.7290595769882202, -0.690043568611145, -0.651027500629425, -0.6120114326477051, -0.5729954242706299, -0.5339793562889099, -0.49496331810951233, -0.45594727993011475, -0.4169312119483948, -0.3779152035713196, -0.3388991355895996, -0.299883097410202, -0.26086705923080444, -0.22185102105140686, -0.18283498287200928, -0.1438189446926117, -0.10480289161205292, -0.06578685343265533, -0.02677081525325775, 0.012245237827301025, 0.05126127600669861, 0.09027731418609619, 0.12929335236549377, 0.16830939054489136, 0.20732544362545013, 0.24634148180484772, 0.2853575348854065, 0.3243735730648041, 0.36338961124420166, 0.40240564942359924, 0.4414216876029968, 0.4804377257823944, 0.519453763961792, 0.558469831943512, 0.5974858403205872, 0.6365019083023071, 0.6755179166793823, 0.7145339846611023, 0.7535500526428223, 0.7925660610198975, 0.8315821290016174, 0.8705981373786926, 0.9096142053604126, 0.9486302137374878, 0.9876462817192078, 1.0266623497009277, 1.065678358078003, 1.1046944856643677, 1.1437104940414429, 1.182726502418518, 1.2217425107955933, 1.260758638381958, 1.2997746467590332, 1.3387906551361084]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 18.0, 26.0, 63.0, 78.0, 141.0, 264.0, 581.0, 1299.0, 3818.0, 14855.0, 104714.0, 1224940.0, 2498569.0, 303719.0, 30990.0, 6540.0, 2020.0, 781.0, 349.0, 167.0, 118.0, 59.0, 42.0, 31.0, 22.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.8724441528320312, -0.8444976806640625, -0.8165512084960938, -0.788604736328125, -0.7606582641601562, -0.7327117919921875, -0.7047653198242188, -0.67681884765625, -0.6488723754882812, -0.6209259033203125, -0.5929794311523438, -0.565032958984375, -0.5370864868164062, -0.5091400146484375, -0.48119354248046875, -0.4532470703125, -0.42530059814453125, -0.3973541259765625, -0.36940765380859375, -0.341461181640625, -0.31351470947265625, -0.2855682373046875, -0.25762176513671875, -0.22967529296875, -0.20172882080078125, -0.1737823486328125, -0.14583587646484375, -0.117889404296875, -0.08994293212890625, -0.0619964599609375, -0.03404998779296875, -0.006103515625, 0.02184295654296875, 0.0497894287109375, 0.07773590087890625, 0.105682373046875, 0.13362884521484375, 0.1615753173828125, 0.18952178955078125, 0.21746826171875, 0.24541473388671875, 0.2733612060546875, 0.30130767822265625, 0.329254150390625, 0.35720062255859375, 0.3851470947265625, 0.41309356689453125, 0.4410400390625, 0.46898651123046875, 0.4969329833984375, 0.5248794555664062, 0.552825927734375, 0.5807723999023438, 0.6087188720703125, 0.6366653442382812, 0.66461181640625, 0.6925582885742188, 0.7205047607421875, 0.7484512329101562, 0.776397705078125, 0.8043441772460938, 0.8322906494140625, 0.8602371215820312, 0.88818359375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 6.0, 10.0, 6.0, 10.0, 8.0, 16.0, 17.0, 17.0, 20.0, 25.0, 19.0, 21.0, 29.0, 30.0, 54.0, 29.0, 45.0, 44.0, 35.0, 46.0, 42.0, 52.0, 35.0, 47.0, 35.0, 33.0, 38.0, 28.0, 27.0, 31.0, 22.0, 20.0, 13.0, 15.0, 15.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.435546875, -0.4223480224609375, -0.409149169921875, -0.3959503173828125, -0.38275146484375, -0.3695526123046875, -0.356353759765625, -0.3431549072265625, -0.3299560546875, -0.3167572021484375, -0.303558349609375, -0.2903594970703125, -0.27716064453125, -0.2639617919921875, -0.250762939453125, -0.2375640869140625, -0.224365234375, -0.2111663818359375, -0.197967529296875, -0.1847686767578125, -0.17156982421875, -0.1583709716796875, -0.145172119140625, -0.1319732666015625, -0.1187744140625, -0.1055755615234375, -0.092376708984375, -0.0791778564453125, -0.06597900390625, -0.0527801513671875, -0.039581298828125, -0.0263824462890625, -0.01318359375, 1.52587890625e-05, 0.013214111328125, 0.0264129638671875, 0.03961181640625, 0.0528106689453125, 0.066009521484375, 0.0792083740234375, 0.0924072265625, 0.1056060791015625, 0.118804931640625, 0.1320037841796875, 0.14520263671875, 0.1584014892578125, 0.171600341796875, 0.1847991943359375, 0.197998046875, 0.2111968994140625, 0.224395751953125, 0.2375946044921875, 0.25079345703125, 0.2639923095703125, 0.277191162109375, 0.2903900146484375, 0.3035888671875, 0.3167877197265625, 0.329986572265625, 0.3431854248046875, 0.35638427734375, 0.3695831298828125, 0.382781982421875, 0.3959808349609375, 0.4091796875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 5.0, 7.0, 8.0, 23.0, 32.0, 45.0, 71.0, 108.0, 197.0, 403.0, 911.0, 2615.0, 10420.0, 73120.0, 1918974.0, 2092384.0, 78789.0, 11244.0, 2873.0, 1008.0, 448.0, 218.0, 110.0, 92.0, 59.0, 44.0, 20.0, 7.0, 8.0, 5.0, 6.0, 8.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7812652587890625, -0.750030517578125, -0.7187957763671875, -0.68756103515625, -0.6563262939453125, -0.625091552734375, -0.5938568115234375, -0.5626220703125, -0.5313873291015625, -0.500152587890625, -0.4689178466796875, -0.43768310546875, -0.4064483642578125, -0.375213623046875, -0.3439788818359375, -0.312744140625, -0.2815093994140625, -0.250274658203125, -0.2190399169921875, -0.18780517578125, -0.1565704345703125, -0.125335693359375, -0.0941009521484375, -0.0628662109375, -0.0316314697265625, -0.000396728515625, 0.0308380126953125, 0.06207275390625, 0.0933074951171875, 0.124542236328125, 0.1557769775390625, 0.18701171875, 0.2182464599609375, 0.249481201171875, 0.2807159423828125, 0.31195068359375, 0.3431854248046875, 0.374420166015625, 0.4056549072265625, 0.4368896484375, 0.4681243896484375, 0.499359130859375, 0.5305938720703125, 0.56182861328125, 0.5930633544921875, 0.624298095703125, 0.6555328369140625, 0.686767578125, 0.7180023193359375, 0.749237060546875, 0.7804718017578125, 0.81170654296875, 0.8429412841796875, 0.874176025390625, 0.9054107666015625, 0.9366455078125, 0.9678802490234375, 0.999114990234375, 1.0303497314453125, 1.06158447265625, 1.0928192138671875, 1.124053955078125, 1.1552886962890625, 1.1865234375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 2.0, 2.0, 7.0, 9.0, 6.0, 9.0, 17.0, 32.0, 34.0, 46.0, 63.0, 73.0, 143.0, 210.0, 275.0, 450.0, 568.0, 545.0, 473.0, 345.0, 249.0, 150.0, 124.0, 68.0, 47.0, 32.0, 30.0, 26.0, 13.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2627696990966797, -0.2555198669433594, -0.24827003479003906, -0.24102020263671875, -0.23377037048339844, -0.22652053833007812, -0.2192707061767578, -0.2120208740234375, -0.2047710418701172, -0.19752120971679688, -0.19027137756347656, -0.18302154541015625, -0.17577171325683594, -0.16852188110351562, -0.1612720489501953, -0.154022216796875, -0.1467723846435547, -0.13952255249023438, -0.13227272033691406, -0.12502288818359375, -0.11777305603027344, -0.11052322387695312, -0.10327339172363281, -0.0960235595703125, -0.08877372741699219, -0.08152389526367188, -0.07427406311035156, -0.06702423095703125, -0.05977439880371094, -0.052524566650390625, -0.04527473449707031, -0.03802490234375, -0.030775070190429688, -0.023525238037109375, -0.016275405883789062, -0.00902557373046875, -0.0017757415771484375, 0.005474090576171875, 0.012723922729492188, 0.0199737548828125, 0.027223587036132812, 0.034473419189453125, 0.04172325134277344, 0.04897308349609375, 0.05622291564941406, 0.06347274780273438, 0.07072257995605469, 0.077972412109375, 0.08522224426269531, 0.09247207641601562, 0.09972190856933594, 0.10697174072265625, 0.11422157287597656, 0.12147140502929688, 0.1287212371826172, 0.1359710693359375, 0.1432209014892578, 0.15047073364257812, 0.15772056579589844, 0.16497039794921875, 0.17222023010253906, 0.17947006225585938, 0.1867198944091797, 0.1939697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 14.0, 16.0, 27.0, 46.0, 77.0, 104.0, 131.0, 141.0, 145.0, 103.0, 81.0, 46.0, 38.0, 18.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5321861505508423, -1.486545205116272, -1.4409042596817017, -1.3952631950378418, -1.3496222496032715, -1.3039813041687012, -1.2583403587341309, -1.2126994132995605, -1.1670584678649902, -1.12141752243042, -1.0757765769958496, -1.0301356315612793, -0.9844945669174194, -0.9388536214828491, -0.8932126760482788, -0.8475717306137085, -0.8019306659698486, -0.7562897205352783, -0.7106487154960632, -0.6650077700614929, -0.6193667650222778, -0.5737258195877075, -0.5280848741531372, -0.4824438989162445, -0.4368029236793518, -0.3911619484424591, -0.3455209732055664, -0.2998800277709961, -0.2542390525341034, -0.2085980772972107, -0.16295713186264038, -0.11731615662574768, -0.07167518138885498, -0.026034213602542877, 0.019606754183769226, 0.06524771451950073, 0.11088868975639343, 0.15652966499328613, 0.20217061042785645, 0.24781158566474915, 0.29345256090164185, 0.33909353613853455, 0.38473451137542725, 0.43037545680999756, 0.47601643204689026, 0.521657407283783, 0.5672983527183533, 0.6129393577575684, 0.6585803031921387, 0.704221248626709, 0.7498622536659241, 0.7955031991004944, 0.8411442041397095, 0.8867851495742798, 0.9324260950088501, 0.9780670404434204, 1.0237081050872803, 1.0693490505218506, 1.114989995956421, 1.1606309413909912, 1.206272006034851, 1.2519129514694214, 1.2975538969039917, 1.343194842338562, 1.3888357877731323]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 4.0, 4.0, 12.0, 10.0, 14.0, 15.0, 15.0, 19.0, 30.0, 26.0, 25.0, 35.0, 44.0, 37.0, 37.0, 34.0, 40.0, 34.0, 52.0, 46.0, 34.0, 37.0, 42.0, 34.0, 44.0, 35.0, 42.0, 26.0, 21.0, 25.0, 18.0, 11.0, 15.0, 14.0, 8.0, 7.0, 12.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4953939616680145, -0.4797289967536926, -0.4640640318393707, -0.44839906692504883, -0.43273407220840454, -0.41706913709640503, -0.40140414237976074, -0.38573917746543884, -0.37007421255111694, -0.35440924763679504, -0.33874428272247314, -0.32307931780815125, -0.30741435289382935, -0.29174935817718506, -0.27608439326286316, -0.26041942834854126, -0.24475446343421936, -0.22908949851989746, -0.21342453360557556, -0.19775955379009247, -0.18209458887577057, -0.16642962396144867, -0.15076464414596558, -0.13509967923164368, -0.11943471431732178, -0.10376974940299988, -0.08810477703809738, -0.07243980467319489, -0.056774839758872986, -0.041109874844551086, -0.02544490247964859, -0.009779930114746094, 0.005885064601898193, 0.02155003324151039, 0.03721500188112259, 0.05287997052073479, 0.06854493916034698, 0.08420990407466888, 0.09987487643957138, 0.11553984880447388, 0.13120481371879578, 0.14686977863311768, 0.16253474354743958, 0.17819972336292267, 0.19386468827724457, 0.20952965319156647, 0.22519463300704956, 0.24085959792137146, 0.25652456283569336, 0.27218952775001526, 0.28785449266433716, 0.30351945757865906, 0.31918442249298096, 0.33484941720962524, 0.35051438212394714, 0.36617934703826904, 0.38184431195259094, 0.39750927686691284, 0.41317424178123474, 0.42883920669555664, 0.4445042014122009, 0.46016913652420044, 0.4758341312408447, 0.4914990961551666, 0.5071640610694885]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 9.0, 8.0, 16.0, 22.0, 46.0, 88.0, 142.0, 315.0, 818.0, 2033.0, 6050.0, 23891.0, 155502.0, 656166.0, 168297.0, 25064.0, 6441.0, 2114.0, 815.0, 376.0, 154.0, 84.0, 35.0, 22.0, 9.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.22997283935546875, -0.2219085693359375, -0.21384429931640625, -0.205780029296875, -0.19771575927734375, -0.1896514892578125, -0.18158721923828125, -0.17352294921875, -0.16545867919921875, -0.1573944091796875, -0.14933013916015625, -0.141265869140625, -0.13320159912109375, -0.1251373291015625, -0.11707305908203125, -0.1090087890625, -0.10094451904296875, -0.0928802490234375, -0.08481597900390625, -0.076751708984375, -0.06868743896484375, -0.0606231689453125, -0.05255889892578125, -0.04449462890625, -0.03643035888671875, -0.0283660888671875, -0.02030181884765625, -0.012237548828125, -0.00417327880859375, 0.0038909912109375, 0.01195526123046875, 0.02001953125, 0.02808380126953125, 0.0361480712890625, 0.04421234130859375, 0.052276611328125, 0.06034088134765625, 0.0684051513671875, 0.07646942138671875, 0.08453369140625, 0.09259796142578125, 0.1006622314453125, 0.10872650146484375, 0.116790771484375, 0.12485504150390625, 0.1329193115234375, 0.14098358154296875, 0.1490478515625, 0.15711212158203125, 0.1651763916015625, 0.17324066162109375, 0.181304931640625, 0.18936920166015625, 0.1974334716796875, 0.20549774169921875, 0.21356201171875, 0.22162628173828125, 0.2296905517578125, 0.23775482177734375, 0.245819091796875, 0.25388336181640625, 0.2619476318359375, 0.27001190185546875, 0.278076171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 8.0, 10.0, 18.0, 15.0, 16.0, 20.0, 22.0, 25.0, 37.0, 40.0, 47.0, 38.0, 64.0, 51.0, 43.0, 40.0, 59.0, 53.0, 44.0, 51.0, 49.0, 43.0, 28.0, 32.0, 26.0, 17.0, 17.0, 11.0, 9.0, 12.0, 11.0, 3.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4306640625, -0.41888427734375, -0.4071044921875, -0.39532470703125, -0.383544921875, -0.37176513671875, -0.3599853515625, -0.34820556640625, -0.33642578125, -0.32464599609375, -0.3128662109375, -0.30108642578125, -0.289306640625, -0.27752685546875, -0.2657470703125, -0.25396728515625, -0.2421875, -0.23040771484375, -0.2186279296875, -0.20684814453125, -0.195068359375, -0.18328857421875, -0.1715087890625, -0.15972900390625, -0.14794921875, -0.13616943359375, -0.1243896484375, -0.11260986328125, -0.100830078125, -0.08905029296875, -0.0772705078125, -0.06549072265625, -0.0537109375, -0.04193115234375, -0.0301513671875, -0.01837158203125, -0.006591796875, 0.00518798828125, 0.0169677734375, 0.02874755859375, 0.04052734375, 0.05230712890625, 0.0640869140625, 0.07586669921875, 0.087646484375, 0.09942626953125, 0.1112060546875, 0.12298583984375, 0.134765625, 0.14654541015625, 0.1583251953125, 0.17010498046875, 0.181884765625, 0.19366455078125, 0.2054443359375, 0.21722412109375, 0.22900390625, 0.24078369140625, 0.2525634765625, 0.26434326171875, 0.276123046875, 0.28790283203125, 0.2996826171875, 0.31146240234375, 0.3232421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 16.0, 14.0, 24.0, 38.0, 46.0, 77.0, 124.0, 231.0, 409.0, 802.0, 1562.0, 3326.0, 8273.0, 24915.0, 90688.0, 317496.0, 401396.0, 141848.0, 37096.0, 11567.0, 4441.0, 1958.0, 963.0, 516.0, 258.0, 172.0, 82.0, 59.0, 50.0, 21.0, 18.0, 21.0, 7.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1143798828125, -0.11058807373046875, -0.1067962646484375, -0.10300445556640625, -0.099212646484375, -0.09542083740234375, -0.0916290283203125, -0.08783721923828125, -0.08404541015625, -0.08025360107421875, -0.0764617919921875, -0.07266998291015625, -0.068878173828125, -0.06508636474609375, -0.0612945556640625, -0.05750274658203125, -0.0537109375, -0.04991912841796875, -0.0461273193359375, -0.04233551025390625, -0.038543701171875, -0.03475189208984375, -0.0309600830078125, -0.02716827392578125, -0.02337646484375, -0.01958465576171875, -0.0157928466796875, -0.01200103759765625, -0.008209228515625, -0.00441741943359375, -0.0006256103515625, 0.00316619873046875, 0.0069580078125, 0.01074981689453125, 0.0145416259765625, 0.01833343505859375, 0.022125244140625, 0.02591705322265625, 0.0297088623046875, 0.03350067138671875, 0.03729248046875, 0.04108428955078125, 0.0448760986328125, 0.04866790771484375, 0.052459716796875, 0.05625152587890625, 0.0600433349609375, 0.06383514404296875, 0.067626953125, 0.07141876220703125, 0.0752105712890625, 0.07900238037109375, 0.082794189453125, 0.08658599853515625, 0.0903778076171875, 0.09416961669921875, 0.09796142578125, 0.10175323486328125, 0.1055450439453125, 0.10933685302734375, 0.113128662109375, 0.11692047119140625, 0.1207122802734375, 0.12450408935546875, 0.1282958984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 6.0, 8.0, 4.0, 7.0, 9.0, 20.0, 17.0, 13.0, 21.0, 25.0, 19.0, 26.0, 30.0, 30.0, 37.0, 34.0, 29.0, 49.0, 54.0, 35.0, 35.0, 37.0, 35.0, 50.0, 40.0, 41.0, 36.0, 39.0, 30.0, 28.0, 24.0, 18.0, 22.0, 18.0, 11.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 1.0, 10.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.60302734375, -0.5830841064453125, -0.563140869140625, -0.5431976318359375, -0.52325439453125, -0.5033111572265625, -0.483367919921875, -0.4634246826171875, -0.4434814453125, -0.4235382080078125, -0.403594970703125, -0.3836517333984375, -0.36370849609375, -0.3437652587890625, -0.323822021484375, -0.3038787841796875, -0.283935546875, -0.2639923095703125, -0.244049072265625, -0.2241058349609375, -0.20416259765625, -0.1842193603515625, -0.164276123046875, -0.1443328857421875, -0.1243896484375, -0.1044464111328125, -0.084503173828125, -0.0645599365234375, -0.04461669921875, -0.0246734619140625, -0.004730224609375, 0.0152130126953125, 0.03515625, 0.0550994873046875, 0.075042724609375, 0.0949859619140625, 0.11492919921875, 0.1348724365234375, 0.154815673828125, 0.1747589111328125, 0.1947021484375, 0.2146453857421875, 0.234588623046875, 0.2545318603515625, 0.27447509765625, 0.2944183349609375, 0.314361572265625, 0.3343048095703125, 0.354248046875, 0.3741912841796875, 0.394134521484375, 0.4140777587890625, 0.43402099609375, 0.4539642333984375, 0.473907470703125, 0.4938507080078125, 0.5137939453125, 0.5337371826171875, 0.553680419921875, 0.5736236572265625, 0.59356689453125, 0.6135101318359375, 0.633453369140625, 0.6533966064453125, 0.67333984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 15.0, 7.0, 11.0, 20.0, 26.0, 36.0, 62.0, 87.0, 131.0, 178.0, 307.0, 584.0, 1029.0, 1822.0, 3512.0, 7322.0, 16681.0, 46431.0, 201142.0, 533492.0, 165950.0, 40464.0, 15130.0, 6838.0, 3226.0, 1724.0, 912.0, 521.0, 292.0, 185.0, 134.0, 90.0, 55.0, 47.0, 20.0, 17.0, 19.0, 7.0, 6.0, 10.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.059656620025634766, -0.05775928497314453, -0.0558619499206543, -0.05396461486816406, -0.05206727981567383, -0.050169944763183594, -0.04827260971069336, -0.046375274658203125, -0.04447793960571289, -0.042580604553222656, -0.04068326950073242, -0.03878593444824219, -0.03688859939575195, -0.03499126434326172, -0.033093929290771484, -0.03119659423828125, -0.029299259185791016, -0.02740192413330078, -0.025504589080810547, -0.023607254028320312, -0.021709918975830078, -0.019812583923339844, -0.01791524887084961, -0.016017913818359375, -0.01412057876586914, -0.012223243713378906, -0.010325908660888672, -0.008428573608398438, -0.006531238555908203, -0.004633903503417969, -0.0027365684509277344, -0.0008392333984375, 0.0010581016540527344, 0.0029554367065429688, 0.004852771759033203, 0.0067501068115234375, 0.008647441864013672, 0.010544776916503906, 0.01244211196899414, 0.014339447021484375, 0.01623678207397461, 0.018134117126464844, 0.020031452178955078, 0.021928787231445312, 0.023826122283935547, 0.02572345733642578, 0.027620792388916016, 0.02951812744140625, 0.031415462493896484, 0.03331279754638672, 0.03521013259887695, 0.03710746765136719, 0.03900480270385742, 0.040902137756347656, 0.04279947280883789, 0.044696807861328125, 0.04659414291381836, 0.048491477966308594, 0.05038881301879883, 0.05228614807128906, 0.0541834831237793, 0.05608081817626953, 0.057978153228759766, 0.05987548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 20.0, 25.0, 52.0, 71.0, 121.0, 140.0, 165.0, 137.0, 77.0, 60.0, 33.0, 20.0, 10.0, 9.0, 8.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -3.001280128955841e-05, -2.8911978006362915e-05, -2.781115472316742e-05, -2.6710331439971924e-05, -2.5609508156776428e-05, -2.4508684873580933e-05, -2.3407861590385437e-05, -2.230703830718994e-05, -2.1206215023994446e-05, -2.010539174079895e-05, -1.9004568457603455e-05, -1.790374517440796e-05, -1.6802921891212463e-05, -1.5702098608016968e-05, -1.4601275324821472e-05, -1.3500452041625977e-05, -1.2399628758430481e-05, -1.1298805475234985e-05, -1.019798219203949e-05, -9.097158908843994e-06, -7.996335625648499e-06, -6.895512342453003e-06, -5.794689059257507e-06, -4.693865776062012e-06, -3.593042492866516e-06, -2.4922192096710205e-06, -1.391395926475525e-06, -2.905726432800293e-07, 8.102506399154663e-07, 1.911073923110962e-06, 3.0118972063064575e-06, 4.112720489501953e-06, 5.213543772697449e-06, 6.314367055892944e-06, 7.41519033908844e-06, 8.516013622283936e-06, 9.616836905479431e-06, 1.0717660188674927e-05, 1.1818483471870422e-05, 1.2919306755065918e-05, 1.4020130038261414e-05, 1.512095332145691e-05, 1.6221776604652405e-05, 1.73225998878479e-05, 1.8423423171043396e-05, 1.952424645423889e-05, 2.0625069737434387e-05, 2.1725893020629883e-05, 2.282671630382538e-05, 2.3927539587020874e-05, 2.502836287021637e-05, 2.6129186153411865e-05, 2.723000943660736e-05, 2.8330832719802856e-05, 2.9431656002998352e-05, 3.053247928619385e-05, 3.163330256938934e-05, 3.273412585258484e-05, 3.3834949135780334e-05, 3.493577241897583e-05, 3.6036595702171326e-05, 3.713741898536682e-05, 3.823824226856232e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 2.0, 10.0, 7.0, 11.0, 17.0, 19.0, 29.0, 30.0, 36.0, 48.0, 70.0, 140.0, 227.0, 428.0, 831.0, 1707.0, 3623.0, 8833.0, 24590.0, 99682.0, 549671.0, 283596.0, 48913.0, 15004.0, 5803.0, 2495.0, 1200.0, 619.0, 309.0, 204.0, 120.0, 70.0, 55.0, 33.0, 23.0, 18.0, 17.0, 11.0, 9.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.07830810546875, -0.07567787170410156, -0.07304763793945312, -0.07041740417480469, -0.06778717041015625, -0.06515693664550781, -0.06252670288085938, -0.05989646911621094, -0.0572662353515625, -0.05463600158691406, -0.052005767822265625, -0.04937553405761719, -0.04674530029296875, -0.04411506652832031, -0.041484832763671875, -0.03885459899902344, -0.036224365234375, -0.03359413146972656, -0.030963897705078125, -0.028333663940429688, -0.02570343017578125, -0.023073196411132812, -0.020442962646484375, -0.017812728881835938, -0.0151824951171875, -0.012552261352539062, -0.009922027587890625, -0.0072917938232421875, -0.00466156005859375, -0.0020313262939453125, 0.000598907470703125, 0.0032291412353515625, 0.005859375, 0.008489608764648438, 0.011119842529296875, 0.013750076293945312, 0.01638031005859375, 0.019010543823242188, 0.021640777587890625, 0.024271011352539062, 0.0269012451171875, 0.029531478881835938, 0.032161712646484375, 0.03479194641113281, 0.03742218017578125, 0.04005241394042969, 0.042682647705078125, 0.04531288146972656, 0.047943115234375, 0.05057334899902344, 0.053203582763671875, 0.05583381652832031, 0.05846405029296875, 0.06109428405761719, 0.06372451782226562, 0.06635475158691406, 0.0689849853515625, 0.07161521911621094, 0.07424545288085938, 0.07687568664550781, 0.07950592041015625, 0.08213615417480469, 0.08476638793945312, 0.08739662170410156, 0.09002685546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 9.0, 11.0, 5.0, 22.0, 22.0, 30.0, 61.0, 73.0, 95.0, 126.0, 117.0, 110.0, 99.0, 49.0, 40.0, 24.0, 16.0, 16.0, 14.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03289794921875, -0.031966447830200195, -0.03103494644165039, -0.030103445053100586, -0.02917194366455078, -0.028240442276000977, -0.027308940887451172, -0.026377439498901367, -0.025445938110351562, -0.024514436721801758, -0.023582935333251953, -0.02265143394470215, -0.021719932556152344, -0.02078843116760254, -0.019856929779052734, -0.01892542839050293, -0.017993927001953125, -0.01706242561340332, -0.016130924224853516, -0.015199422836303711, -0.014267921447753906, -0.013336420059204102, -0.012404918670654297, -0.011473417282104492, -0.010541915893554688, -0.009610414505004883, -0.008678913116455078, -0.0077474117279052734, -0.006815910339355469, -0.005884408950805664, -0.004952907562255859, -0.004021406173706055, -0.00308990478515625, -0.0021584033966064453, -0.0012269020080566406, -0.00029540061950683594, 0.0006361007690429688, 0.0015676021575927734, 0.002499103546142578, 0.003430604934692383, 0.0043621063232421875, 0.005293607711791992, 0.006225109100341797, 0.0071566104888916016, 0.008088111877441406, 0.009019613265991211, 0.009951114654541016, 0.01088261604309082, 0.011814117431640625, 0.01274561882019043, 0.013677120208740234, 0.014608621597290039, 0.015540122985839844, 0.01647162437438965, 0.017403125762939453, 0.018334627151489258, 0.019266128540039062, 0.020197629928588867, 0.021129131317138672, 0.022060632705688477, 0.02299213409423828, 0.023923635482788086, 0.02485513687133789, 0.025786638259887695, 0.0267181396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 23.0, 35.0, 58.0, 84.0, 137.0, 161.0, 154.0, 140.0, 80.0, 54.0, 40.0, 12.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9094133377075195, -0.8789806365966797, -0.8485479354858398, -0.818115234375, -0.7876825332641602, -0.7572498321533203, -0.7268170714378357, -0.6963843703269958, -0.665951669216156, -0.6355189681053162, -0.6050862669944763, -0.5746535658836365, -0.5442208051681519, -0.513788104057312, -0.48335540294647217, -0.4529227018356323, -0.4224900007247925, -0.39205729961395264, -0.3616245985031128, -0.33119186758995056, -0.3007591664791107, -0.2703264653682709, -0.23989374935626984, -0.2094610333442688, -0.17902833223342896, -0.1485956311225891, -0.11816291511058807, -0.08773020654916763, -0.05729749798774719, -0.02686479687690735, 0.003567919135093689, 0.03400063514709473, 0.06443333625793457, 0.09486604481935501, 0.12529875338077545, 0.1557314693927765, 0.18616417050361633, 0.21659687161445618, 0.24702958762645721, 0.27746230363845825, 0.3078950047492981, 0.33832770586013794, 0.3687604069709778, 0.39919313788414, 0.42962583899497986, 0.4600585401058197, 0.49049127101898193, 0.5209239721298218, 0.5513566732406616, 0.5817893743515015, 0.6122220754623413, 0.6426547765731812, 0.673087477684021, 0.7035201787948608, 0.7339529395103455, 0.7643856406211853, 0.7948183417320251, 0.825251042842865, 0.8556837439537048, 0.8861164450645447, 0.9165492057800293, 0.9469819068908691, 0.977414608001709, 1.0078473091125488, 1.0382800102233887]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 3.0, 13.0, 13.0, 14.0, 13.0, 23.0, 25.0, 20.0, 26.0, 40.0, 41.0, 38.0, 49.0, 40.0, 34.0, 55.0, 48.0, 48.0, 39.0, 38.0, 50.0, 48.0, 37.0, 35.0, 31.0, 28.0, 26.0, 22.0, 13.0, 13.0, 10.0, 11.0, 8.0, 13.0, 6.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.4059903621673584, -0.3953148126602173, -0.38463926315307617, -0.37396374344825745, -0.36328819394111633, -0.3526126444339752, -0.3419370949268341, -0.3312615752220154, -0.32058602571487427, -0.30991047620773315, -0.29923492670059204, -0.2885594069957733, -0.2778838574886322, -0.2672083079814911, -0.25653275847435, -0.24585722386837006, -0.23518167436122894, -0.22450612485408783, -0.2138305902481079, -0.2031550407409668, -0.19247950613498688, -0.18180395662784576, -0.17112842202186584, -0.16045287251472473, -0.14977732300758362, -0.1391017735004425, -0.12842623889446259, -0.11775068938732147, -0.10707515478134155, -0.09639960527420044, -0.08572406321763992, -0.0750485211610794, -0.06437298655509949, -0.05369744449853897, -0.043021902441978455, -0.03234635666012764, -0.021670814603567123, -0.010995272547006607, -0.00031972676515579224, 0.010355815291404724, 0.02103135734796524, 0.03170689940452576, 0.04238244146108627, 0.05305798724293709, 0.0637335330247879, 0.07440906763076782, 0.08508461713790894, 0.09576015919446945, 0.10643570125102997, 0.11711124330759048, 0.127786785364151, 0.13846233487129211, 0.14913786947727203, 0.15981341898441315, 0.17048895359039307, 0.18116450309753418, 0.1918400526046753, 0.2025156021118164, 0.21319113671779633, 0.22386668622493744, 0.23454222083091736, 0.24521777033805847, 0.2558933198451996, 0.2665688395500183, 0.2772443890571594]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 7.0, 5.0, 17.0, 15.0, 17.0, 48.0, 55.0, 90.0, 122.0, 229.0, 382.0, 671.0, 1518.0, 3745.0, 10316.0, 32350.0, 155245.0, 665793.0, 132404.0, 29469.0, 9566.0, 3439.0, 1495.0, 614.0, 350.0, 217.0, 136.0, 65.0, 60.0, 35.0, 18.0, 22.0, 12.0, 7.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.447265625, -0.43389892578125, -0.4205322265625, -0.40716552734375, -0.393798828125, -0.38043212890625, -0.3670654296875, -0.35369873046875, -0.34033203125, -0.32696533203125, -0.3135986328125, -0.30023193359375, -0.286865234375, -0.27349853515625, -0.2601318359375, -0.24676513671875, -0.2333984375, -0.22003173828125, -0.2066650390625, -0.19329833984375, -0.179931640625, -0.16656494140625, -0.1531982421875, -0.13983154296875, -0.12646484375, -0.11309814453125, -0.0997314453125, -0.08636474609375, -0.072998046875, -0.05963134765625, -0.0462646484375, -0.03289794921875, -0.01953125, -0.00616455078125, 0.0072021484375, 0.02056884765625, 0.033935546875, 0.04730224609375, 0.0606689453125, 0.07403564453125, 0.08740234375, 0.10076904296875, 0.1141357421875, 0.12750244140625, 0.140869140625, 0.15423583984375, 0.1676025390625, 0.18096923828125, 0.1943359375, 0.20770263671875, 0.2210693359375, 0.23443603515625, 0.247802734375, 0.26116943359375, 0.2745361328125, 0.28790283203125, 0.30126953125, 0.31463623046875, 0.3280029296875, 0.34136962890625, 0.354736328125, 0.36810302734375, 0.3814697265625, 0.39483642578125, 0.408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 4.0, 11.0, 11.0, 19.0, 20.0, 35.0, 20.0, 34.0, 33.0, 43.0, 46.0, 41.0, 50.0, 45.0, 47.0, 44.0, 52.0, 41.0, 56.0, 52.0, 44.0, 26.0, 39.0, 27.0, 26.0, 15.0, 20.0, 15.0, 17.0, 10.0, 15.0, 3.0, 12.0, 3.0, 0.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.7333450317382812, -0.7108306884765625, -0.6883163452148438, -0.665802001953125, -0.6432876586914062, -0.6207733154296875, -0.5982589721679688, -0.57574462890625, -0.5532302856445312, -0.5307159423828125, -0.5082015991210938, -0.485687255859375, -0.46317291259765625, -0.4406585693359375, -0.41814422607421875, -0.3956298828125, -0.37311553955078125, -0.3506011962890625, -0.32808685302734375, -0.305572509765625, -0.28305816650390625, -0.2605438232421875, -0.23802947998046875, -0.21551513671875, -0.19300079345703125, -0.1704864501953125, -0.14797210693359375, -0.125457763671875, -0.10294342041015625, -0.0804290771484375, -0.05791473388671875, -0.035400390625, -0.01288604736328125, 0.0096282958984375, 0.03214263916015625, 0.054656982421875, 0.07717132568359375, 0.0996856689453125, 0.12220001220703125, 0.14471435546875, 0.16722869873046875, 0.1897430419921875, 0.21225738525390625, 0.234771728515625, 0.25728607177734375, 0.2798004150390625, 0.30231475830078125, 0.3248291015625, 0.34734344482421875, 0.3698577880859375, 0.39237213134765625, 0.414886474609375, 0.43740081787109375, 0.4599151611328125, 0.48242950439453125, 0.50494384765625, 0.5274581909179688, 0.5499725341796875, 0.5724868774414062, 0.595001220703125, 0.6175155639648438, 0.6400299072265625, 0.6625442504882812, 0.68505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 1.0, 9.0, 3.0, 13.0, 3.0, 20.0, 23.0, 33.0, 30.0, 36.0, 60.0, 82.0, 113.0, 187.0, 292.0, 605.0, 1994.0, 16078.0, 631601.0, 381495.0, 12577.0, 1819.0, 565.0, 288.0, 156.0, 121.0, 86.0, 53.0, 46.0, 31.0, 19.0, 20.0, 16.0, 14.0, 11.0, 9.0, 13.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.9990081787109375, -0.967742919921875, -0.9364776611328125, -0.90521240234375, -0.8739471435546875, -0.842681884765625, -0.8114166259765625, -0.7801513671875, -0.7488861083984375, -0.717620849609375, -0.6863555908203125, -0.65509033203125, -0.6238250732421875, -0.592559814453125, -0.5612945556640625, -0.530029296875, -0.4987640380859375, -0.467498779296875, -0.4362335205078125, -0.40496826171875, -0.3737030029296875, -0.342437744140625, -0.3111724853515625, -0.2799072265625, -0.2486419677734375, -0.217376708984375, -0.1861114501953125, -0.15484619140625, -0.1235809326171875, -0.092315673828125, -0.0610504150390625, -0.02978515625, 0.0014801025390625, 0.032745361328125, 0.0640106201171875, 0.09527587890625, 0.1265411376953125, 0.157806396484375, 0.1890716552734375, 0.2203369140625, 0.2516021728515625, 0.282867431640625, 0.3141326904296875, 0.34539794921875, 0.3766632080078125, 0.407928466796875, 0.4391937255859375, 0.470458984375, 0.5017242431640625, 0.532989501953125, 0.5642547607421875, 0.59552001953125, 0.6267852783203125, 0.658050537109375, 0.6893157958984375, 0.7205810546875, 0.7518463134765625, 0.783111572265625, 0.8143768310546875, 0.84564208984375, 0.8769073486328125, 0.908172607421875, 0.9394378662109375, 0.970703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 9.0, 7.0, 4.0, 6.0, 8.0, 12.0, 9.0, 10.0, 16.0, 26.0, 27.0, 33.0, 32.0, 31.0, 42.0, 33.0, 54.0, 45.0, 43.0, 48.0, 43.0, 37.0, 52.0, 47.0, 31.0, 24.0, 35.0, 19.0, 27.0, 32.0, 30.0, 18.0, 17.0, 10.0, 15.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.75634765625, -0.732391357421875, -0.70843505859375, -0.684478759765625, -0.6605224609375, -0.636566162109375, -0.61260986328125, -0.588653564453125, -0.564697265625, -0.540740966796875, -0.51678466796875, -0.492828369140625, -0.4688720703125, -0.444915771484375, -0.42095947265625, -0.397003173828125, -0.373046875, -0.349090576171875, -0.32513427734375, -0.301177978515625, -0.2772216796875, -0.253265380859375, -0.22930908203125, -0.205352783203125, -0.181396484375, -0.157440185546875, -0.13348388671875, -0.109527587890625, -0.0855712890625, -0.061614990234375, -0.03765869140625, -0.013702392578125, 0.01025390625, 0.034210205078125, 0.05816650390625, 0.082122802734375, 0.1060791015625, 0.130035400390625, 0.15399169921875, 0.177947998046875, 0.201904296875, 0.225860595703125, 0.24981689453125, 0.273773193359375, 0.2977294921875, 0.321685791015625, 0.34564208984375, 0.369598388671875, 0.3935546875, 0.417510986328125, 0.44146728515625, 0.465423583984375, 0.4893798828125, 0.513336181640625, 0.53729248046875, 0.561248779296875, 0.585205078125, 0.609161376953125, 0.63311767578125, 0.657073974609375, 0.6810302734375, 0.704986572265625, 0.72894287109375, 0.752899169921875, 0.77685546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 15.0, 17.0, 23.0, 31.0, 48.0, 55.0, 88.0, 85.0, 146.0, 190.0, 319.0, 512.0, 878.0, 1603.0, 3271.0, 9185.0, 45765.0, 667927.0, 279945.0, 26064.0, 6465.0, 2600.0, 1293.0, 724.0, 408.0, 260.0, 187.0, 123.0, 83.0, 74.0, 35.0, 36.0, 18.0, 10.0, 16.0, 9.0, 12.0, 3.0, 3.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.173828125, -0.16800498962402344, -0.16218185424804688, -0.1563587188720703, -0.15053558349609375, -0.1447124481201172, -0.13888931274414062, -0.13306617736816406, -0.1272430419921875, -0.12141990661621094, -0.11559677124023438, -0.10977363586425781, -0.10395050048828125, -0.09812736511230469, -0.09230422973632812, -0.08648109436035156, -0.080657958984375, -0.07483482360839844, -0.06901168823242188, -0.06318855285644531, -0.05736541748046875, -0.05154228210449219, -0.045719146728515625, -0.03989601135253906, -0.0340728759765625, -0.028249740600585938, -0.022426605224609375, -0.016603469848632812, -0.01078033447265625, -0.0049571990966796875, 0.000865936279296875, 0.0066890716552734375, 0.01251220703125, 0.018335342407226562, 0.024158477783203125, 0.029981613159179688, 0.03580474853515625, 0.04162788391113281, 0.047451019287109375, 0.05327415466308594, 0.0590972900390625, 0.06492042541503906, 0.07074356079101562, 0.07656669616699219, 0.08238983154296875, 0.08821296691894531, 0.09403610229492188, 0.09985923767089844, 0.105682373046875, 0.11150550842285156, 0.11732864379882812, 0.12315177917480469, 0.12897491455078125, 0.1347980499267578, 0.14062118530273438, 0.14644432067871094, 0.1522674560546875, 0.15809059143066406, 0.16391372680664062, 0.1697368621826172, 0.17555999755859375, 0.1813831329345703, 0.18720626831054688, 0.19302940368652344, 0.1988525390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 6.0, 5.0, 7.0, 16.0, 20.0, 36.0, 82.0, 136.0, 207.0, 202.0, 107.0, 74.0, 31.0, 22.0, 10.0, 11.0, 5.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.522634506225586e-05, -3.4125521779060364e-05, -3.302469849586487e-05, -3.192387521266937e-05, -3.082305192947388e-05, -2.972222864627838e-05, -2.8621405363082886e-05, -2.752058207988739e-05, -2.6419758796691895e-05, -2.53189355134964e-05, -2.4218112230300903e-05, -2.3117288947105408e-05, -2.2016465663909912e-05, -2.0915642380714417e-05, -1.981481909751892e-05, -1.8713995814323425e-05, -1.761317253112793e-05, -1.6512349247932434e-05, -1.541152596473694e-05, -1.4310702681541443e-05, -1.3209879398345947e-05, -1.2109056115150452e-05, -1.1008232831954956e-05, -9.90740954875946e-06, -8.806586265563965e-06, -7.70576298236847e-06, -6.604939699172974e-06, -5.504116415977478e-06, -4.403293132781982e-06, -3.302469849586487e-06, -2.201646566390991e-06, -1.1008232831954956e-06, 0.0, 1.1008232831954956e-06, 2.201646566390991e-06, 3.302469849586487e-06, 4.403293132781982e-06, 5.504116415977478e-06, 6.604939699172974e-06, 7.70576298236847e-06, 8.806586265563965e-06, 9.90740954875946e-06, 1.1008232831954956e-05, 1.2109056115150452e-05, 1.3209879398345947e-05, 1.4310702681541443e-05, 1.541152596473694e-05, 1.6512349247932434e-05, 1.761317253112793e-05, 1.8713995814323425e-05, 1.981481909751892e-05, 2.0915642380714417e-05, 2.2016465663909912e-05, 2.3117288947105408e-05, 2.4218112230300903e-05, 2.53189355134964e-05, 2.6419758796691895e-05, 2.752058207988739e-05, 2.8621405363082886e-05, 2.972222864627838e-05, 3.082305192947388e-05, 3.192387521266937e-05, 3.302469849586487e-05, 3.4125521779060364e-05, 3.522634506225586e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 11.0, 19.0, 28.0, 24.0, 49.0, 71.0, 97.0, 158.0, 241.0, 388.0, 626.0, 1075.0, 2058.0, 3882.0, 10605.0, 64264.0, 779484.0, 157199.0, 17291.0, 5049.0, 2434.0, 1319.0, 830.0, 472.0, 308.0, 167.0, 137.0, 84.0, 49.0, 29.0, 28.0, 17.0, 16.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2291259765625, -0.2218914031982422, -0.21465682983398438, -0.20742225646972656, -0.20018768310546875, -0.19295310974121094, -0.18571853637695312, -0.1784839630126953, -0.1712493896484375, -0.1640148162841797, -0.15678024291992188, -0.14954566955566406, -0.14231109619140625, -0.13507652282714844, -0.12784194946289062, -0.12060737609863281, -0.113372802734375, -0.10613822937011719, -0.09890365600585938, -0.09166908264160156, -0.08443450927734375, -0.07719993591308594, -0.06996536254882812, -0.06273078918457031, -0.0554962158203125, -0.04826164245605469, -0.041027069091796875, -0.03379249572753906, -0.02655792236328125, -0.019323348999023438, -0.012088775634765625, -0.0048542022705078125, 0.00238037109375, 0.009614944458007812, 0.016849517822265625, 0.024084091186523438, 0.03131866455078125, 0.03855323791503906, 0.045787811279296875, 0.05302238464355469, 0.0602569580078125, 0.06749153137207031, 0.07472610473632812, 0.08196067810058594, 0.08919525146484375, 0.09642982482910156, 0.10366439819335938, 0.11089897155761719, 0.118133544921875, 0.1253681182861328, 0.13260269165039062, 0.13983726501464844, 0.14707183837890625, 0.15430641174316406, 0.16154098510742188, 0.1687755584716797, 0.1760101318359375, 0.1832447052001953, 0.19047927856445312, 0.19771385192871094, 0.20494842529296875, 0.21218299865722656, 0.21941757202148438, 0.2266521453857422, 0.23388671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 6.0, 19.0, 27.0, 36.0, 61.0, 106.0, 176.0, 203.0, 110.0, 86.0, 42.0, 35.0, 25.0, 16.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09182071685791016, -0.08854866027832031, -0.08527660369873047, -0.08200454711914062, -0.07873249053955078, -0.07546043395996094, -0.0721883773803711, -0.06891632080078125, -0.0656442642211914, -0.06237220764160156, -0.05910015106201172, -0.055828094482421875, -0.05255603790283203, -0.04928398132324219, -0.046011924743652344, -0.0427398681640625, -0.039467811584472656, -0.03619575500488281, -0.03292369842529297, -0.029651641845703125, -0.02637958526611328, -0.023107528686523438, -0.019835472106933594, -0.01656341552734375, -0.013291358947753906, -0.010019302368164062, -0.006747245788574219, -0.003475189208984375, -0.00020313262939453125, 0.0030689239501953125, 0.006340980529785156, 0.009613037109375, 0.012885093688964844, 0.016157150268554688, 0.01942920684814453, 0.022701263427734375, 0.02597332000732422, 0.029245376586914062, 0.032517433166503906, 0.03578948974609375, 0.039061546325683594, 0.04233360290527344, 0.04560565948486328, 0.048877716064453125, 0.05214977264404297, 0.05542182922363281, 0.058693885803222656, 0.0619659423828125, 0.06523799896240234, 0.06851005554199219, 0.07178211212158203, 0.07505416870117188, 0.07832622528076172, 0.08159828186035156, 0.0848703384399414, 0.08814239501953125, 0.0914144515991211, 0.09468650817871094, 0.09795856475830078, 0.10123062133789062, 0.10450267791748047, 0.10777473449707031, 0.11104679107666016, 0.11431884765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 12.0, 14.0, 31.0, 30.0, 44.0, 57.0, 74.0, 117.0, 94.0, 112.0, 98.0, 93.0, 73.0, 51.0, 34.0, 24.0, 20.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3720266819000244, -1.329236388206482, -1.286446213722229, -1.2436559200286865, -1.2008657455444336, -1.1580754518508911, -1.1152851581573486, -1.0724949836730957, -1.0297046899795532, -0.9869144558906555, -0.9441242218017578, -0.9013339281082153, -0.8585436940193176, -0.8157534599304199, -0.7729632258415222, -0.7301729917526245, -0.6873827576637268, -0.6445925235748291, -0.6018022894859314, -0.5590120553970337, -0.5162217617034912, -0.4734315276145935, -0.4306412935256958, -0.3878510296344757, -0.345060795545578, -0.3022705614566803, -0.2594802975654602, -0.2166900634765625, -0.1738998144865036, -0.1311095654964447, -0.088319331407547, -0.045529067516326904, -0.0027388334274291992, 0.0400514118373394, 0.082841657102108, 0.1256318986415863, 0.1684221476316452, 0.2112123966217041, 0.2540026307106018, 0.2967928946018219, 0.3395831286907196, 0.3823733627796173, 0.4251636266708374, 0.4679538607597351, 0.5107440948486328, 0.5535343885421753, 0.5963245630264282, 0.6391148567199707, 0.6819050908088684, 0.7246953248977661, 0.7674855589866638, 0.8102757930755615, 0.853066086769104, 0.8958563208580017, 0.9386465549468994, 0.9814368486404419, 1.0242270231246948, 1.0670173168182373, 1.1098074913024902, 1.1525977849960327, 1.1953879594802856, 1.2381782531738281, 1.280968427658081, 1.3237587213516235, 1.366549015045166]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 1.0, 3.0, 6.0, 10.0, 12.0, 14.0, 15.0, 11.0, 17.0, 21.0, 28.0, 26.0, 31.0, 23.0, 33.0, 45.0, 36.0, 42.0, 42.0, 38.0, 44.0, 35.0, 32.0, 43.0, 48.0, 39.0, 33.0, 35.0, 34.0, 29.0, 27.0, 28.0, 18.0, 20.0, 17.0, 15.0, 16.0, 8.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0769579410552979, -1.0398415327072144, -1.0027251243591309, -0.9656087756156921, -0.9284924268722534, -0.8913760185241699, -0.8542596101760864, -0.8171432018280029, -0.7800268530845642, -0.7429104447364807, -0.705794095993042, -0.6686776876449585, -0.631561279296875, -0.5944449305534363, -0.5573285222053528, -0.5202121734619141, -0.48309576511383057, -0.44597938656806946, -0.40886300802230835, -0.37174659967422485, -0.33463022112846375, -0.29751384258270264, -0.26039743423461914, -0.22328105568885803, -0.18616467714309692, -0.14904829859733582, -0.11193190515041351, -0.07481551915407181, -0.0376991331577301, -0.0005827546119689941, 0.03653363883495331, 0.07365003228187561, 0.11076641082763672, 0.14788278937339783, 0.18499918282032013, 0.22211557626724243, 0.25923195481300354, 0.29634833335876465, 0.33346474170684814, 0.37058112025260925, 0.40769749879837036, 0.44481387734413147, 0.4819302558898926, 0.5190466642379761, 0.5561630725860596, 0.5932794213294983, 0.6303958296775818, 0.6675121784210205, 0.704628586769104, 0.7417449951171875, 0.7788613438606262, 0.8159777522087097, 0.8530941009521484, 0.8902105093002319, 0.9273269176483154, 0.9644433259963989, 1.0015597343444824, 1.038676142692566, 1.0757925510406494, 1.1129088401794434, 1.1500252485275269, 1.1871416568756104, 1.2242580652236938, 1.2613744735717773, 1.2984907627105713]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 4.0, 16.0, 11.0, 16.0, 21.0, 37.0, 46.0, 31.0, 45.0, 70.0, 159.0, 492.0, 2987.0, 54056.0, 3617311.0, 507969.0, 9221.0, 1111.0, 247.0, 104.0, 72.0, 34.0, 44.0, 35.0, 21.0, 31.0, 19.0, 12.0, 8.0, 2.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.052734375, -1.9918670654296875, -1.930999755859375, -1.8701324462890625, -1.80926513671875, -1.7483978271484375, -1.687530517578125, -1.6266632080078125, -1.5657958984375, -1.5049285888671875, -1.444061279296875, -1.3831939697265625, -1.32232666015625, -1.2614593505859375, -1.200592041015625, -1.1397247314453125, -1.078857421875, -1.0179901123046875, -0.957122802734375, -0.8962554931640625, -0.83538818359375, -0.7745208740234375, -0.713653564453125, -0.6527862548828125, -0.5919189453125, -0.5310516357421875, -0.470184326171875, -0.4093170166015625, -0.34844970703125, -0.2875823974609375, -0.226715087890625, -0.1658477783203125, -0.10498046875, -0.0441131591796875, 0.016754150390625, 0.0776214599609375, 0.13848876953125, 0.1993560791015625, 0.260223388671875, 0.3210906982421875, 0.3819580078125, 0.4428253173828125, 0.503692626953125, 0.5645599365234375, 0.62542724609375, 0.6862945556640625, 0.747161865234375, 0.8080291748046875, 0.868896484375, 0.9297637939453125, 0.990631103515625, 1.0514984130859375, 1.11236572265625, 1.1732330322265625, 1.234100341796875, 1.2949676513671875, 1.3558349609375, 1.4167022705078125, 1.477569580078125, 1.5384368896484375, 1.59930419921875, 1.6601715087890625, 1.721038818359375, 1.7819061279296875, 1.8427734375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 12.0, 14.0, 19.0, 23.0, 24.0, 30.0, 29.0, 28.0, 41.0, 41.0, 46.0, 39.0, 53.0, 59.0, 44.0, 56.0, 64.0, 46.0, 42.0, 43.0, 43.0, 43.0, 27.0, 23.0, 16.0, 18.0, 16.0, 13.0, 11.0, 8.0, 4.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4729728698730469, -0.45742034912109375, -0.4418678283691406, -0.4263153076171875, -0.4107627868652344, -0.39521026611328125, -0.3796577453613281, -0.364105224609375, -0.3485527038574219, -0.33300018310546875, -0.3174476623535156, -0.3018951416015625, -0.2863426208496094, -0.27079010009765625, -0.2552375793457031, -0.23968505859375, -0.22413253784179688, -0.20858001708984375, -0.19302749633789062, -0.1774749755859375, -0.16192245483398438, -0.14636993408203125, -0.13081741333007812, -0.115264892578125, -0.09971237182617188, -0.08415985107421875, -0.06860733032226562, -0.0530548095703125, -0.037502288818359375, -0.02194976806640625, -0.006397247314453125, 0.0091552734375, 0.024707794189453125, 0.04026031494140625, 0.055812835693359375, 0.0713653564453125, 0.08691787719726562, 0.10247039794921875, 0.11802291870117188, 0.133575439453125, 0.14912796020507812, 0.16468048095703125, 0.18023300170898438, 0.1957855224609375, 0.21133804321289062, 0.22689056396484375, 0.24244308471679688, 0.25799560546875, 0.2735481262207031, 0.28910064697265625, 0.3046531677246094, 0.3202056884765625, 0.3357582092285156, 0.35131072998046875, 0.3668632507324219, 0.382415771484375, 0.3979682922363281, 0.41352081298828125, 0.4290733337402344, 0.4446258544921875, 0.4601783752441406, 0.47573089599609375, 0.4912834167480469, 0.5068359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 26.0, 26.0, 40.0, 76.0, 149.0, 325.0, 710.0, 2002.0, 8435.0, 86433.0, 3636868.0, 434598.0, 19168.0, 3464.0, 1049.0, 469.0, 204.0, 91.0, 50.0, 28.0, 20.0, 11.0, 7.0, 9.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.720703125, -1.673828125, -1.626953125, -1.580078125, -1.533203125, -1.486328125, -1.439453125, -1.392578125, -1.345703125, -1.298828125, -1.251953125, -1.205078125, -1.158203125, -1.111328125, -1.064453125, -1.017578125, -0.970703125, -0.923828125, -0.876953125, -0.830078125, -0.783203125, -0.736328125, -0.689453125, -0.642578125, -0.595703125, -0.548828125, -0.501953125, -0.455078125, -0.408203125, -0.361328125, -0.314453125, -0.267578125, -0.220703125, -0.173828125, -0.126953125, -0.080078125, -0.033203125, 0.013671875, 0.060546875, 0.107421875, 0.154296875, 0.201171875, 0.248046875, 0.294921875, 0.341796875, 0.388671875, 0.435546875, 0.482421875, 0.529296875, 0.576171875, 0.623046875, 0.669921875, 0.716796875, 0.763671875, 0.810546875, 0.857421875, 0.904296875, 0.951171875, 0.998046875, 1.044921875, 1.091796875, 1.138671875, 1.185546875, 1.232421875, 1.279296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 16.0, 14.0, 22.0, 27.0, 50.0, 67.0, 107.0, 187.0, 279.0, 493.0, 636.0, 717.0, 546.0, 349.0, 210.0, 113.0, 77.0, 55.0, 35.0, 23.0, 15.0, 7.0, 3.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.384033203125, -0.37421417236328125, -0.3643951416015625, -0.35457611083984375, -0.344757080078125, -0.33493804931640625, -0.3251190185546875, -0.31529998779296875, -0.30548095703125, -0.29566192626953125, -0.2858428955078125, -0.27602386474609375, -0.266204833984375, -0.25638580322265625, -0.2465667724609375, -0.23674774169921875, -0.2269287109375, -0.21710968017578125, -0.2072906494140625, -0.19747161865234375, -0.187652587890625, -0.17783355712890625, -0.1680145263671875, -0.15819549560546875, -0.14837646484375, -0.13855743408203125, -0.1287384033203125, -0.11891937255859375, -0.109100341796875, -0.09928131103515625, -0.0894622802734375, -0.07964324951171875, -0.06982421875, -0.06000518798828125, -0.0501861572265625, -0.04036712646484375, -0.030548095703125, -0.02072906494140625, -0.0109100341796875, -0.00109100341796875, 0.00872802734375, 0.01854705810546875, 0.0283660888671875, 0.03818511962890625, 0.048004150390625, 0.05782318115234375, 0.0676422119140625, 0.07746124267578125, 0.0872802734375, 0.09709930419921875, 0.1069183349609375, 0.11673736572265625, 0.126556396484375, 0.13637542724609375, 0.1461944580078125, 0.15601348876953125, 0.16583251953125, 0.17565155029296875, 0.1854705810546875, 0.19528961181640625, 0.205108642578125, 0.21492767333984375, 0.2247467041015625, 0.23456573486328125, 0.244384765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 13.0, 27.0, 52.0, 76.0, 86.0, 105.0, 128.0, 136.0, 127.0, 88.0, 56.0, 45.0, 26.0, 10.0, 6.0, 9.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.057590961456299, -2.0117831230163574, -1.9659751653671265, -1.920167326927185, -1.874359369277954, -1.8285515308380127, -1.7827436923980713, -1.7369357347488403, -1.6911277770996094, -1.645319938659668, -1.599511981010437, -1.5537041425704956, -1.5078961849212646, -1.4620883464813232, -1.4162805080413818, -1.3704725503921509, -1.3246647119522095, -1.278856873512268, -1.233048915863037, -1.1872410774230957, -1.1414331197738647, -1.0956252813339233, -1.0498173236846924, -1.004009485244751, -0.9582015872001648, -0.9123936891555786, -0.8665857911109924, -0.8207778930664062, -0.7749700546264648, -0.7291620969772339, -0.6833542585372925, -0.6375463604927063, -0.5917384624481201, -0.5459305644035339, -0.5001226663589478, -0.45431479811668396, -0.4085069000720978, -0.3626990020275116, -0.3168911337852478, -0.2710832357406616, -0.22527533769607544, -0.17946743965148926, -0.13365955650806427, -0.08785167336463928, -0.0420437753200531, 0.003764122724533081, 0.049571990966796875, 0.09537988901138306, 0.14118778705596924, 0.18699568510055542, 0.2328035682439804, 0.2786114513874054, 0.3244193494319916, 0.37022724747657776, 0.41603511571884155, 0.46184301376342773, 0.5076509118080139, 0.5534588098526001, 0.5992667078971863, 0.6450746059417725, 0.6908824443817139, 0.7366904020309448, 0.7824982404708862, 0.8283061385154724, 0.8741140365600586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 16.0, 10.0, 16.0, 34.0, 17.0, 19.0, 23.0, 20.0, 24.0, 30.0, 42.0, 41.0, 35.0, 38.0, 43.0, 32.0, 35.0, 33.0, 34.0, 39.0, 42.0, 37.0, 28.0, 31.0, 47.0, 26.0, 24.0, 28.0, 23.0, 28.0, 19.0, 19.0, 8.0, 6.0, 9.0, 6.0, 6.0, 5.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5137552618980408, -0.4969230890274048, -0.4800908863544464, -0.4632587134838104, -0.44642651081085205, -0.42959433794021606, -0.4127621650695801, -0.3959299921989441, -0.3790977895259857, -0.36226561665534973, -0.34543341398239136, -0.32860124111175537, -0.3117690682411194, -0.294936865568161, -0.278104692697525, -0.26127249002456665, -0.24444031715393066, -0.22760812938213348, -0.2107759416103363, -0.19394376873970032, -0.17711158096790314, -0.16027939319610596, -0.14344722032546997, -0.1266150325536728, -0.10978284478187561, -0.09295065701007843, -0.07611847668886185, -0.059286292642354965, -0.042454108595848083, -0.025621920824050903, -0.00878974050283432, 0.008042439818382263, 0.024874567985534668, 0.04170675203204155, 0.05853893607854843, 0.07537111639976501, 0.0922033041715622, 0.10903549194335938, 0.12586766481399536, 0.14269985258579254, 0.15953204035758972, 0.1763642281293869, 0.19319641590118408, 0.21002858877182007, 0.22686077654361725, 0.24369296431541443, 0.2605251371860504, 0.2773573398590088, 0.2941895127296448, 0.31102168560028076, 0.32785388827323914, 0.3446860611438751, 0.3615182638168335, 0.3783504366874695, 0.39518260955810547, 0.41201478242874146, 0.42884698510169983, 0.4456791579723358, 0.4625113606452942, 0.4793435335159302, 0.49617570638656616, 0.5130078792572021, 0.5298401117324829, 0.5466722846031189, 0.5635044574737549]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 54.0, 69.0, 119.0, 257.0, 602.0, 1671.0, 6031.0, 33947.0, 598491.0, 377202.0, 23076.0, 4584.0, 1398.0, 525.0, 214.0, 88.0, 53.0, 33.0, 32.0, 10.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37939453125, -0.363525390625, -0.34765625, -0.331787109375, -0.31591796875, -0.300048828125, -0.2841796875, -0.268310546875, -0.25244140625, -0.236572265625, -0.220703125, -0.204833984375, -0.18896484375, -0.173095703125, -0.1572265625, -0.141357421875, -0.12548828125, -0.109619140625, -0.09375, -0.077880859375, -0.06201171875, -0.046142578125, -0.0302734375, -0.014404296875, 0.00146484375, 0.017333984375, 0.033203125, 0.049072265625, 0.06494140625, 0.080810546875, 0.0966796875, 0.112548828125, 0.12841796875, 0.144287109375, 0.16015625, 0.176025390625, 0.19189453125, 0.207763671875, 0.2236328125, 0.239501953125, 0.25537109375, 0.271240234375, 0.287109375, 0.302978515625, 0.31884765625, 0.334716796875, 0.3505859375, 0.366455078125, 0.38232421875, 0.398193359375, 0.4140625, 0.429931640625, 0.44580078125, 0.461669921875, 0.4775390625, 0.493408203125, 0.50927734375, 0.525146484375, 0.541015625, 0.556884765625, 0.57275390625, 0.588623046875, 0.6044921875, 0.620361328125, 0.63623046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 6.0, 12.0, 9.0, 13.0, 24.0, 18.0, 24.0, 37.0, 35.0, 37.0, 46.0, 57.0, 46.0, 46.0, 52.0, 52.0, 52.0, 56.0, 45.0, 37.0, 56.0, 43.0, 41.0, 26.0, 31.0, 22.0, 22.0, 13.0, 12.0, 10.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3828125, -0.36733245849609375, -0.3518524169921875, -0.33637237548828125, -0.320892333984375, -0.30541229248046875, -0.2899322509765625, -0.27445220947265625, -0.25897216796875, -0.24349212646484375, -0.2280120849609375, -0.21253204345703125, -0.197052001953125, -0.18157196044921875, -0.1660919189453125, -0.15061187744140625, -0.1351318359375, -0.11965179443359375, -0.1041717529296875, -0.08869171142578125, -0.073211669921875, -0.05773162841796875, -0.0422515869140625, -0.02677154541015625, -0.01129150390625, 0.00418853759765625, 0.0196685791015625, 0.03514862060546875, 0.050628662109375, 0.06610870361328125, 0.0815887451171875, 0.09706878662109375, 0.112548828125, 0.12802886962890625, 0.1435089111328125, 0.15898895263671875, 0.174468994140625, 0.18994903564453125, 0.2054290771484375, 0.22090911865234375, 0.23638916015625, 0.25186920166015625, 0.2673492431640625, 0.28282928466796875, 0.298309326171875, 0.31378936767578125, 0.3292694091796875, 0.34474945068359375, 0.3602294921875, 0.37570953369140625, 0.3911895751953125, 0.40666961669921875, 0.422149658203125, 0.43762969970703125, 0.4531097412109375, 0.46858978271484375, 0.48406982421875, 0.49954986572265625, 0.5150299072265625, 0.5305099487304688, 0.545989990234375, 0.5614700317382812, 0.5769500732421875, 0.5924301147460938, 0.60791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 7.0, 18.0, 43.0, 53.0, 67.0, 101.0, 156.0, 272.0, 398.0, 738.0, 1222.0, 2235.0, 4453.0, 10070.0, 32382.0, 145275.0, 465817.0, 290053.0, 64592.0, 17034.0, 6359.0, 2995.0, 1635.0, 959.0, 607.0, 357.0, 208.0, 134.0, 91.0, 42.0, 44.0, 22.0, 23.0, 9.0, 13.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1790771484375, -0.17343521118164062, -0.16779327392578125, -0.16215133666992188, -0.1565093994140625, -0.15086746215820312, -0.14522552490234375, -0.13958358764648438, -0.133941650390625, -0.12829971313476562, -0.12265777587890625, -0.11701583862304688, -0.1113739013671875, -0.10573196411132812, -0.10009002685546875, -0.09444808959960938, -0.08880615234375, -0.08316421508789062, -0.07752227783203125, -0.07188034057617188, -0.0662384033203125, -0.060596466064453125, -0.05495452880859375, -0.049312591552734375, -0.043670654296875, -0.038028717041015625, -0.03238677978515625, -0.026744842529296875, -0.0211029052734375, -0.015460968017578125, -0.00981903076171875, -0.004177093505859375, 0.00146484375, 0.007106781005859375, 0.01274871826171875, 0.018390655517578125, 0.0240325927734375, 0.029674530029296875, 0.03531646728515625, 0.040958404541015625, 0.046600341796875, 0.052242279052734375, 0.05788421630859375, 0.06352615356445312, 0.0691680908203125, 0.07481002807617188, 0.08045196533203125, 0.08609390258789062, 0.09173583984375, 0.09737777709960938, 0.10301971435546875, 0.10866165161132812, 0.1143035888671875, 0.11994552612304688, 0.12558746337890625, 0.13122940063476562, 0.136871337890625, 0.14251327514648438, 0.14815521240234375, 0.15379714965820312, 0.1594390869140625, 0.16508102416992188, 0.17072296142578125, 0.17636489868164062, 0.1820068359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 9.0, 7.0, 9.0, 16.0, 23.0, 19.0, 12.0, 13.0, 19.0, 32.0, 28.0, 28.0, 43.0, 29.0, 40.0, 47.0, 40.0, 32.0, 40.0, 38.0, 39.0, 41.0, 40.0, 37.0, 36.0, 34.0, 29.0, 31.0, 21.0, 27.0, 19.0, 14.0, 14.0, 15.0, 12.0, 10.0, 9.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7900390625, -0.7660903930664062, -0.7421417236328125, -0.7181930541992188, -0.694244384765625, -0.6702957153320312, -0.6463470458984375, -0.6223983764648438, -0.59844970703125, -0.5745010375976562, -0.5505523681640625, -0.5266036987304688, -0.502655029296875, -0.47870635986328125, -0.4547576904296875, -0.43080902099609375, -0.4068603515625, -0.38291168212890625, -0.3589630126953125, -0.33501434326171875, -0.311065673828125, -0.28711700439453125, -0.2631683349609375, -0.23921966552734375, -0.21527099609375, -0.19132232666015625, -0.1673736572265625, -0.14342498779296875, -0.119476318359375, -0.09552764892578125, -0.0715789794921875, -0.04763031005859375, -0.023681640625, 0.00026702880859375, 0.0242156982421875, 0.04816436767578125, 0.072113037109375, 0.09606170654296875, 0.1200103759765625, 0.14395904541015625, 0.16790771484375, 0.19185638427734375, 0.2158050537109375, 0.23975372314453125, 0.263702392578125, 0.28765106201171875, 0.3115997314453125, 0.33554840087890625, 0.3594970703125, 0.38344573974609375, 0.4073944091796875, 0.43134307861328125, 0.455291748046875, 0.47924041748046875, 0.5031890869140625, 0.5271377563476562, 0.55108642578125, 0.5750350952148438, 0.5989837646484375, 0.6229324340820312, 0.646881103515625, 0.6708297729492188, 0.6947784423828125, 0.7187271118164062, 0.74267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 15.0, 18.0, 25.0, 34.0, 60.0, 137.0, 232.0, 454.0, 949.0, 2310.0, 6549.0, 29064.0, 435808.0, 526979.0, 33679.0, 7399.0, 2557.0, 1086.0, 554.0, 242.0, 148.0, 92.0, 58.0, 36.0, 24.0, 11.0, 7.0, 6.0, 8.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.15030860900878906, -0.14546585083007812, -0.1406230926513672, -0.13578033447265625, -0.1309375762939453, -0.12609481811523438, -0.12125205993652344, -0.1164093017578125, -0.11156654357910156, -0.10672378540039062, -0.10188102722167969, -0.09703826904296875, -0.09219551086425781, -0.08735275268554688, -0.08250999450683594, -0.077667236328125, -0.07282447814941406, -0.06798171997070312, -0.06313896179199219, -0.05829620361328125, -0.05345344543457031, -0.048610687255859375, -0.04376792907714844, -0.0389251708984375, -0.03408241271972656, -0.029239654541015625, -0.024396896362304688, -0.01955413818359375, -0.014711380004882812, -0.009868621826171875, -0.0050258636474609375, -0.00018310546875, 0.0046596527099609375, 0.009502410888671875, 0.014345169067382812, 0.01918792724609375, 0.024030685424804688, 0.028873443603515625, 0.03371620178222656, 0.0385589599609375, 0.04340171813964844, 0.048244476318359375, 0.05308723449707031, 0.05792999267578125, 0.06277275085449219, 0.06761550903320312, 0.07245826721191406, 0.077301025390625, 0.08214378356933594, 0.08698654174804688, 0.09182929992675781, 0.09667205810546875, 0.10151481628417969, 0.10635757446289062, 0.11120033264160156, 0.1160430908203125, 0.12088584899902344, 0.12572860717773438, 0.1305713653564453, 0.13541412353515625, 0.1402568817138672, 0.14509963989257812, 0.14994239807128906, 0.15478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 10.0, 23.0, 27.0, 58.0, 98.0, 206.0, 233.0, 164.0, 72.0, 48.0, 25.0, 14.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -6.046891212463379e-05, -5.84721565246582e-05, -5.647540092468262e-05, -5.447864532470703e-05, -5.2481889724731445e-05, -5.048513412475586e-05, -4.8488378524780273e-05, -4.649162292480469e-05, -4.44948673248291e-05, -4.2498111724853516e-05, -4.050135612487793e-05, -3.8504600524902344e-05, -3.650784492492676e-05, -3.451108932495117e-05, -3.2514333724975586e-05, -3.0517578125e-05, -2.8520822525024414e-05, -2.6524066925048828e-05, -2.4527311325073242e-05, -2.2530555725097656e-05, -2.053380012512207e-05, -1.8537044525146484e-05, -1.65402889251709e-05, -1.4543533325195312e-05, -1.2546777725219727e-05, -1.055002212524414e-05, -8.553266525268555e-06, -6.556510925292969e-06, -4.559755325317383e-06, -2.562999725341797e-06, -5.662441253662109e-07, 1.430511474609375e-06, 3.427267074584961e-06, 5.424022674560547e-06, 7.420778274536133e-06, 9.417533874511719e-06, 1.1414289474487305e-05, 1.341104507446289e-05, 1.5407800674438477e-05, 1.7404556274414062e-05, 1.940131187438965e-05, 2.1398067474365234e-05, 2.339482307434082e-05, 2.5391578674316406e-05, 2.7388334274291992e-05, 2.9385089874267578e-05, 3.1381845474243164e-05, 3.337860107421875e-05, 3.5375356674194336e-05, 3.737211227416992e-05, 3.936886787414551e-05, 4.1365623474121094e-05, 4.336237907409668e-05, 4.5359134674072266e-05, 4.735589027404785e-05, 4.935264587402344e-05, 5.1349401473999023e-05, 5.334615707397461e-05, 5.5342912673950195e-05, 5.733966827392578e-05, 5.933642387390137e-05, 6.133317947387695e-05, 6.332993507385254e-05, 6.532669067382812e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 4.0, 9.0, 14.0, 10.0, 24.0, 36.0, 48.0, 82.0, 155.0, 378.0, 993.0, 3303.0, 12288.0, 75478.0, 753149.0, 175154.0, 20167.0, 4916.0, 1423.0, 470.0, 194.0, 85.0, 60.0, 36.0, 21.0, 14.0, 11.0, 4.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174560546875, -0.16904640197753906, -0.16353225708007812, -0.1580181121826172, -0.15250396728515625, -0.1469898223876953, -0.14147567749023438, -0.13596153259277344, -0.1304473876953125, -0.12493324279785156, -0.11941909790039062, -0.11390495300292969, -0.10839080810546875, -0.10287666320800781, -0.09736251831054688, -0.09184837341308594, -0.086334228515625, -0.08082008361816406, -0.07530593872070312, -0.06979179382324219, -0.06427764892578125, -0.05876350402832031, -0.053249359130859375, -0.04773521423339844, -0.0422210693359375, -0.03670692443847656, -0.031192779541015625, -0.025678634643554688, -0.02016448974609375, -0.014650344848632812, -0.009136199951171875, -0.0036220550537109375, 0.00189208984375, 0.0074062347412109375, 0.012920379638671875, 0.018434524536132812, 0.02394866943359375, 0.029462814331054688, 0.034976959228515625, 0.04049110412597656, 0.0460052490234375, 0.05151939392089844, 0.057033538818359375, 0.06254768371582031, 0.06806182861328125, 0.07357597351074219, 0.07909011840820312, 0.08460426330566406, 0.090118408203125, 0.09563255310058594, 0.10114669799804688, 0.10666084289550781, 0.11217498779296875, 0.11768913269042969, 0.12320327758789062, 0.12871742248535156, 0.1342315673828125, 0.13974571228027344, 0.14525985717773438, 0.1507740020751953, 0.15628814697265625, 0.1618022918701172, 0.16731643676757812, 0.17283058166503906, 0.1783447265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 8.0, 6.0, 6.0, 12.0, 18.0, 17.0, 34.0, 41.0, 70.0, 105.0, 124.0, 132.0, 119.0, 89.0, 52.0, 50.0, 30.0, 20.0, 16.0, 12.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03448486328125, -0.033267974853515625, -0.03205108642578125, -0.030834197998046875, -0.0296173095703125, -0.028400421142578125, -0.02718353271484375, -0.025966644287109375, -0.024749755859375, -0.023532867431640625, -0.02231597900390625, -0.021099090576171875, -0.0198822021484375, -0.018665313720703125, -0.01744842529296875, -0.016231536865234375, -0.0150146484375, -0.013797760009765625, -0.01258087158203125, -0.011363983154296875, -0.0101470947265625, -0.008930206298828125, -0.00771331787109375, -0.006496429443359375, -0.005279541015625, -0.004062652587890625, -0.00284576416015625, -0.001628875732421875, -0.0004119873046875, 0.000804901123046875, 0.00202178955078125, 0.003238677978515625, 0.00445556640625, 0.005672454833984375, 0.00688934326171875, 0.008106231689453125, 0.0093231201171875, 0.010540008544921875, 0.01175689697265625, 0.012973785400390625, 0.014190673828125, 0.015407562255859375, 0.01662445068359375, 0.017841339111328125, 0.0190582275390625, 0.020275115966796875, 0.02149200439453125, 0.022708892822265625, 0.02392578125, 0.025142669677734375, 0.02635955810546875, 0.027576446533203125, 0.0287933349609375, 0.030010223388671875, 0.03122711181640625, 0.032444000244140625, 0.033660888671875, 0.034877777099609375, 0.03609466552734375, 0.037311553955078125, 0.0385284423828125, 0.039745330810546875, 0.04096221923828125, 0.042179107666015625, 0.04339599609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 8.0, 25.0, 44.0, 55.0, 62.0, 65.0, 81.0, 117.0, 110.0, 105.0, 80.0, 79.0, 57.0, 35.0, 25.0, 16.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8808908462524414, -0.856532633304596, -0.8321743607521057, -0.8078161478042603, -0.7834579348564148, -0.7590997219085693, -0.7347414493560791, -0.7103832364082336, -0.6860250234603882, -0.6616668105125427, -0.6373085379600525, -0.612950325012207, -0.5885921120643616, -0.5642338991165161, -0.5398756265640259, -0.5155174136161804, -0.4911591410636902, -0.46680089831352234, -0.4424426853656769, -0.41808444261550903, -0.3937262296676636, -0.3693679869174957, -0.3450097441673279, -0.3206515312194824, -0.2962932884693146, -0.27193504571914673, -0.24757683277130127, -0.22321859002113342, -0.19886036217212677, -0.17450213432312012, -0.15014389157295227, -0.12578566372394562, -0.10142743587493896, -0.07706920802593231, -0.05271097272634506, -0.028352737426757812, -0.00399450957775116, 0.020363718271255493, 0.04472196102142334, 0.06908018887042999, 0.09343841671943665, 0.1177966445684433, 0.14215487241744995, 0.1665131151676178, 0.19087134301662445, 0.2152295708656311, 0.23958781361579895, 0.2639460563659668, 0.28830426931381226, 0.3126625120639801, 0.33702072501182556, 0.3613789677619934, 0.38573718070983887, 0.4100954234600067, 0.43445366621017456, 0.45881187915802, 0.48317012190818787, 0.5075283646583557, 0.5318865776062012, 0.5562448501586914, 0.5806030631065369, 0.6049612760543823, 0.6293195486068726, 0.653677761554718, 0.6780359745025635]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 3.0, 13.0, 10.0, 22.0, 30.0, 17.0, 23.0, 27.0, 22.0, 29.0, 36.0, 36.0, 31.0, 32.0, 36.0, 53.0, 41.0, 29.0, 33.0, 37.0, 34.0, 31.0, 35.0, 45.0, 41.0, 36.0, 23.0, 25.0, 27.0, 20.0, 17.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 4.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32876482605934143, -0.31749704480171204, -0.30622926354408264, -0.29496151208877563, -0.28369373083114624, -0.27242594957351685, -0.26115816831588745, -0.24989038705825806, -0.23862262070178986, -0.22735483944416046, -0.21608707308769226, -0.20481929183006287, -0.19355151057243347, -0.18228374421596527, -0.17101596295833588, -0.15974819660186768, -0.14848041534423828, -0.1372126340866089, -0.12594486773014069, -0.11467708647251129, -0.1034093126654625, -0.0921415388584137, -0.0808737576007843, -0.0696059837937355, -0.05833820998668671, -0.04707043617963791, -0.03580265864729881, -0.024534881114959717, -0.01326710730791092, -0.0019993335008621216, 0.009268447756767273, 0.02053622156381607, 0.03180399537086487, 0.043071769177913666, 0.05433954671025276, 0.06560732424259186, 0.07687509804964066, 0.08814287185668945, 0.09941065311431885, 0.11067842692136765, 0.12194620072841644, 0.13321398198604584, 0.14448174834251404, 0.15574952960014343, 0.16701731085777283, 0.17828507721424103, 0.18955285847187042, 0.20082062482833862, 0.21208840608596802, 0.2233561873435974, 0.2346239537000656, 0.245891734957695, 0.2571595013141632, 0.2684272825717926, 0.279695063829422, 0.2909628450870514, 0.3022305965423584, 0.3134983777999878, 0.3247661590576172, 0.3360339403152466, 0.3473016917705536, 0.358569473028183, 0.3698372542858124, 0.3811050355434418, 0.39237281680107117]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 8.0, 12.0, 12.0, 20.0, 20.0, 45.0, 57.0, 86.0, 100.0, 179.0, 286.0, 409.0, 725.0, 1212.0, 2419.0, 4983.0, 11363.0, 29534.0, 97737.0, 484824.0, 307540.0, 67428.0, 22115.0, 8736.0, 3966.0, 2019.0, 1064.0, 550.0, 363.0, 235.0, 164.0, 115.0, 55.0, 59.0, 30.0, 19.0, 13.0, 20.0, 8.0, 8.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5160331726074219, -0.5003280639648438, -0.4846229553222656, -0.4689178466796875, -0.4532127380371094, -0.43750762939453125, -0.4218025207519531, -0.406097412109375, -0.3903923034667969, -0.37468719482421875, -0.3589820861816406, -0.3432769775390625, -0.3275718688964844, -0.31186676025390625, -0.2961616516113281, -0.28045654296875, -0.2647514343261719, -0.24904632568359375, -0.23334121704101562, -0.2176361083984375, -0.20193099975585938, -0.18622589111328125, -0.17052078247070312, -0.154815673828125, -0.13911056518554688, -0.12340545654296875, -0.10770034790039062, -0.0919952392578125, -0.07629013061523438, -0.06058502197265625, -0.044879913330078125, -0.0291748046875, -0.013469696044921875, 0.00223541259765625, 0.017940521240234375, 0.0336456298828125, 0.049350738525390625, 0.06505584716796875, 0.08076095581054688, 0.096466064453125, 0.11217117309570312, 0.12787628173828125, 0.14358139038085938, 0.1592864990234375, 0.17499160766601562, 0.19069671630859375, 0.20640182495117188, 0.22210693359375, 0.23781204223632812, 0.25351715087890625, 0.2692222595214844, 0.2849273681640625, 0.3006324768066406, 0.31633758544921875, 0.3320426940917969, 0.347747802734375, 0.3634529113769531, 0.37915802001953125, 0.3948631286621094, 0.4105682373046875, 0.4262733459472656, 0.44197845458984375, 0.4576835632324219, 0.473388671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 5.0, 6.0, 13.0, 10.0, 19.0, 23.0, 29.0, 30.0, 31.0, 49.0, 37.0, 43.0, 51.0, 56.0, 55.0, 55.0, 41.0, 56.0, 43.0, 45.0, 47.0, 30.0, 48.0, 35.0, 23.0, 26.0, 14.0, 21.0, 16.0, 10.0, 1.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8096694946289062, -0.7824249267578125, -0.7551803588867188, -0.727935791015625, -0.7006912231445312, -0.6734466552734375, -0.6462020874023438, -0.61895751953125, -0.5917129516601562, -0.5644683837890625, -0.5372238159179688, -0.509979248046875, -0.48273468017578125, -0.4554901123046875, -0.42824554443359375, -0.4010009765625, -0.37375640869140625, -0.3465118408203125, -0.31926727294921875, -0.292022705078125, -0.26477813720703125, -0.2375335693359375, -0.21028900146484375, -0.18304443359375, -0.15579986572265625, -0.1285552978515625, -0.10131072998046875, -0.074066162109375, -0.04682159423828125, -0.0195770263671875, 0.00766754150390625, 0.034912109375, 0.06215667724609375, 0.0894012451171875, 0.11664581298828125, 0.143890380859375, 0.17113494873046875, 0.1983795166015625, 0.22562408447265625, 0.25286865234375, 0.28011322021484375, 0.3073577880859375, 0.33460235595703125, 0.361846923828125, 0.38909149169921875, 0.4163360595703125, 0.44358062744140625, 0.4708251953125, 0.49806976318359375, 0.5253143310546875, 0.5525588989257812, 0.579803466796875, 0.6070480346679688, 0.6342926025390625, 0.6615371704101562, 0.68878173828125, 0.7160263061523438, 0.7432708740234375, 0.7705154418945312, 0.797760009765625, 0.8250045776367188, 0.8522491455078125, 0.8794937133789062, 0.90673828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 11.0, 12.0, 15.0, 19.0, 23.0, 44.0, 62.0, 99.0, 159.0, 331.0, 988.0, 5693.0, 118651.0, 897729.0, 21380.0, 2156.0, 561.0, 203.0, 140.0, 76.0, 49.0, 38.0, 22.0, 14.0, 10.0, 11.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7665252685546875, -1.711761474609375, -1.6569976806640625, -1.60223388671875, -1.5474700927734375, -1.492706298828125, -1.4379425048828125, -1.3831787109375, -1.3284149169921875, -1.273651123046875, -1.2188873291015625, -1.16412353515625, -1.1093597412109375, -1.054595947265625, -0.9998321533203125, -0.945068359375, -0.8903045654296875, -0.835540771484375, -0.7807769775390625, -0.72601318359375, -0.6712493896484375, -0.616485595703125, -0.5617218017578125, -0.5069580078125, -0.4521942138671875, -0.397430419921875, -0.3426666259765625, -0.28790283203125, -0.2331390380859375, -0.178375244140625, -0.1236114501953125, -0.06884765625, -0.0140838623046875, 0.040679931640625, 0.0954437255859375, 0.15020751953125, 0.2049713134765625, 0.259735107421875, 0.3144989013671875, 0.3692626953125, 0.4240264892578125, 0.478790283203125, 0.5335540771484375, 0.58831787109375, 0.6430816650390625, 0.697845458984375, 0.7526092529296875, 0.807373046875, 0.8621368408203125, 0.916900634765625, 0.9716644287109375, 1.02642822265625, 1.0811920166015625, 1.135955810546875, 1.1907196044921875, 1.2454833984375, 1.3002471923828125, 1.355010986328125, 1.4097747802734375, 1.46453857421875, 1.5193023681640625, 1.574066162109375, 1.6288299560546875, 1.68359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 7.0, 10.0, 3.0, 2.0, 7.0, 10.0, 11.0, 14.0, 27.0, 28.0, 28.0, 31.0, 35.0, 36.0, 37.0, 55.0, 53.0, 68.0, 60.0, 55.0, 42.0, 47.0, 42.0, 43.0, 40.0, 38.0, 33.0, 26.0, 20.0, 21.0, 8.0, 9.0, 18.0, 7.0, 8.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.08203125, -1.0514602661132812, -1.0208892822265625, -0.9903182983398438, -0.959747314453125, -0.9291763305664062, -0.8986053466796875, -0.8680343627929688, -0.83746337890625, -0.8068923950195312, -0.7763214111328125, -0.7457504272460938, -0.715179443359375, -0.6846084594726562, -0.6540374755859375, -0.6234664916992188, -0.5928955078125, -0.5623245239257812, -0.5317535400390625, -0.5011825561523438, -0.470611572265625, -0.44004058837890625, -0.4094696044921875, -0.37889862060546875, -0.34832763671875, -0.31775665283203125, -0.2871856689453125, -0.25661468505859375, -0.226043701171875, -0.19547271728515625, -0.1649017333984375, -0.13433074951171875, -0.103759765625, -0.07318878173828125, -0.0426177978515625, -0.01204681396484375, 0.018524169921875, 0.04909515380859375, 0.0796661376953125, 0.11023712158203125, 0.14080810546875, 0.17137908935546875, 0.2019500732421875, 0.23252105712890625, 0.263092041015625, 0.29366302490234375, 0.3242340087890625, 0.35480499267578125, 0.3853759765625, 0.41594696044921875, 0.4465179443359375, 0.47708892822265625, 0.507659912109375, 0.5382308959960938, 0.5688018798828125, 0.5993728637695312, 0.62994384765625, 0.6605148315429688, 0.6910858154296875, 0.7216567993164062, 0.752227783203125, 0.7827987670898438, 0.8133697509765625, 0.8439407348632812, 0.87451171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 29.0, 36.0, 62.0, 87.0, 230.0, 573.0, 2181.0, 14151.0, 266774.0, 728353.0, 30891.0, 3696.0, 851.0, 329.0, 126.0, 55.0, 43.0, 24.0, 14.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21167755126953125, -0.2016754150390625, -0.19167327880859375, -0.181671142578125, -0.17166900634765625, -0.1616668701171875, -0.15166473388671875, -0.14166259765625, -0.13166046142578125, -0.1216583251953125, -0.11165618896484375, -0.101654052734375, -0.09165191650390625, -0.0816497802734375, -0.07164764404296875, -0.0616455078125, -0.05164337158203125, -0.0416412353515625, -0.03163909912109375, -0.021636962890625, -0.01163482666015625, -0.0016326904296875, 0.00836944580078125, 0.01837158203125, 0.02837371826171875, 0.0383758544921875, 0.04837799072265625, 0.058380126953125, 0.06838226318359375, 0.0783843994140625, 0.08838653564453125, 0.098388671875, 0.10839080810546875, 0.1183929443359375, 0.12839508056640625, 0.138397216796875, 0.14839935302734375, 0.1584014892578125, 0.16840362548828125, 0.17840576171875, 0.18840789794921875, 0.1984100341796875, 0.20841217041015625, 0.218414306640625, 0.22841644287109375, 0.2384185791015625, 0.24842071533203125, 0.2584228515625, 0.26842498779296875, 0.2784271240234375, 0.28842926025390625, 0.298431396484375, 0.30843353271484375, 0.3184356689453125, 0.32843780517578125, 0.33843994140625, 0.34844207763671875, 0.3584442138671875, 0.36844635009765625, 0.378448486328125, 0.38845062255859375, 0.3984527587890625, 0.40845489501953125, 0.41845703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 13.0, 17.0, 24.0, 41.0, 49.0, 88.0, 152.0, 198.0, 146.0, 85.0, 65.0, 35.0, 25.0, 14.0, 7.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.8461217880249023e-05, -2.7000904083251953e-05, -2.5540590286254883e-05, -2.4080276489257812e-05, -2.2619962692260742e-05, -2.1159648895263672e-05, -1.96993350982666e-05, -1.823902130126953e-05, -1.677870750427246e-05, -1.531839370727539e-05, -1.385807991027832e-05, -1.239776611328125e-05, -1.093745231628418e-05, -9.47713851928711e-06, -8.016824722290039e-06, -6.556510925292969e-06, -5.0961971282958984e-06, -3.635883331298828e-06, -2.175569534301758e-06, -7.152557373046875e-07, 7.450580596923828e-07, 2.205371856689453e-06, 3.6656856536865234e-06, 5.125999450683594e-06, 6.586313247680664e-06, 8.046627044677734e-06, 9.506940841674805e-06, 1.0967254638671875e-05, 1.2427568435668945e-05, 1.3887882232666016e-05, 1.5348196029663086e-05, 1.6808509826660156e-05, 1.8268823623657227e-05, 1.9729137420654297e-05, 2.1189451217651367e-05, 2.2649765014648438e-05, 2.4110078811645508e-05, 2.5570392608642578e-05, 2.703070640563965e-05, 2.849102020263672e-05, 2.995133399963379e-05, 3.141164779663086e-05, 3.287196159362793e-05, 3.4332275390625e-05, 3.579258918762207e-05, 3.725290298461914e-05, 3.871321678161621e-05, 4.017353057861328e-05, 4.163384437561035e-05, 4.309415817260742e-05, 4.455447196960449e-05, 4.601478576660156e-05, 4.747509956359863e-05, 4.89354133605957e-05, 5.0395727157592773e-05, 5.1856040954589844e-05, 5.3316354751586914e-05, 5.4776668548583984e-05, 5.6236982345581055e-05, 5.7697296142578125e-05, 5.9157609939575195e-05, 6.0617923736572266e-05, 6.207823753356934e-05, 6.35385513305664e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 23.0, 49.0, 81.0, 197.0, 444.0, 1326.0, 8145.0, 181141.0, 827390.0, 25739.0, 2778.0, 727.0, 258.0, 99.0, 57.0, 38.0, 21.0, 14.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57421875, -0.5606193542480469, -0.5470199584960938, -0.5334205627441406, -0.5198211669921875, -0.5062217712402344, -0.49262237548828125, -0.4790229797363281, -0.465423583984375, -0.4518241882324219, -0.43822479248046875, -0.4246253967285156, -0.4110260009765625, -0.3974266052246094, -0.38382720947265625, -0.3702278137207031, -0.35662841796875, -0.3430290222167969, -0.32942962646484375, -0.3158302307128906, -0.3022308349609375, -0.2886314392089844, -0.27503204345703125, -0.2614326477050781, -0.247833251953125, -0.23423385620117188, -0.22063446044921875, -0.20703506469726562, -0.1934356689453125, -0.17983627319335938, -0.16623687744140625, -0.15263748168945312, -0.1390380859375, -0.12543869018554688, -0.11183929443359375, -0.09823989868164062, -0.0846405029296875, -0.07104110717773438, -0.05744171142578125, -0.043842315673828125, -0.030242919921875, -0.016643524169921875, -0.00304412841796875, 0.010555267333984375, 0.0241546630859375, 0.037754058837890625, 0.05135345458984375, 0.06495285034179688, 0.07855224609375, 0.09215164184570312, 0.10575103759765625, 0.11935043334960938, 0.1329498291015625, 0.14654922485351562, 0.16014862060546875, 0.17374801635742188, 0.187347412109375, 0.20094680786132812, 0.21454620361328125, 0.22814559936523438, 0.2417449951171875, 0.2553443908691406, 0.26894378662109375, 0.2825431823730469, 0.296142578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 12.0, 10.0, 25.0, 38.0, 93.0, 134.0, 256.0, 189.0, 101.0, 50.0, 30.0, 22.0, 14.0, 13.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.06971073150634766, -0.06465339660644531, -0.05959606170654297, -0.054538726806640625, -0.04948139190673828, -0.04442405700683594, -0.039366722106933594, -0.03430938720703125, -0.029252052307128906, -0.024194717407226562, -0.01913738250732422, -0.014080047607421875, -0.009022712707519531, -0.0039653778076171875, 0.0010919570922851562, 0.0061492919921875, 0.011206626892089844, 0.016263961791992188, 0.02132129669189453, 0.026378631591796875, 0.03143596649169922, 0.03649330139160156, 0.041550636291503906, 0.04660797119140625, 0.051665306091308594, 0.05672264099121094, 0.06177997589111328, 0.06683731079101562, 0.07189464569091797, 0.07695198059082031, 0.08200931549072266, 0.087066650390625, 0.09212398529052734, 0.09718132019042969, 0.10223865509033203, 0.10729598999023438, 0.11235332489013672, 0.11741065979003906, 0.1224679946899414, 0.12752532958984375, 0.1325826644897461, 0.13763999938964844, 0.14269733428955078, 0.14775466918945312, 0.15281200408935547, 0.1578693389892578, 0.16292667388916016, 0.1679840087890625, 0.17304134368896484, 0.1780986785888672, 0.18315601348876953, 0.18821334838867188, 0.19327068328857422, 0.19832801818847656, 0.2033853530883789, 0.20844268798828125, 0.2135000228881836, 0.21855735778808594, 0.22361469268798828, 0.22867202758789062, 0.23372936248779297, 0.2387866973876953, 0.24384403228759766, 0.2489013671875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 34.0, 60.0, 112.0, 102.0, 151.0, 149.0, 151.0, 100.0, 63.0, 34.0, 20.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2313326597213745, -1.1596059799194336, -1.0878793001174927, -1.0161526203155518, -0.9444258809089661, -0.8726992011070251, -0.8009724617004395, -0.7292457818984985, -0.6575191020965576, -0.5857924222946167, -0.5140657424926758, -0.4423390030860901, -0.37061232328414917, -0.29888564348220825, -0.22715893387794495, -0.15543222427368164, -0.08370554447174072, -0.01197884976863861, 0.0597478449344635, 0.1314745396375656, 0.20320123434066772, 0.27492791414260864, 0.34665462374687195, 0.41838133335113525, 0.49010801315307617, 0.5618346929550171, 0.633561372756958, 0.7052881121635437, 0.7770147919654846, 0.8487414717674255, 0.9204682111740112, 0.9921948909759521, 1.0639216899871826, 1.1356483697891235, 1.2073750495910645, 1.2791017293930054, 1.3508284091949463, 1.4225552082061768, 1.4942818880081177, 1.5660085678100586, 1.6377352476119995, 1.7094619274139404, 1.7811886072158813, 1.8529152870178223, 1.9246420860290527, 1.996368646621704, 2.0680954456329346, 2.139822006225586, 2.2115488052368164, 2.283275604248047, 2.3550021648406982, 2.4267289638519287, 2.49845552444458, 2.5701823234558105, 2.641908884048462, 2.7136356830596924, 2.7853622436523438, 2.857089042663574, 2.9288156032562256, 3.000542402267456, 3.0722689628601074, 3.143995761871338, 3.2157223224639893, 3.2874491214752197, 3.35917592048645]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 10.0, 3.0, 8.0, 4.0, 10.0, 17.0, 16.0, 16.0, 13.0, 28.0, 34.0, 26.0, 30.0, 27.0, 35.0, 32.0, 41.0, 41.0, 39.0, 40.0, 52.0, 41.0, 35.0, 36.0, 41.0, 34.0, 37.0, 29.0, 38.0, 29.0, 33.0, 21.0, 19.0, 18.0, 17.0, 10.0, 11.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3773609399795532, -1.333045482635498, -1.2887301445007324, -1.2444146871566772, -1.200099229812622, -1.155783772468567, -1.1114684343338013, -1.067152976989746, -1.022837519645691, -0.9785221219062805, -0.9342066645622253, -0.8898912668228149, -0.8455758094787598, -0.8012604117393494, -0.756945013999939, -0.7126295566558838, -0.6683141589164734, -0.623998761177063, -0.5796833038330078, -0.5353679060935974, -0.49105244874954224, -0.44673705101013184, -0.40242162346839905, -0.35810619592666626, -0.31379076838493347, -0.2694753408432007, -0.2251599133014679, -0.1808445006608963, -0.1365290731191635, -0.09221364557743073, -0.04789823293685913, -0.0035828053951263428, 0.040732622146606445, 0.08504804968833923, 0.12936347723007202, 0.17367888987064362, 0.2179943174123764, 0.262309730052948, 0.3066251575946808, 0.3509405851364136, 0.39525601267814636, 0.43957144021987915, 0.48388686776161194, 0.5282022953033447, 0.5725176930427551, 0.6168331503868103, 0.6611485481262207, 0.7054640054702759, 0.7497794032096863, 0.7940948009490967, 0.8384102582931519, 0.8827256560325623, 0.9270411133766174, 0.9713565111160278, 1.015671968460083, 1.0599873065948486, 1.1043027639389038, 1.148618221282959, 1.1929335594177246, 1.2372490167617798, 1.281564474105835, 1.3258799314498901, 1.3701952695846558, 1.414510726928711, 1.4588261842727661]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 15.0, 20.0, 25.0, 37.0, 30.0, 50.0, 82.0, 93.0, 143.0, 230.0, 407.0, 1022.0, 2493.0, 7809.0, 37971.0, 452097.0, 2827779.0, 791634.0, 55959.0, 10313.0, 3233.0, 1320.0, 592.0, 335.0, 168.0, 105.0, 87.0, 49.0, 37.0, 32.0, 18.0, 22.0, 13.0, 11.0, 4.0, 7.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.97021484375, -0.93951416015625, -0.9088134765625, -0.87811279296875, -0.847412109375, -0.81671142578125, -0.7860107421875, -0.75531005859375, -0.724609375, -0.69390869140625, -0.6632080078125, -0.63250732421875, -0.601806640625, -0.57110595703125, -0.5404052734375, -0.50970458984375, -0.47900390625, -0.44830322265625, -0.4176025390625, -0.38690185546875, -0.356201171875, -0.32550048828125, -0.2947998046875, -0.26409912109375, -0.2333984375, -0.20269775390625, -0.1719970703125, -0.14129638671875, -0.110595703125, -0.07989501953125, -0.0491943359375, -0.01849365234375, 0.01220703125, 0.04290771484375, 0.0736083984375, 0.10430908203125, 0.135009765625, 0.16571044921875, 0.1964111328125, 0.22711181640625, 0.2578125, 0.28851318359375, 0.3192138671875, 0.34991455078125, 0.380615234375, 0.41131591796875, 0.4420166015625, 0.47271728515625, 0.50341796875, 0.53411865234375, 0.5648193359375, 0.59552001953125, 0.626220703125, 0.65692138671875, 0.6876220703125, 0.71832275390625, 0.7490234375, 0.77972412109375, 0.8104248046875, 0.84112548828125, 0.871826171875, 0.90252685546875, 0.9332275390625, 0.96392822265625, 0.99462890625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 12.0, 10.0, 12.0, 16.0, 14.0, 23.0, 30.0, 27.0, 23.0, 38.0, 51.0, 31.0, 35.0, 61.0, 35.0, 50.0, 44.0, 46.0, 49.0, 32.0, 46.0, 47.0, 37.0, 35.0, 23.0, 14.0, 28.0, 23.0, 15.0, 18.0, 17.0, 12.0, 11.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.39963531494140625, -0.3847198486328125, -0.36980438232421875, -0.354888916015625, -0.33997344970703125, -0.3250579833984375, -0.31014251708984375, -0.29522705078125, -0.28031158447265625, -0.2653961181640625, -0.25048065185546875, -0.235565185546875, -0.22064971923828125, -0.2057342529296875, -0.19081878662109375, -0.1759033203125, -0.16098785400390625, -0.1460723876953125, -0.13115692138671875, -0.116241455078125, -0.10132598876953125, -0.0864105224609375, -0.07149505615234375, -0.05657958984375, -0.04166412353515625, -0.0267486572265625, -0.01183319091796875, 0.003082275390625, 0.01799774169921875, 0.0329132080078125, 0.04782867431640625, 0.062744140625, 0.07765960693359375, 0.0925750732421875, 0.10749053955078125, 0.122406005859375, 0.13732147216796875, 0.1522369384765625, 0.16715240478515625, 0.18206787109375, 0.19698333740234375, 0.2118988037109375, 0.22681427001953125, 0.241729736328125, 0.25664520263671875, 0.2715606689453125, 0.28647613525390625, 0.3013916015625, 0.31630706787109375, 0.3312225341796875, 0.34613800048828125, 0.361053466796875, 0.37596893310546875, 0.3908843994140625, 0.40579986572265625, 0.42071533203125, 0.43563079833984375, 0.4505462646484375, 0.46546173095703125, 0.480377197265625, 0.49529266357421875, 0.5102081298828125, 0.5251235961914062, 0.5400390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 15.0, 14.0, 22.0, 26.0, 54.0, 80.0, 115.0, 241.0, 528.0, 1256.0, 3823.0, 16930.0, 156813.0, 3529445.0, 447215.0, 29258.0, 5427.0, 1724.0, 622.0, 279.0, 160.0, 84.0, 40.0, 26.0, 27.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5810546875, -1.5390625, -1.4970703125, -1.455078125, -1.4130859375, -1.37109375, -1.3291015625, -1.287109375, -1.2451171875, -1.203125, -1.1611328125, -1.119140625, -1.0771484375, -1.03515625, -0.9931640625, -0.951171875, -0.9091796875, -0.8671875, -0.8251953125, -0.783203125, -0.7412109375, -0.69921875, -0.6572265625, -0.615234375, -0.5732421875, -0.53125, -0.4892578125, -0.447265625, -0.4052734375, -0.36328125, -0.3212890625, -0.279296875, -0.2373046875, -0.1953125, -0.1533203125, -0.111328125, -0.0693359375, -0.02734375, 0.0146484375, 0.056640625, 0.0986328125, 0.140625, 0.1826171875, 0.224609375, 0.2666015625, 0.30859375, 0.3505859375, 0.392578125, 0.4345703125, 0.4765625, 0.5185546875, 0.560546875, 0.6025390625, 0.64453125, 0.6865234375, 0.728515625, 0.7705078125, 0.8125, 0.8544921875, 0.896484375, 0.9384765625, 0.98046875, 1.0224609375, 1.064453125, 1.1064453125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 6.0, 9.0, 10.0, 16.0, 28.0, 29.0, 41.0, 68.0, 93.0, 137.0, 186.0, 268.0, 372.0, 467.0, 482.0, 489.0, 377.0, 287.0, 194.0, 152.0, 95.0, 58.0, 50.0, 26.0, 21.0, 23.0, 18.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.249267578125, -0.2411346435546875, -0.233001708984375, -0.2248687744140625, -0.21673583984375, -0.2086029052734375, -0.200469970703125, -0.1923370361328125, -0.1842041015625, -0.1760711669921875, -0.167938232421875, -0.1598052978515625, -0.15167236328125, -0.1435394287109375, -0.135406494140625, -0.1272735595703125, -0.119140625, -0.1110076904296875, -0.102874755859375, -0.0947418212890625, -0.08660888671875, -0.0784759521484375, -0.070343017578125, -0.0622100830078125, -0.0540771484375, -0.0459442138671875, -0.037811279296875, -0.0296783447265625, -0.02154541015625, -0.0134124755859375, -0.005279541015625, 0.0028533935546875, 0.010986328125, 0.0191192626953125, 0.027252197265625, 0.0353851318359375, 0.04351806640625, 0.0516510009765625, 0.059783935546875, 0.0679168701171875, 0.0760498046875, 0.0841827392578125, 0.092315673828125, 0.1004486083984375, 0.10858154296875, 0.1167144775390625, 0.124847412109375, 0.1329803466796875, 0.14111328125, 0.1492462158203125, 0.157379150390625, 0.1655120849609375, 0.17364501953125, 0.1817779541015625, 0.189910888671875, 0.1980438232421875, 0.2061767578125, 0.2143096923828125, 0.222442626953125, 0.2305755615234375, 0.23870849609375, 0.2468414306640625, 0.254974365234375, 0.2631072998046875, 0.271240234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 5.0, 7.0, 15.0, 13.0, 14.0, 29.0, 36.0, 52.0, 52.0, 65.0, 77.0, 68.0, 80.0, 80.0, 72.0, 49.0, 71.0, 64.0, 34.0, 32.0, 30.0, 11.0, 13.0, 9.0, 5.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0232040882110596, -0.994565486907959, -0.9659268260002136, -0.937288224697113, -0.9086496233940125, -0.8800109624862671, -0.8513723611831665, -0.8227337598800659, -0.7940950989723206, -0.76545649766922, -0.7368178367614746, -0.708179235458374, -0.6795406341552734, -0.6509019732475281, -0.6222633719444275, -0.5936247110366821, -0.5649861097335815, -0.536347508430481, -0.5077088475227356, -0.479070246219635, -0.45043161511421204, -0.42179298400878906, -0.3931543827056885, -0.3645157516002655, -0.3358771800994873, -0.30723854899406433, -0.27859994769096375, -0.24996131658554077, -0.2213226854801178, -0.19268406927585602, -0.16404545307159424, -0.13540682196617126, -0.10676819086074829, -0.07812956720590591, -0.049490947276353836, -0.020852327346801758, 0.007786296308040619, 0.036424919962882996, 0.06506353616714478, 0.09370216727256775, 0.12234078347682953, 0.1509793996810913, 0.17961803078651428, 0.20825664699077606, 0.23689526319503784, 0.2655338943004608, 0.2941725254058838, 0.3228111267089844, 0.35144975781440735, 0.3800883889198303, 0.4087269902229309, 0.4373656213283539, 0.46600425243377686, 0.49464285373687744, 0.523281455039978, 0.5519201159477234, 0.580558717250824, 0.6091973185539246, 0.6378359794616699, 0.6664745807647705, 0.6951131820678711, 0.7237518429756165, 0.752390444278717, 0.7810291051864624, 0.809667706489563]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 9.0, 9.0, 8.0, 17.0, 10.0, 14.0, 15.0, 27.0, 19.0, 33.0, 32.0, 31.0, 24.0, 29.0, 35.0, 37.0, 38.0, 43.0, 34.0, 46.0, 49.0, 36.0, 33.0, 35.0, 30.0, 32.0, 29.0, 24.0, 21.0, 22.0, 22.0, 17.0, 18.0, 18.0, 11.0, 17.0, 13.0, 11.0, 13.0, 11.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5270301699638367, -0.5106033682823181, -0.49417659640312195, -0.4777498245239258, -0.4613230228424072, -0.44489622116088867, -0.4284694492816925, -0.41204267740249634, -0.3956158757209778, -0.37918907403945923, -0.36276230216026306, -0.3463355302810669, -0.32990872859954834, -0.3134819269180298, -0.2970551550388336, -0.28062838315963745, -0.2642015814781189, -0.24777479469776154, -0.23134800791740417, -0.21492122113704681, -0.19849443435668945, -0.1820676475763321, -0.16564086079597473, -0.14921407401561737, -0.13278728723526, -0.11636050045490265, -0.09993371367454529, -0.08350692689418793, -0.06708014011383057, -0.050653353333473206, -0.034226566553115845, -0.017799779772758484, -0.0013729333877563477, 0.015053853392601013, 0.031480640172958374, 0.047907426953315735, 0.0643342137336731, 0.08076100051403046, 0.09718778729438782, 0.11361457407474518, 0.13004136085510254, 0.1464681476354599, 0.16289493441581726, 0.17932172119617462, 0.19574850797653198, 0.21217529475688934, 0.2286020815372467, 0.24502886831760406, 0.2614556550979614, 0.27788245677948, 0.29430922865867615, 0.3107360005378723, 0.32716280221939087, 0.3435896039009094, 0.3600163757801056, 0.37644314765930176, 0.3928699493408203, 0.40929675102233887, 0.42572352290153503, 0.4421502947807312, 0.45857709646224976, 0.4750038981437683, 0.4914306700229645, 0.5078574419021606, 0.5242842435836792]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 16.0, 25.0, 25.0, 61.0, 114.0, 212.0, 435.0, 919.0, 2425.0, 7231.0, 25352.0, 125125.0, 600014.0, 231190.0, 39428.0, 10274.0, 3329.0, 1199.0, 561.0, 268.0, 144.0, 81.0, 45.0, 32.0, 19.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24790573120117188, -0.23824310302734375, -0.22858047485351562, -0.2189178466796875, -0.20925521850585938, -0.19959259033203125, -0.18992996215820312, -0.180267333984375, -0.17060470581054688, -0.16094207763671875, -0.15127944946289062, -0.1416168212890625, -0.13195419311523438, -0.12229156494140625, -0.11262893676757812, -0.10296630859375, -0.09330368041992188, -0.08364105224609375, -0.07397842407226562, -0.0643157958984375, -0.054653167724609375, -0.04499053955078125, -0.035327911376953125, -0.025665283203125, -0.016002655029296875, -0.00634002685546875, 0.003322601318359375, 0.0129852294921875, 0.022647857666015625, 0.03231048583984375, 0.041973114013671875, 0.0516357421875, 0.061298370361328125, 0.07096099853515625, 0.08062362670898438, 0.0902862548828125, 0.09994888305664062, 0.10961151123046875, 0.11927413940429688, 0.128936767578125, 0.13859939575195312, 0.14826202392578125, 0.15792465209960938, 0.1675872802734375, 0.17724990844726562, 0.18691253662109375, 0.19657516479492188, 0.20623779296875, 0.21590042114257812, 0.22556304931640625, 0.23522567749023438, 0.2448883056640625, 0.2545509338378906, 0.26421356201171875, 0.2738761901855469, 0.283538818359375, 0.2932014465332031, 0.30286407470703125, 0.3125267028808594, 0.3221893310546875, 0.3318519592285156, 0.34151458740234375, 0.3511772155761719, 0.36083984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 7.0, 16.0, 18.0, 21.0, 18.0, 42.0, 39.0, 46.0, 29.0, 49.0, 48.0, 54.0, 52.0, 54.0, 53.0, 61.0, 57.0, 40.0, 34.0, 36.0, 29.0, 35.0, 24.0, 21.0, 16.0, 16.0, 16.0, 11.0, 14.0, 11.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.441162109375, -0.42810821533203125, -0.4150543212890625, -0.40200042724609375, -0.388946533203125, -0.37589263916015625, -0.3628387451171875, -0.34978485107421875, -0.33673095703125, -0.32367706298828125, -0.3106231689453125, -0.29756927490234375, -0.284515380859375, -0.27146148681640625, -0.2584075927734375, -0.24535369873046875, -0.2322998046875, -0.21924591064453125, -0.2061920166015625, -0.19313812255859375, -0.180084228515625, -0.16703033447265625, -0.1539764404296875, -0.14092254638671875, -0.12786865234375, -0.11481475830078125, -0.1017608642578125, -0.08870697021484375, -0.075653076171875, -0.06259918212890625, -0.0495452880859375, -0.03649139404296875, -0.0234375, -0.01038360595703125, 0.0026702880859375, 0.01572418212890625, 0.028778076171875, 0.04183197021484375, 0.0548858642578125, 0.06793975830078125, 0.08099365234375, 0.09404754638671875, 0.1071014404296875, 0.12015533447265625, 0.133209228515625, 0.14626312255859375, 0.1593170166015625, 0.17237091064453125, 0.1854248046875, 0.19847869873046875, 0.2115325927734375, 0.22458648681640625, 0.237640380859375, 0.25069427490234375, 0.2637481689453125, 0.27680206298828125, 0.28985595703125, 0.30290985107421875, 0.3159637451171875, 0.32901763916015625, 0.342071533203125, 0.35512542724609375, 0.3681793212890625, 0.38123321533203125, 0.394287109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 8.0, 11.0, 7.0, 9.0, 17.0, 25.0, 32.0, 40.0, 69.0, 97.0, 109.0, 164.0, 243.0, 383.0, 608.0, 1077.0, 1986.0, 3961.0, 8346.0, 18845.0, 46699.0, 124843.0, 301668.0, 315857.0, 135346.0, 49904.0, 20033.0, 8885.0, 4142.0, 2112.0, 1124.0, 645.0, 395.0, 263.0, 174.0, 115.0, 91.0, 60.0, 35.0, 32.0, 26.0, 12.0, 15.0, 12.0, 5.0, 4.0, 10.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.124267578125, -0.12026405334472656, -0.11626052856445312, -0.11225700378417969, -0.10825347900390625, -0.10424995422363281, -0.10024642944335938, -0.09624290466308594, -0.0922393798828125, -0.08823585510253906, -0.08423233032226562, -0.08022880554199219, -0.07622528076171875, -0.07222175598144531, -0.06821823120117188, -0.06421470642089844, -0.060211181640625, -0.05620765686035156, -0.052204132080078125, -0.04820060729980469, -0.04419708251953125, -0.04019355773925781, -0.036190032958984375, -0.03218650817871094, -0.0281829833984375, -0.024179458618164062, -0.020175933837890625, -0.016172409057617188, -0.01216888427734375, -0.008165359497070312, -0.004161834716796875, -0.0001583099365234375, 0.00384521484375, 0.007848739624023438, 0.011852264404296875, 0.015855789184570312, 0.01985931396484375, 0.023862838745117188, 0.027866363525390625, 0.03186988830566406, 0.0358734130859375, 0.03987693786621094, 0.043880462646484375, 0.04788398742675781, 0.05188751220703125, 0.05589103698730469, 0.059894561767578125, 0.06389808654785156, 0.067901611328125, 0.07190513610839844, 0.07590866088867188, 0.07991218566894531, 0.08391571044921875, 0.08791923522949219, 0.09192276000976562, 0.09592628479003906, 0.0999298095703125, 0.10393333435058594, 0.10793685913085938, 0.11194038391113281, 0.11594390869140625, 0.11994743347167969, 0.12395095825195312, 0.12795448303222656, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 4.0, 7.0, 4.0, 8.0, 5.0, 8.0, 9.0, 11.0, 16.0, 17.0, 16.0, 24.0, 24.0, 36.0, 32.0, 27.0, 43.0, 36.0, 65.0, 54.0, 68.0, 54.0, 48.0, 37.0, 52.0, 29.0, 33.0, 39.0, 27.0, 28.0, 30.0, 16.0, 14.0, 14.0, 12.0, 7.0, 8.0, 7.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6480178833007812, -0.6236724853515625, -0.5993270874023438, -0.574981689453125, -0.5506362915039062, -0.5262908935546875, -0.5019454956054688, -0.47760009765625, -0.45325469970703125, -0.4289093017578125, -0.40456390380859375, -0.380218505859375, -0.35587310791015625, -0.3315277099609375, -0.30718231201171875, -0.2828369140625, -0.25849151611328125, -0.2341461181640625, -0.20980072021484375, -0.185455322265625, -0.16110992431640625, -0.1367645263671875, -0.11241912841796875, -0.08807373046875, -0.06372833251953125, -0.0393829345703125, -0.01503753662109375, 0.009307861328125, 0.03365325927734375, 0.0579986572265625, 0.08234405517578125, 0.106689453125, 0.13103485107421875, 0.1553802490234375, 0.17972564697265625, 0.204071044921875, 0.22841644287109375, 0.2527618408203125, 0.27710723876953125, 0.30145263671875, 0.32579803466796875, 0.3501434326171875, 0.37448883056640625, 0.398834228515625, 0.42317962646484375, 0.4475250244140625, 0.47187042236328125, 0.4962158203125, 0.5205612182617188, 0.5449066162109375, 0.5692520141601562, 0.593597412109375, 0.6179428100585938, 0.6422882080078125, 0.6666336059570312, 0.69097900390625, 0.7153244018554688, 0.7396697998046875, 0.7640151977539062, 0.788360595703125, 0.8127059936523438, 0.8370513916015625, 0.8613967895507812, 0.8857421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 1.0, 8.0, 17.0, 23.0, 32.0, 53.0, 67.0, 100.0, 144.0, 233.0, 347.0, 660.0, 1260.0, 2459.0, 5870.0, 14900.0, 44175.0, 183686.0, 532939.0, 189499.0, 45390.0, 15281.0, 5773.0, 2525.0, 1303.0, 678.0, 400.0, 237.0, 171.0, 100.0, 49.0, 47.0, 24.0, 26.0, 25.0, 15.0, 9.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10640716552734375, -0.1031341552734375, -0.09986114501953125, -0.096588134765625, -0.09331512451171875, -0.0900421142578125, -0.08676910400390625, -0.08349609375, -0.08022308349609375, -0.0769500732421875, -0.07367706298828125, -0.070404052734375, -0.06713104248046875, -0.0638580322265625, -0.06058502197265625, -0.05731201171875, -0.05403900146484375, -0.0507659912109375, -0.04749298095703125, -0.044219970703125, -0.04094696044921875, -0.0376739501953125, -0.03440093994140625, -0.0311279296875, -0.02785491943359375, -0.0245819091796875, -0.02130889892578125, -0.018035888671875, -0.01476287841796875, -0.0114898681640625, -0.00821685791015625, -0.00494384765625, -0.00167083740234375, 0.0016021728515625, 0.00487518310546875, 0.008148193359375, 0.01142120361328125, 0.0146942138671875, 0.01796722412109375, 0.021240234375, 0.02451324462890625, 0.0277862548828125, 0.03105926513671875, 0.034332275390625, 0.03760528564453125, 0.0408782958984375, 0.04415130615234375, 0.04742431640625, 0.05069732666015625, 0.0539703369140625, 0.05724334716796875, 0.060516357421875, 0.06378936767578125, 0.0670623779296875, 0.07033538818359375, 0.0736083984375, 0.07688140869140625, 0.0801544189453125, 0.08342742919921875, 0.086700439453125, 0.08997344970703125, 0.0932464599609375, 0.09651947021484375, 0.09979248046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 10.0, 11.0, 8.0, 10.0, 11.0, 23.0, 23.0, 34.0, 51.0, 63.0, 70.0, 92.0, 97.0, 94.0, 88.0, 74.0, 56.0, 40.0, 29.0, 29.0, 20.0, 19.0, 6.0, 7.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.337860107421875e-05, -3.2220035791397095e-05, -3.106147050857544e-05, -2.9902905225753784e-05, -2.874433994293213e-05, -2.7585774660110474e-05, -2.642720937728882e-05, -2.5268644094467163e-05, -2.4110078811645508e-05, -2.2951513528823853e-05, -2.1792948246002197e-05, -2.0634382963180542e-05, -1.9475817680358887e-05, -1.831725239753723e-05, -1.7158687114715576e-05, -1.600012183189392e-05, -1.4841556549072266e-05, -1.368299126625061e-05, -1.2524425983428955e-05, -1.13658607006073e-05, -1.0207295417785645e-05, -9.04873013496399e-06, -7.890164852142334e-06, -6.731599569320679e-06, -5.5730342864990234e-06, -4.414469003677368e-06, -3.255903720855713e-06, -2.0973384380340576e-06, -9.387731552124023e-07, 2.1979212760925293e-07, 1.3783574104309082e-06, 2.5369226932525635e-06, 3.6954879760742188e-06, 4.854053258895874e-06, 6.012618541717529e-06, 7.1711838245391846e-06, 8.32974910736084e-06, 9.488314390182495e-06, 1.064687967300415e-05, 1.1805444955825806e-05, 1.2964010238647461e-05, 1.4122575521469116e-05, 1.528114080429077e-05, 1.6439706087112427e-05, 1.7598271369934082e-05, 1.8756836652755737e-05, 1.9915401935577393e-05, 2.1073967218399048e-05, 2.2232532501220703e-05, 2.339109778404236e-05, 2.4549663066864014e-05, 2.570822834968567e-05, 2.6866793632507324e-05, 2.802535891532898e-05, 2.9183924198150635e-05, 3.034248948097229e-05, 3.1501054763793945e-05, 3.26596200466156e-05, 3.3818185329437256e-05, 3.497675061225891e-05, 3.6135315895080566e-05, 3.729388117790222e-05, 3.845244646072388e-05, 3.961101174354553e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 12.0, 20.0, 14.0, 32.0, 42.0, 70.0, 152.0, 258.0, 616.0, 1599.0, 4868.0, 18216.0, 91957.0, 610388.0, 267415.0, 39205.0, 9148.0, 2686.0, 983.0, 410.0, 196.0, 101.0, 56.0, 36.0, 26.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23583984375, -0.23005294799804688, -0.22426605224609375, -0.21847915649414062, -0.2126922607421875, -0.20690536499023438, -0.20111846923828125, -0.19533157348632812, -0.189544677734375, -0.18375778198242188, -0.17797088623046875, -0.17218399047851562, -0.1663970947265625, -0.16061019897460938, -0.15482330322265625, -0.14903640747070312, -0.14324951171875, -0.13746261596679688, -0.13167572021484375, -0.12588882446289062, -0.1201019287109375, -0.11431503295898438, -0.10852813720703125, -0.10274124145507812, -0.096954345703125, -0.09116744995117188, -0.08538055419921875, -0.07959365844726562, -0.0738067626953125, -0.06801986694335938, -0.06223297119140625, -0.056446075439453125, -0.0506591796875, -0.044872283935546875, -0.03908538818359375, -0.033298492431640625, -0.0275115966796875, -0.021724700927734375, -0.01593780517578125, -0.010150909423828125, -0.004364013671875, 0.001422882080078125, 0.00720977783203125, 0.012996673583984375, 0.0187835693359375, 0.024570465087890625, 0.03035736083984375, 0.036144256591796875, 0.04193115234375, 0.047718048095703125, 0.05350494384765625, 0.059291839599609375, 0.0650787353515625, 0.07086563110351562, 0.07665252685546875, 0.08243942260742188, 0.088226318359375, 0.09401321411132812, 0.09980010986328125, 0.10558700561523438, 0.1113739013671875, 0.11716079711914062, 0.12294769287109375, 0.12873458862304688, 0.134521484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 7.0, 11.0, 12.0, 15.0, 18.0, 35.0, 23.0, 38.0, 57.0, 65.0, 79.0, 96.0, 113.0, 98.0, 58.0, 60.0, 37.0, 35.0, 27.0, 20.0, 20.0, 19.0, 12.0, 6.0, 4.0, 6.0, 0.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02777099609375, -0.026614665985107422, -0.025458335876464844, -0.024302005767822266, -0.023145675659179688, -0.02198934555053711, -0.02083301544189453, -0.019676685333251953, -0.018520355224609375, -0.017364025115966797, -0.01620769500732422, -0.01505136489868164, -0.013895034790039062, -0.012738704681396484, -0.011582374572753906, -0.010426044464111328, -0.00926971435546875, -0.008113384246826172, -0.006957054138183594, -0.005800724029541016, -0.0046443939208984375, -0.0034880638122558594, -0.0023317337036132812, -0.0011754035949707031, -1.9073486328125e-05, 0.0011372566223144531, 0.0022935867309570312, 0.0034499168395996094, 0.0046062469482421875, 0.005762577056884766, 0.006918907165527344, 0.008075237274169922, 0.0092315673828125, 0.010387897491455078, 0.011544227600097656, 0.012700557708740234, 0.013856887817382812, 0.01501321792602539, 0.01616954803466797, 0.017325878143310547, 0.018482208251953125, 0.019638538360595703, 0.02079486846923828, 0.02195119857788086, 0.023107528686523438, 0.024263858795166016, 0.025420188903808594, 0.026576519012451172, 0.02773284912109375, 0.028889179229736328, 0.030045509338378906, 0.031201839447021484, 0.03235816955566406, 0.03351449966430664, 0.03467082977294922, 0.0358271598815918, 0.036983489990234375, 0.03813982009887695, 0.03929615020751953, 0.04045248031616211, 0.04160881042480469, 0.042765140533447266, 0.043921470642089844, 0.04507780075073242, 0.046234130859375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 11.0, 7.0, 16.0, 19.0, 38.0, 45.0, 63.0, 83.0, 95.0, 104.0, 95.0, 108.0, 85.0, 69.0, 50.0, 32.0, 32.0, 18.0, 15.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6906836628913879, -0.6698765158653259, -0.6490693092346191, -0.6282621622085571, -0.6074550151824951, -0.5866478681564331, -0.5658407211303711, -0.5450335144996643, -0.5242263674736023, -0.5034192204475403, -0.4826120436191559, -0.4618048667907715, -0.4409977197647095, -0.42019057273864746, -0.39938339591026306, -0.37857621908187866, -0.35776907205581665, -0.33696192502975464, -0.31615474820137024, -0.29534757137298584, -0.27454042434692383, -0.2537332773208618, -0.23292610049247742, -0.2121189385652542, -0.191311776638031, -0.1705046147108078, -0.1496974527835846, -0.1288902908563614, -0.10808312892913818, -0.08727596700191498, -0.06646880507469177, -0.04566164314746857, -0.024854540824890137, -0.004047378897666931, 0.016759783029556274, 0.03756694495677948, 0.058374106884002686, 0.07918126881122589, 0.0999884307384491, 0.1207955926656723, 0.1416027545928955, 0.1624099165201187, 0.18321707844734192, 0.20402424037456512, 0.22483140230178833, 0.24563856422901154, 0.26644572615623474, 0.28725290298461914, 0.30806005001068115, 0.32886719703674316, 0.34967437386512756, 0.37048155069351196, 0.391288697719574, 0.412095844745636, 0.4329030215740204, 0.4537101984024048, 0.4745173454284668, 0.4953244924545288, 0.5161316394805908, 0.5369388461112976, 0.5577459931373596, 0.5785531401634216, 0.5993603467941284, 0.6201674938201904, 0.6409746408462524]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 10.0, 13.0, 14.0, 19.0, 17.0, 29.0, 30.0, 24.0, 32.0, 35.0, 45.0, 47.0, 49.0, 43.0, 49.0, 48.0, 66.0, 46.0, 47.0, 39.0, 31.0, 30.0, 31.0, 36.0, 21.0, 25.0, 28.0, 14.0, 19.0, 12.0, 12.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43076878786087036, -0.4190334975719452, -0.40729817748069763, -0.39556288719177246, -0.3838275671005249, -0.37209227681159973, -0.36035698652267456, -0.348621666431427, -0.33688637614250183, -0.32515108585357666, -0.3134157657623291, -0.30168047547340393, -0.28994518518447876, -0.2782098650932312, -0.26647457480430603, -0.25473928451538086, -0.2430039644241333, -0.23126865923404694, -0.21953335404396057, -0.2077980637550354, -0.19606275856494904, -0.18432745337486267, -0.1725921630859375, -0.16085685789585114, -0.14912155270576477, -0.1373862475156784, -0.12565094232559204, -0.11391565203666687, -0.1021803468465805, -0.09044504165649414, -0.07870974391698837, -0.0669744461774826, -0.05523917078971863, -0.04350386932492256, -0.031768567860126495, -0.02003326639533043, -0.008297964930534363, 0.0034373365342617035, 0.01517263799905777, 0.026907935738563538, 0.0386432409286499, 0.05037854239344597, 0.062113843858242035, 0.0738491415977478, 0.08558444678783417, 0.09731975197792053, 0.1090550497174263, 0.12079034745693207, 0.13252565264701843, 0.1442609578371048, 0.15599626302719116, 0.16773155331611633, 0.1794668585062027, 0.19120216369628906, 0.20293745398521423, 0.2146727591753006, 0.22640806436538696, 0.23814336955547333, 0.2498786747455597, 0.26161396503448486, 0.2733492851257324, 0.2850845754146576, 0.29681986570358276, 0.3085551857948303, 0.3202904760837555]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 10.0, 19.0, 18.0, 50.0, 89.0, 227.0, 425.0, 975.0, 2231.0, 5805.0, 17618.0, 79869.0, 556619.0, 318694.0, 46689.0, 11956.0, 4196.0, 1621.0, 736.0, 342.0, 169.0, 81.0, 41.0, 22.0, 13.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8271484375, -0.802703857421875, -0.77825927734375, -0.753814697265625, -0.7293701171875, -0.704925537109375, -0.68048095703125, -0.656036376953125, -0.631591796875, -0.607147216796875, -0.58270263671875, -0.558258056640625, -0.5338134765625, -0.509368896484375, -0.48492431640625, -0.460479736328125, -0.43603515625, -0.411590576171875, -0.38714599609375, -0.362701416015625, -0.3382568359375, -0.313812255859375, -0.28936767578125, -0.264923095703125, -0.240478515625, -0.216033935546875, -0.19158935546875, -0.167144775390625, -0.1427001953125, -0.118255615234375, -0.09381103515625, -0.069366455078125, -0.044921875, -0.020477294921875, 0.00396728515625, 0.028411865234375, 0.0528564453125, 0.077301025390625, 0.10174560546875, 0.126190185546875, 0.150634765625, 0.175079345703125, 0.19952392578125, 0.223968505859375, 0.2484130859375, 0.272857666015625, 0.29730224609375, 0.321746826171875, 0.34619140625, 0.370635986328125, 0.39508056640625, 0.419525146484375, 0.4439697265625, 0.468414306640625, 0.49285888671875, 0.517303466796875, 0.541748046875, 0.566192626953125, 0.59063720703125, 0.615081787109375, 0.6395263671875, 0.663970947265625, 0.68841552734375, 0.712860107421875, 0.7373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 5.0, 12.0, 14.0, 21.0, 13.0, 20.0, 24.0, 30.0, 35.0, 42.0, 30.0, 32.0, 45.0, 45.0, 47.0, 41.0, 59.0, 48.0, 47.0, 42.0, 39.0, 35.0, 36.0, 30.0, 23.0, 30.0, 14.0, 27.0, 16.0, 20.0, 16.0, 18.0, 7.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6590347290039062, -0.6359405517578125, -0.6128463745117188, -0.589752197265625, -0.5666580200195312, -0.5435638427734375, -0.5204696655273438, -0.49737548828125, -0.47428131103515625, -0.4511871337890625, -0.42809295654296875, -0.404998779296875, -0.38190460205078125, -0.3588104248046875, -0.33571624755859375, -0.3126220703125, -0.28952789306640625, -0.2664337158203125, -0.24333953857421875, -0.220245361328125, -0.19715118408203125, -0.1740570068359375, -0.15096282958984375, -0.12786865234375, -0.10477447509765625, -0.0816802978515625, -0.05858612060546875, -0.035491943359375, -0.01239776611328125, 0.0106964111328125, 0.03379058837890625, 0.056884765625, 0.07997894287109375, 0.1030731201171875, 0.12616729736328125, 0.149261474609375, 0.17235565185546875, 0.1954498291015625, 0.21854400634765625, 0.24163818359375, 0.26473236083984375, 0.2878265380859375, 0.31092071533203125, 0.334014892578125, 0.35710906982421875, 0.3802032470703125, 0.40329742431640625, 0.4263916015625, 0.44948577880859375, 0.4725799560546875, 0.49567413330078125, 0.518768310546875, 0.5418624877929688, 0.5649566650390625, 0.5880508422851562, 0.61114501953125, 0.6342391967773438, 0.6573333740234375, 0.6804275512695312, 0.703521728515625, 0.7266159057617188, 0.7497100830078125, 0.7728042602539062, 0.7958984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 15.0, 14.0, 26.0, 35.0, 49.0, 88.0, 130.0, 260.0, 546.0, 1195.0, 3859.0, 17716.0, 204095.0, 752363.0, 56152.0, 8094.0, 2230.0, 800.0, 381.0, 199.0, 98.0, 57.0, 53.0, 23.0, 20.0, 18.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.4817962646484375, -1.444061279296875, -1.4063262939453125, -1.36859130859375, -1.3308563232421875, -1.293121337890625, -1.2553863525390625, -1.2176513671875, -1.1799163818359375, -1.142181396484375, -1.1044464111328125, -1.06671142578125, -1.0289764404296875, -0.991241455078125, -0.9535064697265625, -0.915771484375, -0.8780364990234375, -0.840301513671875, -0.8025665283203125, -0.76483154296875, -0.7270965576171875, -0.689361572265625, -0.6516265869140625, -0.6138916015625, -0.5761566162109375, -0.538421630859375, -0.5006866455078125, -0.46295166015625, -0.4252166748046875, -0.387481689453125, -0.3497467041015625, -0.31201171875, -0.2742767333984375, -0.236541748046875, -0.1988067626953125, -0.16107177734375, -0.1233367919921875, -0.085601806640625, -0.0478668212890625, -0.0101318359375, 0.0276031494140625, 0.065338134765625, 0.1030731201171875, 0.14080810546875, 0.1785430908203125, 0.216278076171875, 0.2540130615234375, 0.291748046875, 0.3294830322265625, 0.367218017578125, 0.4049530029296875, 0.44268798828125, 0.4804229736328125, 0.518157958984375, 0.5558929443359375, 0.5936279296875, 0.6313629150390625, 0.669097900390625, 0.7068328857421875, 0.74456787109375, 0.7823028564453125, 0.820037841796875, 0.8577728271484375, 0.8955078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 5.0, 5.0, 4.0, 8.0, 4.0, 10.0, 11.0, 13.0, 26.0, 18.0, 37.0, 43.0, 52.0, 55.0, 56.0, 50.0, 53.0, 81.0, 59.0, 57.0, 49.0, 56.0, 43.0, 41.0, 29.0, 21.0, 18.0, 22.0, 17.0, 8.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.11328125, -1.080780029296875, -1.04827880859375, -1.015777587890625, -0.9832763671875, -0.950775146484375, -0.91827392578125, -0.885772705078125, -0.853271484375, -0.820770263671875, -0.78826904296875, -0.755767822265625, -0.7232666015625, -0.690765380859375, -0.65826416015625, -0.625762939453125, -0.59326171875, -0.560760498046875, -0.52825927734375, -0.495758056640625, -0.4632568359375, -0.430755615234375, -0.39825439453125, -0.365753173828125, -0.333251953125, -0.300750732421875, -0.26824951171875, -0.235748291015625, -0.2032470703125, -0.170745849609375, -0.13824462890625, -0.105743408203125, -0.0732421875, -0.040740966796875, -0.00823974609375, 0.024261474609375, 0.0567626953125, 0.089263916015625, 0.12176513671875, 0.154266357421875, 0.186767578125, 0.219268798828125, 0.25177001953125, 0.284271240234375, 0.3167724609375, 0.349273681640625, 0.38177490234375, 0.414276123046875, 0.44677734375, 0.479278564453125, 0.51177978515625, 0.544281005859375, 0.5767822265625, 0.609283447265625, 0.64178466796875, 0.674285888671875, 0.706787109375, 0.739288330078125, 0.77178955078125, 0.804290771484375, 0.8367919921875, 0.869293212890625, 0.90179443359375, 0.934295654296875, 0.966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 12.0, 15.0, 35.0, 64.0, 130.0, 244.0, 733.0, 2712.0, 14242.0, 139338.0, 781119.0, 95711.0, 10872.0, 2235.0, 620.0, 233.0, 109.0, 46.0, 23.0, 11.0, 11.0, 7.0, 10.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.292236328125, -0.2837486267089844, -0.27526092529296875, -0.2667732238769531, -0.2582855224609375, -0.24979782104492188, -0.24131011962890625, -0.23282241821289062, -0.224334716796875, -0.21584701538085938, -0.20735931396484375, -0.19887161254882812, -0.1903839111328125, -0.18189620971679688, -0.17340850830078125, -0.16492080688476562, -0.15643310546875, -0.14794540405273438, -0.13945770263671875, -0.13097000122070312, -0.1224822998046875, -0.11399459838867188, -0.10550689697265625, -0.09701919555664062, -0.088531494140625, -0.08004379272460938, -0.07155609130859375, -0.06306838989257812, -0.0545806884765625, -0.046092987060546875, -0.03760528564453125, -0.029117584228515625, -0.0206298828125, -0.012142181396484375, -0.00365447998046875, 0.004833221435546875, 0.0133209228515625, 0.021808624267578125, 0.03029632568359375, 0.038784027099609375, 0.047271728515625, 0.055759429931640625, 0.06424713134765625, 0.07273483276367188, 0.0812225341796875, 0.08971023559570312, 0.09819793701171875, 0.10668563842773438, 0.11517333984375, 0.12366104125976562, 0.13214874267578125, 0.14063644409179688, 0.1491241455078125, 0.15761184692382812, 0.16609954833984375, 0.17458724975585938, 0.183074951171875, 0.19156265258789062, 0.20005035400390625, 0.20853805541992188, 0.2170257568359375, 0.22551345825195312, 0.23400115966796875, 0.24248886108398438, 0.2509765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 6.0, 13.0, 14.0, 17.0, 39.0, 58.0, 85.0, 118.0, 147.0, 130.0, 115.0, 86.0, 50.0, 41.0, 29.0, 16.0, 7.0, 6.0, 4.0, 4.0, 0.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.661083221435547e-05, -4.550628364086151e-05, -4.4401735067367554e-05, -4.3297186493873596e-05, -4.219263792037964e-05, -4.108808934688568e-05, -3.9983540773391724e-05, -3.8878992199897766e-05, -3.777444362640381e-05, -3.666989505290985e-05, -3.5565346479415894e-05, -3.4460797905921936e-05, -3.335624933242798e-05, -3.225170075893402e-05, -3.1147152185440063e-05, -3.0042603611946106e-05, -2.893805503845215e-05, -2.783350646495819e-05, -2.6728957891464233e-05, -2.5624409317970276e-05, -2.451986074447632e-05, -2.341531217098236e-05, -2.2310763597488403e-05, -2.1206215023994446e-05, -2.0101666450500488e-05, -1.899711787700653e-05, -1.7892569303512573e-05, -1.6788020730018616e-05, -1.5683472156524658e-05, -1.45789235830307e-05, -1.3474375009536743e-05, -1.2369826436042786e-05, -1.1265277862548828e-05, -1.016072928905487e-05, -9.056180715560913e-06, -7.951632142066956e-06, -6.847083568572998e-06, -5.7425349950790405e-06, -4.637986421585083e-06, -3.5334378480911255e-06, -2.428889274597168e-06, -1.3243407011032104e-06, -2.1979212760925293e-07, 8.847564458847046e-07, 1.989305019378662e-06, 3.0938535928726196e-06, 4.198402166366577e-06, 5.302950739860535e-06, 6.407499313354492e-06, 7.51204788684845e-06, 8.616596460342407e-06, 9.721145033836365e-06, 1.0825693607330322e-05, 1.193024218082428e-05, 1.3034790754318237e-05, 1.4139339327812195e-05, 1.5243887901306152e-05, 1.634843647480011e-05, 1.7452985048294067e-05, 1.8557533621788025e-05, 1.9662082195281982e-05, 2.076663076877594e-05, 2.1871179342269897e-05, 2.2975727915763855e-05, 2.4080276489257812e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 8.0, 19.0, 19.0, 45.0, 70.0, 180.0, 653.0, 2405.0, 13944.0, 252277.0, 737485.0, 35432.0, 4406.0, 1041.0, 290.0, 123.0, 65.0, 25.0, 22.0, 13.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.5068359375, -0.49390411376953125, -0.4809722900390625, -0.46804046630859375, -0.455108642578125, -0.44217681884765625, -0.4292449951171875, -0.41631317138671875, -0.40338134765625, -0.39044952392578125, -0.3775177001953125, -0.36458587646484375, -0.351654052734375, -0.33872222900390625, -0.3257904052734375, -0.31285858154296875, -0.2999267578125, -0.28699493408203125, -0.2740631103515625, -0.26113128662109375, -0.248199462890625, -0.23526763916015625, -0.2223358154296875, -0.20940399169921875, -0.19647216796875, -0.18354034423828125, -0.1706085205078125, -0.15767669677734375, -0.144744873046875, -0.13181304931640625, -0.1188812255859375, -0.10594940185546875, -0.093017578125, -0.08008575439453125, -0.0671539306640625, -0.05422210693359375, -0.041290283203125, -0.02835845947265625, -0.0154266357421875, -0.00249481201171875, 0.01043701171875, 0.02336883544921875, 0.0363006591796875, 0.04923248291015625, 0.062164306640625, 0.07509613037109375, 0.0880279541015625, 0.10095977783203125, 0.1138916015625, 0.12682342529296875, 0.1397552490234375, 0.15268707275390625, 0.165618896484375, 0.17855072021484375, 0.1914825439453125, 0.20441436767578125, 0.21734619140625, 0.23027801513671875, 0.2432098388671875, 0.25614166259765625, 0.269073486328125, 0.28200531005859375, 0.2949371337890625, 0.30786895751953125, 0.32080078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 19.0, 28.0, 42.0, 73.0, 91.0, 114.0, 175.0, 151.0, 97.0, 85.0, 39.0, 27.0, 12.0, 9.0, 3.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1116943359375, -0.107177734375, -0.1026611328125, -0.09814453125, -0.0936279296875, -0.089111328125, -0.0845947265625, -0.080078125, -0.0755615234375, -0.071044921875, -0.0665283203125, -0.06201171875, -0.0574951171875, -0.052978515625, -0.0484619140625, -0.0439453125, -0.0394287109375, -0.034912109375, -0.0303955078125, -0.02587890625, -0.0213623046875, -0.016845703125, -0.0123291015625, -0.0078125, -0.0032958984375, 0.001220703125, 0.0057373046875, 0.01025390625, 0.0147705078125, 0.019287109375, 0.0238037109375, 0.0283203125, 0.0328369140625, 0.037353515625, 0.0418701171875, 0.04638671875, 0.0509033203125, 0.055419921875, 0.0599365234375, 0.064453125, 0.0689697265625, 0.073486328125, 0.0780029296875, 0.08251953125, 0.0870361328125, 0.091552734375, 0.0960693359375, 0.1005859375, 0.1051025390625, 0.109619140625, 0.1141357421875, 0.11865234375, 0.1231689453125, 0.127685546875, 0.1322021484375, 0.13671875, 0.1412353515625, 0.145751953125, 0.1502685546875, 0.15478515625, 0.1593017578125, 0.163818359375, 0.1683349609375, 0.1728515625, 0.1773681640625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 27.0, 44.0, 123.0, 185.0, 191.0, 178.0, 134.0, 65.0, 34.0, 13.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.579605221748352, -1.4899643659591675, -1.4003233909606934, -1.3106825351715088, -1.2210416793823242, -1.1314008235931396, -1.041759967803955, -0.952118992805481, -0.8624781370162964, -0.7728372812271118, -0.6831963658332825, -0.5935554504394531, -0.5039145946502686, -0.4142737090587616, -0.32463282346725464, -0.2349919080734253, -0.14535105228424072, -0.055710166692733765, 0.03393071889877319, 0.12357160449028015, 0.2132124900817871, 0.30285337567329407, 0.392494261264801, 0.48213517665863037, 0.5717760324478149, 0.6614168882369995, 0.7510578036308289, 0.8406987190246582, 0.9303395748138428, 1.0199804306030273, 1.109621286392212, 1.199262261390686, 1.2889032363891602, 1.3785440921783447, 1.4681849479675293, 1.5578259229660034, 1.647466778755188, 1.7371076345443726, 1.8267486095428467, 1.9163894653320312, 2.006030321121216, 2.0956711769104004, 2.185312032699585, 2.2749528884887695, 2.364593982696533, 2.4542348384857178, 2.5438756942749023, 2.633516550064087, 2.7231574058532715, 2.812798261642456, 2.9024391174316406, 2.992079973220825, 3.0817208290100098, 3.1713619232177734, 3.261002779006958, 3.3506436347961426, 3.440284490585327, 3.5299253463745117, 3.6195662021636963, 3.709207057952881, 3.7988481521606445, 3.888489007949829, 3.9781298637390137, 4.067770957946777, 4.157411575317383]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 4.0, 2.0, 12.0, 15.0, 10.0, 21.0, 10.0, 19.0, 14.0, 24.0, 16.0, 26.0, 24.0, 37.0, 35.0, 31.0, 41.0, 43.0, 56.0, 49.0, 43.0, 47.0, 35.0, 41.0, 46.0, 37.0, 35.0, 30.0, 33.0, 20.0, 26.0, 14.0, 19.0, 17.0, 9.0, 7.0, 10.0, 15.0, 7.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2883727550506592, -1.2457438707351685, -1.2031149864196777, -1.1604862213134766, -1.1178573369979858, -1.0752284526824951, -1.0325995683670044, -0.9899707436561584, -0.9473419189453125, -0.9047130346298218, -0.8620842099189758, -0.8194553256034851, -0.7768265008926392, -0.7341976165771484, -0.6915687322616577, -0.6489399075508118, -0.606311023235321, -0.5636821389198303, -0.5210533142089844, -0.47842442989349365, -0.4357956051826477, -0.393166720867157, -0.35053786635398865, -0.3079090118408203, -0.265280157327652, -0.22265130281448364, -0.1800224483013153, -0.13739357888698578, -0.09476472437381744, -0.05213586986064911, -0.00950700044631958, 0.033121854066848755, 0.07575070858001709, 0.11837956309318542, 0.16100841760635376, 0.2036372870206833, 0.24626614153385162, 0.28889501094818115, 0.3315238654613495, 0.3741527199745178, 0.41678157448768616, 0.4594104290008545, 0.5020393133163452, 0.5446681380271912, 0.5872970223426819, 0.6299258470535278, 0.6725547313690186, 0.7151836156845093, 0.7578124403953552, 0.800441324710846, 0.8430701494216919, 0.8856990337371826, 0.9283278584480286, 0.9709567427635193, 1.0135855674743652, 1.056214451789856, 1.0988433361053467, 1.1414722204208374, 1.1841011047363281, 1.2267298698425293, 1.26935875415802, 1.3119876384735107, 1.3546165227890015, 1.3972454071044922, 1.4398741722106934]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 7.0, 10.0, 12.0, 15.0, 18.0, 24.0, 35.0, 40.0, 51.0, 85.0, 149.0, 241.0, 466.0, 1014.0, 2397.0, 7093.0, 30366.0, 355066.0, 2993356.0, 741667.0, 46951.0, 9446.0, 3146.0, 1228.0, 569.0, 281.0, 189.0, 107.0, 51.0, 51.0, 23.0, 25.0, 15.0, 13.0, 14.0, 12.0, 10.0, 7.0, 5.0, 7.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.99609375, -0.96356201171875, -0.9310302734375, -0.89849853515625, -0.865966796875, -0.83343505859375, -0.8009033203125, -0.76837158203125, -0.73583984375, -0.70330810546875, -0.6707763671875, -0.63824462890625, -0.605712890625, -0.57318115234375, -0.5406494140625, -0.50811767578125, -0.4755859375, -0.44305419921875, -0.4105224609375, -0.37799072265625, -0.345458984375, -0.31292724609375, -0.2803955078125, -0.24786376953125, -0.21533203125, -0.18280029296875, -0.1502685546875, -0.11773681640625, -0.085205078125, -0.05267333984375, -0.0201416015625, 0.01239013671875, 0.044921875, 0.07745361328125, 0.1099853515625, 0.14251708984375, 0.175048828125, 0.20758056640625, 0.2401123046875, 0.27264404296875, 0.30517578125, 0.33770751953125, 0.3702392578125, 0.40277099609375, 0.435302734375, 0.46783447265625, 0.5003662109375, 0.53289794921875, 0.5654296875, 0.59796142578125, 0.6304931640625, 0.66302490234375, 0.695556640625, 0.72808837890625, 0.7606201171875, 0.79315185546875, 0.82568359375, 0.85821533203125, 0.8907470703125, 0.92327880859375, 0.955810546875, 0.98834228515625, 1.0208740234375, 1.05340576171875, 1.0859375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 9.0, 8.0, 2.0, 13.0, 13.0, 14.0, 24.0, 22.0, 17.0, 21.0, 38.0, 28.0, 40.0, 41.0, 38.0, 36.0, 44.0, 43.0, 43.0, 38.0, 47.0, 40.0, 41.0, 37.0, 40.0, 36.0, 33.0, 24.0, 26.0, 26.0, 26.0, 11.0, 14.0, 8.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3603630065917969, -0.34792327880859375, -0.3354835510253906, -0.3230438232421875, -0.3106040954589844, -0.29816436767578125, -0.2857246398925781, -0.273284912109375, -0.2608451843261719, -0.24840545654296875, -0.23596572875976562, -0.2235260009765625, -0.21108627319335938, -0.19864654541015625, -0.18620681762695312, -0.17376708984375, -0.16132736206054688, -0.14888763427734375, -0.13644790649414062, -0.1240081787109375, -0.11156845092773438, -0.09912872314453125, -0.08668899536132812, -0.074249267578125, -0.061809539794921875, -0.04936981201171875, -0.036930084228515625, -0.0244903564453125, -0.012050628662109375, 0.00038909912109375, 0.012828826904296875, 0.0252685546875, 0.037708282470703125, 0.05014801025390625, 0.06258773803710938, 0.0750274658203125, 0.08746719360351562, 0.09990692138671875, 0.11234664916992188, 0.124786376953125, 0.13722610473632812, 0.14966583251953125, 0.16210556030273438, 0.1745452880859375, 0.18698501586914062, 0.19942474365234375, 0.21186447143554688, 0.22430419921875, 0.23674392700195312, 0.24918365478515625, 0.2616233825683594, 0.2740631103515625, 0.2865028381347656, 0.29894256591796875, 0.3113822937011719, 0.323822021484375, 0.3362617492675781, 0.34870147705078125, 0.3611412048339844, 0.3735809326171875, 0.3860206604003906, 0.39846038818359375, 0.4109001159667969, 0.42333984375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 14.0, 20.0, 41.0, 98.0, 201.0, 701.0, 2785.0, 19486.0, 1660781.0, 2482533.0, 23300.0, 3121.0, 702.0, 239.0, 95.0, 50.0, 31.0, 13.0, 15.0, 12.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3198699951171875, -2.258880615234375, -2.1978912353515625, -2.13690185546875, -2.0759124755859375, -2.014923095703125, -1.9539337158203125, -1.8929443359375, -1.8319549560546875, -1.770965576171875, -1.7099761962890625, -1.64898681640625, -1.5879974365234375, -1.527008056640625, -1.4660186767578125, -1.405029296875, -1.3440399169921875, -1.283050537109375, -1.2220611572265625, -1.16107177734375, -1.1000823974609375, -1.039093017578125, -0.9781036376953125, -0.9171142578125, -0.8561248779296875, -0.795135498046875, -0.7341461181640625, -0.67315673828125, -0.6121673583984375, -0.551177978515625, -0.4901885986328125, -0.42919921875, -0.3682098388671875, -0.307220458984375, -0.2462310791015625, -0.18524169921875, -0.1242523193359375, -0.063262939453125, -0.0022735595703125, 0.0587158203125, 0.1197052001953125, 0.180694580078125, 0.2416839599609375, 0.30267333984375, 0.3636627197265625, 0.424652099609375, 0.4856414794921875, 0.546630859375, 0.6076202392578125, 0.668609619140625, 0.7295989990234375, 0.79058837890625, 0.8515777587890625, 0.912567138671875, 0.9735565185546875, 1.0345458984375, 1.0955352783203125, 1.156524658203125, 1.2175140380859375, 1.27850341796875, 1.3394927978515625, 1.400482177734375, 1.4614715576171875, 1.5224609375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 24.0, 37.0, 63.0, 128.0, 223.0, 451.0, 745.0, 865.0, 641.0, 388.0, 216.0, 100.0, 59.0, 42.0, 21.0, 12.0, 14.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.2987518310546875, -0.285980224609375, -0.2732086181640625, -0.26043701171875, -0.2476654052734375, -0.234893798828125, -0.2221221923828125, -0.2093505859375, -0.1965789794921875, -0.183807373046875, -0.1710357666015625, -0.15826416015625, -0.1454925537109375, -0.132720947265625, -0.1199493408203125, -0.107177734375, -0.0944061279296875, -0.081634521484375, -0.0688629150390625, -0.05609130859375, -0.0433197021484375, -0.030548095703125, -0.0177764892578125, -0.0050048828125, 0.0077667236328125, 0.020538330078125, 0.0333099365234375, 0.04608154296875, 0.0588531494140625, 0.071624755859375, 0.0843963623046875, 0.09716796875, 0.1099395751953125, 0.122711181640625, 0.1354827880859375, 0.14825439453125, 0.1610260009765625, 0.173797607421875, 0.1865692138671875, 0.1993408203125, 0.2121124267578125, 0.224884033203125, 0.2376556396484375, 0.25042724609375, 0.2631988525390625, 0.275970458984375, 0.2887420654296875, 0.301513671875, 0.3142852783203125, 0.327056884765625, 0.3398284912109375, 0.35260009765625, 0.3653717041015625, 0.378143310546875, 0.3909149169921875, 0.4036865234375, 0.4164581298828125, 0.429229736328125, 0.4420013427734375, 0.45477294921875, 0.4675445556640625, 0.480316162109375, 0.4930877685546875, 0.505859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 8.0, 20.0, 11.0, 19.0, 21.0, 29.0, 30.0, 30.0, 38.0, 48.0, 48.0, 36.0, 55.0, 55.0, 66.0, 63.0, 55.0, 62.0, 46.0, 33.0, 46.0, 40.0, 35.0, 16.0, 21.0, 15.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.711143970489502, -0.6911450028419495, -0.6711459755897522, -0.6511470079421997, -0.6311479806900024, -0.61114901304245, -0.5911499857902527, -0.5711510181427002, -0.5511519908905029, -0.5311530232429504, -0.5111539959907532, -0.4911549985408783, -0.4711560010910034, -0.4511570334434509, -0.43115803599357605, -0.41115903854370117, -0.3911600708961487, -0.3711610734462738, -0.3511620759963989, -0.33116307854652405, -0.31116408109664917, -0.2911651134490967, -0.2711661159992218, -0.2511671185493469, -0.23116812109947205, -0.21116912364959717, -0.1911701261997223, -0.1711711436510086, -0.15117214620113373, -0.13117314875125885, -0.11117415875196457, -0.09117516875267029, -0.07117623090744019, -0.051177237182855606, -0.031178243458271027, -0.011179249733686447, 0.008819743990898132, 0.02881874144077301, 0.04881773144006729, 0.06881672143936157, 0.08881571888923645, 0.10881471633911133, 0.1288137137889862, 0.1488126963376999, 0.16881169378757477, 0.18881069123744965, 0.20880967378616333, 0.2288086712360382, 0.24880766868591309, 0.26880666613578796, 0.28880566358566284, 0.3088046610355377, 0.3288036584854126, 0.3488026261329651, 0.36880162358283997, 0.38880062103271484, 0.4087996184825897, 0.4287986159324646, 0.4487976133823395, 0.46879661083221436, 0.48879557847976685, 0.5087946057319641, 0.5287935733795166, 0.5487926006317139, 0.5687915682792664]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 7.0, 7.0, 14.0, 23.0, 13.0, 14.0, 23.0, 22.0, 33.0, 30.0, 33.0, 32.0, 38.0, 48.0, 55.0, 51.0, 52.0, 51.0, 43.0, 39.0, 35.0, 51.0, 43.0, 30.0, 22.0, 26.0, 33.0, 23.0, 14.0, 23.0, 16.0, 5.0, 8.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5663232207298279, -0.549354076385498, -0.5323849320411682, -0.5154157876968384, -0.49844664335250854, -0.4814774990081787, -0.4645083248615265, -0.44753918051719666, -0.4305700361728668, -0.413600891828537, -0.39663174748420715, -0.3796626031398773, -0.3626934289932251, -0.34572428464889526, -0.32875514030456543, -0.3117859959602356, -0.29481685161590576, -0.2778477072715759, -0.2608785629272461, -0.24390940368175507, -0.22694025933742523, -0.2099711149930954, -0.19300195574760437, -0.17603281140327454, -0.1590636670589447, -0.14209452271461487, -0.12512537837028503, -0.108156219124794, -0.09118707478046417, -0.07421793043613434, -0.05724877864122391, -0.04027962684631348, -0.023310542106628418, -0.0063413940370082855, 0.010627754032611847, 0.02759690210223198, 0.04456605017185211, 0.061535194516181946, 0.07850434631109238, 0.09547349810600281, 0.11244264245033264, 0.12941178679466248, 0.1463809311389923, 0.16335009038448334, 0.18031923472881317, 0.197288379073143, 0.21425753831863403, 0.23122668266296387, 0.2481958270072937, 0.26516497135162354, 0.28213411569595337, 0.2991032600402832, 0.31607240438461304, 0.33304154872894287, 0.3500107228755951, 0.3669798672199249, 0.38394901156425476, 0.4009181559085846, 0.41788730025291443, 0.43485644459724426, 0.4518256187438965, 0.4687947630882263, 0.48576390743255615, 0.502733051776886, 0.5197021961212158]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 13.0, 15.0, 26.0, 30.0, 36.0, 39.0, 74.0, 81.0, 136.0, 167.0, 334.0, 537.0, 918.0, 1466.0, 2610.0, 4912.0, 12233.0, 65680.0, 532870.0, 366607.0, 40356.0, 9404.0, 4337.0, 2280.0, 1260.0, 737.0, 431.0, 263.0, 193.0, 134.0, 84.0, 74.0, 51.0, 31.0, 20.0, 20.0, 17.0, 19.0, 10.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.18768882751464844, -0.18140792846679688, -0.1751270294189453, -0.16884613037109375, -0.1625652313232422, -0.15628433227539062, -0.15000343322753906, -0.1437225341796875, -0.13744163513183594, -0.13116073608398438, -0.12487983703613281, -0.11859893798828125, -0.11231803894042969, -0.10603713989257812, -0.09975624084472656, -0.093475341796875, -0.08719444274902344, -0.08091354370117188, -0.07463264465332031, -0.06835174560546875, -0.06207084655761719, -0.055789947509765625, -0.04950904846191406, -0.0432281494140625, -0.03694725036621094, -0.030666351318359375, -0.024385452270507812, -0.01810455322265625, -0.011823654174804688, -0.005542755126953125, 0.0007381439208984375, 0.00701904296875, 0.013299942016601562, 0.019580841064453125, 0.025861740112304688, 0.03214263916015625, 0.03842353820800781, 0.044704437255859375, 0.05098533630371094, 0.0572662353515625, 0.06354713439941406, 0.06982803344726562, 0.07610893249511719, 0.08238983154296875, 0.08867073059082031, 0.09495162963867188, 0.10123252868652344, 0.107513427734375, 0.11379432678222656, 0.12007522583007812, 0.1263561248779297, 0.13263702392578125, 0.1389179229736328, 0.14519882202148438, 0.15147972106933594, 0.1577606201171875, 0.16404151916503906, 0.17032241821289062, 0.1766033172607422, 0.18288421630859375, 0.1891651153564453, 0.19544601440429688, 0.20172691345214844, 0.2080078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 5.0, 8.0, 12.0, 14.0, 15.0, 14.0, 19.0, 22.0, 28.0, 27.0, 34.0, 28.0, 32.0, 37.0, 43.0, 41.0, 41.0, 35.0, 54.0, 38.0, 38.0, 45.0, 41.0, 43.0, 35.0, 35.0, 26.0, 24.0, 18.0, 18.0, 27.0, 14.0, 16.0, 14.0, 5.0, 6.0, 4.0, 2.0, 4.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.3271484375, -0.3172607421875, -0.307373046875, -0.2974853515625, -0.28759765625, -0.2777099609375, -0.267822265625, -0.2579345703125, -0.248046875, -0.2381591796875, -0.228271484375, -0.2183837890625, -0.20849609375, -0.1986083984375, -0.188720703125, -0.1788330078125, -0.1689453125, -0.1590576171875, -0.149169921875, -0.1392822265625, -0.12939453125, -0.1195068359375, -0.109619140625, -0.0997314453125, -0.08984375, -0.0799560546875, -0.070068359375, -0.0601806640625, -0.05029296875, -0.0404052734375, -0.030517578125, -0.0206298828125, -0.0107421875, -0.0008544921875, 0.009033203125, 0.0189208984375, 0.02880859375, 0.0386962890625, 0.048583984375, 0.0584716796875, 0.068359375, 0.0782470703125, 0.088134765625, 0.0980224609375, 0.10791015625, 0.1177978515625, 0.127685546875, 0.1375732421875, 0.1474609375, 0.1573486328125, 0.167236328125, 0.1771240234375, 0.18701171875, 0.1968994140625, 0.206787109375, 0.2166748046875, 0.2265625, 0.2364501953125, 0.246337890625, 0.2562255859375, 0.26611328125, 0.2760009765625, 0.285888671875, 0.2957763671875, 0.3056640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 16.0, 25.0, 42.0, 61.0, 102.0, 224.0, 392.0, 818.0, 1873.0, 4851.0, 19584.0, 226327.0, 698008.0, 79718.0, 10418.0, 3403.0, 1291.0, 631.0, 309.0, 169.0, 108.0, 60.0, 34.0, 31.0, 14.0, 3.0, 6.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215576171875, -0.208221435546875, -0.20086669921875, -0.193511962890625, -0.1861572265625, -0.178802490234375, -0.17144775390625, -0.164093017578125, -0.15673828125, -0.149383544921875, -0.14202880859375, -0.134674072265625, -0.1273193359375, -0.119964599609375, -0.11260986328125, -0.105255126953125, -0.097900390625, -0.090545654296875, -0.08319091796875, -0.075836181640625, -0.0684814453125, -0.061126708984375, -0.05377197265625, -0.046417236328125, -0.0390625, -0.031707763671875, -0.02435302734375, -0.016998291015625, -0.0096435546875, -0.002288818359375, 0.00506591796875, 0.012420654296875, 0.019775390625, 0.027130126953125, 0.03448486328125, 0.041839599609375, 0.0491943359375, 0.056549072265625, 0.06390380859375, 0.071258544921875, 0.07861328125, 0.085968017578125, 0.09332275390625, 0.100677490234375, 0.1080322265625, 0.115386962890625, 0.12274169921875, 0.130096435546875, 0.137451171875, 0.144805908203125, 0.15216064453125, 0.159515380859375, 0.1668701171875, 0.174224853515625, 0.18157958984375, 0.188934326171875, 0.1962890625, 0.203643798828125, 0.21099853515625, 0.218353271484375, 0.2257080078125, 0.233062744140625, 0.24041748046875, 0.247772216796875, 0.255126953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 7.0, 13.0, 7.0, 9.0, 11.0, 12.0, 10.0, 19.0, 26.0, 30.0, 26.0, 36.0, 30.0, 28.0, 41.0, 42.0, 39.0, 42.0, 47.0, 47.0, 54.0, 54.0, 56.0, 39.0, 30.0, 28.0, 28.0, 27.0, 21.0, 19.0, 22.0, 19.0, 11.0, 14.0, 16.0, 6.0, 3.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8349609375, -0.8071136474609375, -0.779266357421875, -0.7514190673828125, -0.72357177734375, -0.6957244873046875, -0.667877197265625, -0.6400299072265625, -0.6121826171875, -0.5843353271484375, -0.556488037109375, -0.5286407470703125, -0.50079345703125, -0.4729461669921875, -0.445098876953125, -0.4172515869140625, -0.389404296875, -0.3615570068359375, -0.333709716796875, -0.3058624267578125, -0.27801513671875, -0.2501678466796875, -0.222320556640625, -0.1944732666015625, -0.1666259765625, -0.1387786865234375, -0.110931396484375, -0.0830841064453125, -0.05523681640625, -0.0273895263671875, 0.000457763671875, 0.0283050537109375, 0.05615234375, 0.0839996337890625, 0.111846923828125, 0.1396942138671875, 0.16754150390625, 0.1953887939453125, 0.223236083984375, 0.2510833740234375, 0.2789306640625, 0.3067779541015625, 0.334625244140625, 0.3624725341796875, 0.39031982421875, 0.4181671142578125, 0.446014404296875, 0.4738616943359375, 0.501708984375, 0.5295562744140625, 0.557403564453125, 0.5852508544921875, 0.61309814453125, 0.6409454345703125, 0.668792724609375, 0.6966400146484375, 0.7244873046875, 0.7523345947265625, 0.780181884765625, 0.8080291748046875, 0.83587646484375, 0.8637237548828125, 0.891571044921875, 0.9194183349609375, 0.947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 11.0, 14.0, 14.0, 17.0, 28.0, 38.0, 47.0, 86.0, 121.0, 178.0, 342.0, 498.0, 957.0, 1963.0, 4458.0, 11812.0, 49729.0, 466734.0, 444244.0, 47132.0, 11520.0, 4412.0, 1907.0, 942.0, 490.0, 293.0, 190.0, 127.0, 61.0, 57.0, 35.0, 19.0, 21.0, 17.0, 7.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1080322265625, -0.10454559326171875, -0.1010589599609375, -0.09757232666015625, -0.094085693359375, -0.09059906005859375, -0.0871124267578125, -0.08362579345703125, -0.08013916015625, -0.07665252685546875, -0.0731658935546875, -0.06967926025390625, -0.066192626953125, -0.06270599365234375, -0.0592193603515625, -0.05573272705078125, -0.05224609375, -0.04875946044921875, -0.0452728271484375, -0.04178619384765625, -0.038299560546875, -0.03481292724609375, -0.0313262939453125, -0.02783966064453125, -0.02435302734375, -0.02086639404296875, -0.0173797607421875, -0.01389312744140625, -0.010406494140625, -0.00691986083984375, -0.0034332275390625, 5.340576171875e-05, 0.0035400390625, 0.00702667236328125, 0.0105133056640625, 0.01399993896484375, 0.017486572265625, 0.02097320556640625, 0.0244598388671875, 0.02794647216796875, 0.03143310546875, 0.03491973876953125, 0.0384063720703125, 0.04189300537109375, 0.045379638671875, 0.04886627197265625, 0.0523529052734375, 0.05583953857421875, 0.059326171875, 0.06281280517578125, 0.0662994384765625, 0.06978607177734375, 0.073272705078125, 0.07675933837890625, 0.0802459716796875, 0.08373260498046875, 0.08721923828125, 0.09070587158203125, 0.0941925048828125, 0.09767913818359375, 0.101165771484375, 0.10465240478515625, 0.1081390380859375, 0.11162567138671875, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 4.0, 10.0, 7.0, 12.0, 33.0, 55.0, 75.0, 92.0, 150.0, 124.0, 131.0, 97.0, 62.0, 39.0, 17.0, 19.0, 13.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.510713577270508e-05, -3.381911665201187e-05, -3.2531097531318665e-05, -3.124307841062546e-05, -2.995505928993225e-05, -2.8667040169239044e-05, -2.7379021048545837e-05, -2.609100192785263e-05, -2.4802982807159424e-05, -2.3514963686466217e-05, -2.222694456577301e-05, -2.0938925445079803e-05, -1.9650906324386597e-05, -1.836288720369339e-05, -1.7074868083000183e-05, -1.5786848962306976e-05, -1.449882984161377e-05, -1.3210810720920563e-05, -1.1922791600227356e-05, -1.063477247953415e-05, -9.346753358840942e-06, -8.058734238147736e-06, -6.770715117454529e-06, -5.482695996761322e-06, -4.194676876068115e-06, -2.9066577553749084e-06, -1.6186386346817017e-06, -3.3061951398849487e-07, 9.57399606704712e-07, 2.2454187273979187e-06, 3.5334378480911255e-06, 4.821456968784332e-06, 6.109476089477539e-06, 7.397495210170746e-06, 8.685514330863953e-06, 9.97353345155716e-06, 1.1261552572250366e-05, 1.2549571692943573e-05, 1.383759081363678e-05, 1.5125609934329987e-05, 1.6413629055023193e-05, 1.77016481757164e-05, 1.8989667296409607e-05, 2.0277686417102814e-05, 2.156570553779602e-05, 2.2853724658489227e-05, 2.4141743779182434e-05, 2.542976289987564e-05, 2.6717782020568848e-05, 2.8005801141262054e-05, 2.929382026195526e-05, 3.058183938264847e-05, 3.1869858503341675e-05, 3.315787762403488e-05, 3.444589674472809e-05, 3.5733915865421295e-05, 3.70219349861145e-05, 3.830995410680771e-05, 3.9597973227500916e-05, 4.088599234819412e-05, 4.217401146888733e-05, 4.3462030589580536e-05, 4.475004971027374e-05, 4.603806883096695e-05, 4.7326087951660156e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 13.0, 15.0, 32.0, 34.0, 49.0, 85.0, 158.0, 252.0, 463.0, 825.0, 1501.0, 2757.0, 5378.0, 11221.0, 28845.0, 108549.0, 406893.0, 350647.0, 85844.0, 24694.0, 9802.0, 4649.0, 2492.0, 1410.0, 768.0, 446.0, 287.0, 157.0, 91.0, 57.0, 35.0, 22.0, 13.0, 7.0, 15.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07275390625, -0.07060909271240234, -0.06846427917480469, -0.06631946563720703, -0.06417465209960938, -0.06202983856201172, -0.05988502502441406, -0.057740211486816406, -0.05559539794921875, -0.053450584411621094, -0.05130577087402344, -0.04916095733642578, -0.047016143798828125, -0.04487133026123047, -0.04272651672363281, -0.040581703186035156, -0.0384368896484375, -0.036292076110839844, -0.03414726257324219, -0.03200244903564453, -0.029857635498046875, -0.02771282196044922, -0.025568008422851562, -0.023423194885253906, -0.02127838134765625, -0.019133567810058594, -0.016988754272460938, -0.014843940734863281, -0.012699127197265625, -0.010554313659667969, -0.008409500122070312, -0.006264686584472656, -0.004119873046875, -0.0019750595092773438, 0.0001697540283203125, 0.0023145675659179688, 0.004459381103515625, 0.006604194641113281, 0.008749008178710938, 0.010893821716308594, 0.01303863525390625, 0.015183448791503906, 0.017328262329101562, 0.01947307586669922, 0.021617889404296875, 0.02376270294189453, 0.025907516479492188, 0.028052330017089844, 0.0301971435546875, 0.032341957092285156, 0.03448677062988281, 0.03663158416748047, 0.038776397705078125, 0.04092121124267578, 0.04306602478027344, 0.045210838317871094, 0.04735565185546875, 0.049500465393066406, 0.05164527893066406, 0.05379009246826172, 0.055934906005859375, 0.05807971954345703, 0.06022453308105469, 0.062369346618652344, 0.06451416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 9.0, 11.0, 10.0, 21.0, 21.0, 29.0, 67.0, 84.0, 114.0, 135.0, 120.0, 104.0, 75.0, 45.0, 37.0, 27.0, 14.0, 5.0, 17.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.0285952091217041, -0.027634143829345703, -0.026673078536987305, -0.025712013244628906, -0.024750947952270508, -0.02378988265991211, -0.02282881736755371, -0.021867752075195312, -0.020906686782836914, -0.019945621490478516, -0.018984556198120117, -0.01802349090576172, -0.01706242561340332, -0.016101360321044922, -0.015140295028686523, -0.014179229736328125, -0.013218164443969727, -0.012257099151611328, -0.01129603385925293, -0.010334968566894531, -0.009373903274536133, -0.008412837982177734, -0.007451772689819336, -0.0064907073974609375, -0.005529642105102539, -0.004568576812744141, -0.003607511520385742, -0.0026464462280273438, -0.0016853809356689453, -0.0007243156433105469, 0.00023674964904785156, 0.00119781494140625, 0.0021588802337646484, 0.003119945526123047, 0.004081010818481445, 0.005042076110839844, 0.006003141403198242, 0.006964206695556641, 0.007925271987915039, 0.008886337280273438, 0.009847402572631836, 0.010808467864990234, 0.011769533157348633, 0.012730598449707031, 0.01369166374206543, 0.014652729034423828, 0.015613794326782227, 0.016574859619140625, 0.017535924911499023, 0.018496990203857422, 0.01945805549621582, 0.02041912078857422, 0.021380186080932617, 0.022341251373291016, 0.023302316665649414, 0.024263381958007812, 0.02522444725036621, 0.02618551254272461, 0.027146577835083008, 0.028107643127441406, 0.029068708419799805, 0.030029773712158203, 0.0309908390045166, 0.031951904296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 8.0, 4.0, 5.0, 9.0, 11.0, 22.0, 24.0, 30.0, 27.0, 58.0, 44.0, 58.0, 58.0, 60.0, 79.0, 83.0, 64.0, 68.0, 55.0, 63.0, 40.0, 31.0, 39.0, 20.0, 15.0, 7.0, 11.0, 7.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49564194679260254, -0.4810281991958618, -0.4664144515991211, -0.45180070400238037, -0.43718698620796204, -0.4225732386112213, -0.4079594910144806, -0.39334574341773987, -0.37873199582099915, -0.3641182482242584, -0.3495045006275177, -0.33489078283309937, -0.32027703523635864, -0.3056632876396179, -0.2910495400428772, -0.2764357924461365, -0.26182204484939575, -0.24720829725265503, -0.2325945645570755, -0.21798081696033478, -0.20336706936359406, -0.18875333666801453, -0.1741395890712738, -0.15952584147453308, -0.14491212368011475, -0.13029837608337402, -0.1156846359372139, -0.10107089579105377, -0.08645714819431305, -0.07184340804815292, -0.0572296679019928, -0.042615920305252075, -0.028002172708511353, -0.013388429768383503, 0.0012253131717443466, 0.01583905518054962, 0.030452799052000046, 0.04506654292345047, 0.059680283069610596, 0.07429403066635132, 0.08890777081251144, 0.10352151095867157, 0.11813525855541229, 0.13274899125099182, 0.14736273884773254, 0.16197648644447327, 0.176590234041214, 0.1912039816379547, 0.20581771433353424, 0.22043146193027496, 0.2350451946258545, 0.24965894222259521, 0.26427268981933594, 0.27888643741607666, 0.2935001850128174, 0.3081139326095581, 0.32272765040397644, 0.33734139800071716, 0.3519551455974579, 0.3665688633918762, 0.38118261098861694, 0.39579635858535767, 0.4104101061820984, 0.4250238537788391, 0.43963760137557983]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 5.0, 8.0, 10.0, 10.0, 11.0, 18.0, 13.0, 21.0, 33.0, 27.0, 30.0, 41.0, 26.0, 46.0, 45.0, 48.0, 54.0, 53.0, 54.0, 50.0, 50.0, 35.0, 36.0, 38.0, 33.0, 25.0, 32.0, 16.0, 20.0, 29.0, 10.0, 11.0, 9.0, 10.0, 10.0, 3.0, 2.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.3357851505279541, -0.32553255558013916, -0.3152799606323242, -0.30502739548683167, -0.2947748005390167, -0.2845222055912018, -0.27426961064338684, -0.2640170156955719, -0.25376445055007935, -0.2435118556022644, -0.23325927555561066, -0.22300668060779572, -0.21275410056114197, -0.20250150561332703, -0.19224891066551208, -0.18199631571769714, -0.1717437207698822, -0.16149112582206726, -0.1512385457754135, -0.14098595082759857, -0.13073337078094482, -0.12048077583312988, -0.11022818088531494, -0.0999755933880806, -0.08972300589084625, -0.07947041839361191, -0.06921783089637756, -0.05896523594856262, -0.04871264845132828, -0.03846006095409393, -0.02820746973156929, -0.017954878509044647, -0.007702291011810303, 0.002550298348069191, 0.012802887707948685, 0.02305547706782818, 0.03330806642770767, 0.04356065392494202, 0.05381324514746666, 0.0640658363699913, 0.07431842386722565, 0.08457101136445999, 0.09482359886169434, 0.10507619380950928, 0.11532878130674362, 0.12558136880397797, 0.1358339637517929, 0.14608654379844666, 0.1563391387462616, 0.16659173369407654, 0.17684431374073029, 0.18709690868854523, 0.19734948873519897, 0.20760208368301392, 0.21785467863082886, 0.2281072735786438, 0.23835985362529755, 0.2486124485731125, 0.25886502861976624, 0.2691176235675812, 0.2793702185153961, 0.28962278366088867, 0.2998753786087036, 0.31012797355651855, 0.3203805685043335]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 10.0, 29.0, 30.0, 51.0, 87.0, 104.0, 156.0, 355.0, 559.0, 1073.0, 2070.0, 4422.0, 9875.0, 22534.0, 54019.0, 153354.0, 424413.0, 242136.0, 77249.0, 31026.0, 13118.0, 5911.0, 2846.0, 1427.0, 676.0, 412.0, 226.0, 144.0, 94.0, 58.0, 35.0, 14.0, 7.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.51959228515625, -0.5001220703125, -0.48065185546875, -0.461181640625, -0.44171142578125, -0.4222412109375, -0.40277099609375, -0.38330078125, -0.36383056640625, -0.3443603515625, -0.32489013671875, -0.305419921875, -0.28594970703125, -0.2664794921875, -0.24700927734375, -0.2275390625, -0.20806884765625, -0.1885986328125, -0.16912841796875, -0.149658203125, -0.13018798828125, -0.1107177734375, -0.09124755859375, -0.07177734375, -0.05230712890625, -0.0328369140625, -0.01336669921875, 0.006103515625, 0.02557373046875, 0.0450439453125, 0.06451416015625, 0.083984375, 0.10345458984375, 0.1229248046875, 0.14239501953125, 0.161865234375, 0.18133544921875, 0.2008056640625, 0.22027587890625, 0.23974609375, 0.25921630859375, 0.2786865234375, 0.29815673828125, 0.317626953125, 0.33709716796875, 0.3565673828125, 0.37603759765625, 0.3955078125, 0.41497802734375, 0.4344482421875, 0.45391845703125, 0.473388671875, 0.49285888671875, 0.5123291015625, 0.53179931640625, 0.55126953125, 0.57073974609375, 0.5902099609375, 0.60968017578125, 0.629150390625, 0.64862060546875, 0.6680908203125, 0.68756103515625, 0.70703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 19.0, 17.0, 15.0, 20.0, 31.0, 35.0, 29.0, 25.0, 52.0, 41.0, 42.0, 53.0, 52.0, 54.0, 45.0, 57.0, 47.0, 31.0, 35.0, 24.0, 35.0, 22.0, 18.0, 21.0, 19.0, 25.0, 13.0, 19.0, 8.0, 8.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49764251708984375, -0.4811248779296875, -0.46460723876953125, -0.448089599609375, -0.43157196044921875, -0.4150543212890625, -0.39853668212890625, -0.38201904296875, -0.36550140380859375, -0.3489837646484375, -0.33246612548828125, -0.315948486328125, -0.29943084716796875, -0.2829132080078125, -0.26639556884765625, -0.2498779296875, -0.23336029052734375, -0.2168426513671875, -0.20032501220703125, -0.183807373046875, -0.16728973388671875, -0.1507720947265625, -0.13425445556640625, -0.11773681640625, -0.10121917724609375, -0.0847015380859375, -0.06818389892578125, -0.051666259765625, -0.03514862060546875, -0.0186309814453125, -0.00211334228515625, 0.014404296875, 0.03092193603515625, 0.0474395751953125, 0.06395721435546875, 0.080474853515625, 0.09699249267578125, 0.1135101318359375, 0.13002777099609375, 0.14654541015625, 0.16306304931640625, 0.1795806884765625, 0.19609832763671875, 0.212615966796875, 0.22913360595703125, 0.2456512451171875, 0.26216888427734375, 0.2786865234375, 0.29520416259765625, 0.3117218017578125, 0.32823944091796875, 0.344757080078125, 0.36127471923828125, 0.3777923583984375, 0.39430999755859375, 0.41082763671875, 0.42734527587890625, 0.4438629150390625, 0.46038055419921875, 0.476898193359375, 0.49341583251953125, 0.5099334716796875, 0.5264511108398438, 0.54296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 9.0, 14.0, 17.0, 23.0, 43.0, 46.0, 72.0, 106.0, 133.0, 152.0, 261.0, 403.0, 607.0, 1085.0, 2103.0, 4222.0, 9244.0, 22099.0, 54137.0, 158423.0, 429438.0, 237535.0, 75421.0, 29060.0, 12339.0, 5484.0, 2541.0, 1318.0, 765.0, 460.0, 263.0, 212.0, 143.0, 103.0, 68.0, 55.0, 37.0, 26.0, 16.0, 24.0, 14.0, 8.0, 4.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6763916015625, -0.655029296875, -0.6336669921875, -0.6123046875, -0.5909423828125, -0.569580078125, -0.5482177734375, -0.52685546875, -0.5054931640625, -0.484130859375, -0.4627685546875, -0.44140625, -0.4200439453125, -0.398681640625, -0.3773193359375, -0.35595703125, -0.3345947265625, -0.313232421875, -0.2918701171875, -0.2705078125, -0.2491455078125, -0.227783203125, -0.2064208984375, -0.18505859375, -0.1636962890625, -0.142333984375, -0.1209716796875, -0.099609375, -0.0782470703125, -0.056884765625, -0.0355224609375, -0.01416015625, 0.0072021484375, 0.028564453125, 0.0499267578125, 0.0712890625, 0.0926513671875, 0.114013671875, 0.1353759765625, 0.15673828125, 0.1781005859375, 0.199462890625, 0.2208251953125, 0.2421875, 0.2635498046875, 0.284912109375, 0.3062744140625, 0.32763671875, 0.3489990234375, 0.370361328125, 0.3917236328125, 0.4130859375, 0.4344482421875, 0.455810546875, 0.4771728515625, 0.49853515625, 0.5198974609375, 0.541259765625, 0.5626220703125, 0.583984375, 0.6053466796875, 0.626708984375, 0.6480712890625, 0.66943359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 12.0, 16.0, 17.0, 19.0, 21.0, 36.0, 42.0, 25.0, 34.0, 53.0, 50.0, 57.0, 43.0, 56.0, 57.0, 41.0, 55.0, 49.0, 35.0, 35.0, 33.0, 28.0, 23.0, 20.0, 20.0, 12.0, 9.0, 18.0, 9.0, 13.0, 6.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5658340454101562, -0.5462188720703125, -0.5266036987304688, -0.506988525390625, -0.48737335205078125, -0.4677581787109375, -0.44814300537109375, -0.42852783203125, -0.40891265869140625, -0.3892974853515625, -0.36968231201171875, -0.350067138671875, -0.33045196533203125, -0.3108367919921875, -0.29122161865234375, -0.2716064453125, -0.25199127197265625, -0.2323760986328125, -0.21276092529296875, -0.193145751953125, -0.17353057861328125, -0.1539154052734375, -0.13430023193359375, -0.11468505859375, -0.09506988525390625, -0.0754547119140625, -0.05583953857421875, -0.036224365234375, -0.01660919189453125, 0.0030059814453125, 0.02262115478515625, 0.042236328125, 0.06185150146484375, 0.0814666748046875, 0.10108184814453125, 0.120697021484375, 0.14031219482421875, 0.1599273681640625, 0.17954254150390625, 0.19915771484375, 0.21877288818359375, 0.2383880615234375, 0.25800323486328125, 0.277618408203125, 0.29723358154296875, 0.3168487548828125, 0.33646392822265625, 0.3560791015625, 0.37569427490234375, 0.3953094482421875, 0.41492462158203125, 0.434539794921875, 0.45415496826171875, 0.4737701416015625, 0.49338531494140625, 0.51300048828125, 0.5326156616210938, 0.5522308349609375, 0.5718460083007812, 0.591461181640625, 0.6110763549804688, 0.6306915283203125, 0.6503067016601562, 0.669921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 13.0, 11.0, 15.0, 29.0, 50.0, 81.0, 140.0, 249.0, 427.0, 824.0, 1544.0, 3109.0, 6988.0, 18253.0, 65122.0, 325906.0, 491880.0, 94222.0, 23606.0, 8499.0, 3699.0, 1740.0, 895.0, 492.0, 299.0, 172.0, 116.0, 55.0, 35.0, 22.0, 22.0, 10.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.1600780487060547, -0.15438461303710938, -0.14869117736816406, -0.14299774169921875, -0.13730430603027344, -0.13161087036132812, -0.1259174346923828, -0.1202239990234375, -0.11453056335449219, -0.10883712768554688, -0.10314369201660156, -0.09745025634765625, -0.09175682067871094, -0.08606338500976562, -0.08036994934082031, -0.074676513671875, -0.06898307800292969, -0.06328964233398438, -0.05759620666503906, -0.05190277099609375, -0.04620933532714844, -0.040515899658203125, -0.03482246398925781, -0.0291290283203125, -0.023435592651367188, -0.017742156982421875, -0.012048721313476562, -0.00635528564453125, -0.0006618499755859375, 0.005031585693359375, 0.010725021362304688, 0.01641845703125, 0.022111892700195312, 0.027805328369140625, 0.03349876403808594, 0.03919219970703125, 0.04488563537597656, 0.050579071044921875, 0.05627250671386719, 0.0619659423828125, 0.06765937805175781, 0.07335281372070312, 0.07904624938964844, 0.08473968505859375, 0.09043312072753906, 0.09612655639648438, 0.10181999206542969, 0.107513427734375, 0.11320686340332031, 0.11890029907226562, 0.12459373474121094, 0.13028717041015625, 0.13598060607910156, 0.14167404174804688, 0.1473674774169922, 0.1530609130859375, 0.1587543487548828, 0.16444778442382812, 0.17014122009277344, 0.17583465576171875, 0.18152809143066406, 0.18722152709960938, 0.1929149627685547, 0.1986083984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 12.0, 13.0, 22.0, 30.0, 21.0, 35.0, 35.0, 57.0, 64.0, 73.0, 139.0, 76.0, 77.0, 73.0, 52.0, 34.0, 29.0, 25.0, 25.0, 21.0, 14.0, 8.0, 6.0, 9.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.8673017621040344e-05, -1.7855316400527954e-05, -1.7037615180015564e-05, -1.6219913959503174e-05, -1.5402212738990784e-05, -1.4584511518478394e-05, -1.3766810297966003e-05, -1.2949109077453613e-05, -1.2131407856941223e-05, -1.1313706636428833e-05, -1.0496005415916443e-05, -9.678304195404053e-06, -8.860602974891663e-06, -8.042901754379272e-06, -7.225200533866882e-06, -6.407499313354492e-06, -5.589798092842102e-06, -4.772096872329712e-06, -3.954395651817322e-06, -3.1366944313049316e-06, -2.3189932107925415e-06, -1.5012919902801514e-06, -6.835907697677612e-07, 1.341104507446289e-07, 9.51811671257019e-07, 1.7695128917694092e-06, 2.5872141122817993e-06, 3.4049153327941895e-06, 4.22261655330658e-06, 5.04031777381897e-06, 5.85801899433136e-06, 6.67572021484375e-06, 7.49342143535614e-06, 8.31112265586853e-06, 9.12882387638092e-06, 9.94652509689331e-06, 1.07642263174057e-05, 1.158192753791809e-05, 1.2399628758430481e-05, 1.3217329978942871e-05, 1.4035031199455261e-05, 1.4852732419967651e-05, 1.567043364048004e-05, 1.648813486099243e-05, 1.7305836081504822e-05, 1.8123537302017212e-05, 1.8941238522529602e-05, 1.9758939743041992e-05, 2.0576640963554382e-05, 2.1394342184066772e-05, 2.2212043404579163e-05, 2.3029744625091553e-05, 2.3847445845603943e-05, 2.4665147066116333e-05, 2.5482848286628723e-05, 2.6300549507141113e-05, 2.7118250727653503e-05, 2.7935951948165894e-05, 2.8753653168678284e-05, 2.9571354389190674e-05, 3.0389055609703064e-05, 3.1206756830215454e-05, 3.2024458050727844e-05, 3.2842159271240234e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 17.0, 33.0, 38.0, 40.0, 83.0, 100.0, 156.0, 248.0, 320.0, 540.0, 1006.0, 1767.0, 3365.0, 7130.0, 18128.0, 73148.0, 535458.0, 329890.0, 50254.0, 14193.0, 5845.0, 2928.0, 1493.0, 864.0, 514.0, 294.0, 206.0, 150.0, 109.0, 51.0, 49.0, 38.0, 25.0, 16.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263916015625, -0.25537109375, -0.246826171875, -0.23828125, -0.229736328125, -0.22119140625, -0.212646484375, -0.2041015625, -0.195556640625, -0.18701171875, -0.178466796875, -0.169921875, -0.161376953125, -0.15283203125, -0.144287109375, -0.1357421875, -0.127197265625, -0.11865234375, -0.110107421875, -0.1015625, -0.093017578125, -0.08447265625, -0.075927734375, -0.0673828125, -0.058837890625, -0.05029296875, -0.041748046875, -0.033203125, -0.024658203125, -0.01611328125, -0.007568359375, 0.0009765625, 0.009521484375, 0.01806640625, 0.026611328125, 0.03515625, 0.043701171875, 0.05224609375, 0.060791015625, 0.0693359375, 0.077880859375, 0.08642578125, 0.094970703125, 0.103515625, 0.112060546875, 0.12060546875, 0.129150390625, 0.1376953125, 0.146240234375, 0.15478515625, 0.163330078125, 0.171875, 0.180419921875, 0.18896484375, 0.197509765625, 0.2060546875, 0.214599609375, 0.22314453125, 0.231689453125, 0.240234375, 0.248779296875, 0.25732421875, 0.265869140625, 0.2744140625, 0.282958984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 7.0, 20.0, 29.0, 26.0, 64.0, 62.0, 117.0, 208.0, 120.0, 102.0, 74.0, 50.0, 29.0, 22.0, 11.0, 7.0, 6.0, 8.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1729736328125, -0.1682720184326172, -0.16357040405273438, -0.15886878967285156, -0.15416717529296875, -0.14946556091308594, -0.14476394653320312, -0.1400623321533203, -0.1353607177734375, -0.1306591033935547, -0.12595748901367188, -0.12125587463378906, -0.11655426025390625, -0.11185264587402344, -0.10715103149414062, -0.10244941711425781, -0.097747802734375, -0.09304618835449219, -0.08834457397460938, -0.08364295959472656, -0.07894134521484375, -0.07423973083496094, -0.06953811645507812, -0.06483650207519531, -0.0601348876953125, -0.05543327331542969, -0.050731658935546875, -0.04603004455566406, -0.04132843017578125, -0.03662681579589844, -0.031925201416015625, -0.027223587036132812, -0.02252197265625, -0.017820358276367188, -0.013118743896484375, -0.008417129516601562, -0.00371551513671875, 0.0009860992431640625, 0.005687713623046875, 0.010389328002929688, 0.0150909423828125, 0.019792556762695312, 0.024494171142578125, 0.029195785522460938, 0.03389739990234375, 0.03859901428222656, 0.043300628662109375, 0.04800224304199219, 0.052703857421875, 0.05740547180175781, 0.062107086181640625, 0.06680870056152344, 0.07151031494140625, 0.07621192932128906, 0.08091354370117188, 0.08561515808105469, 0.0903167724609375, 0.09501838684082031, 0.09972000122070312, 0.10442161560058594, 0.10912322998046875, 0.11382484436035156, 0.11852645874023438, 0.12322807312011719, 0.1279296875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 16.0, 28.0, 116.0, 166.0, 237.0, 200.0, 128.0, 68.0, 22.0, 8.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.209085941314697, -4.1206746101379395, -4.032263278961182, -3.943851947784424, -3.855440855026245, -3.7670295238494873, -3.6786181926727295, -3.5902068614959717, -3.501795530319214, -3.413384199142456, -3.3249728679656982, -3.2365617752075195, -3.1481504440307617, -3.059739112854004, -2.971327781677246, -2.8829164505004883, -2.7945051193237305, -2.7060937881469727, -2.617682456970215, -2.529271125793457, -2.4408600330352783, -2.3524487018585205, -2.2640373706817627, -2.175626039505005, -2.087214946746826, -1.9988036155700684, -1.9103924036026, -1.8219810724258423, -1.7335697412490845, -1.6451585292816162, -1.5567471981048584, -1.4683358669281006, -1.3799244165420532, -1.2915130853652954, -1.2031018733978271, -1.1146905422210693, -1.0262792110443115, -0.9378679394721985, -0.8494566679000854, -0.7610453367233276, -0.6726340651512146, -0.5842227935791016, -0.49581146240234375, -0.4074001908302307, -0.3189888894557953, -0.23057758808135986, -0.14216631650924683, -0.053754985332489014, 0.03465628623962402, 0.12306758016347885, 0.21147887408733368, 0.2998901605606079, 0.38830146193504333, 0.47671276330947876, 0.5651240348815918, 0.6535353660583496, 0.7419466376304626, 0.8303579092025757, 0.9187692403793335, 1.0071804523468018, 1.0955917835235596, 1.1840031147003174, 1.2724144458770752, 1.360825777053833, 1.4492369890213013]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 15.0, 9.0, 12.0, 15.0, 14.0, 12.0, 12.0, 17.0, 20.0, 30.0, 27.0, 30.0, 36.0, 38.0, 52.0, 54.0, 37.0, 32.0, 46.0, 54.0, 39.0, 47.0, 40.0, 41.0, 32.0, 36.0, 32.0, 27.0, 17.0, 18.0, 17.0, 13.0, 15.0, 13.0, 6.0, 9.0, 5.0, 6.0, 2.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0428986549377441, -1.0138063430786133, -0.9847139716148376, -0.9556216597557068, -0.9265292882919312, -0.8974369764328003, -0.8683446645736694, -0.8392523527145386, -0.8101599812507629, -0.7810676693916321, -0.7519752979278564, -0.7228829860687256, -0.6937906742095947, -0.6646983027458191, -0.6356059908866882, -0.6065136194229126, -0.5774213075637817, -0.5483289957046509, -0.5192366242408752, -0.4901443123817444, -0.46105197072029114, -0.4319596290588379, -0.40286731719970703, -0.3737749755382538, -0.34468263387680054, -0.3155902922153473, -0.28649795055389404, -0.2574056386947632, -0.22831329703330994, -0.1992209553718567, -0.17012862861156464, -0.14103630185127258, -0.11194390058517456, -0.08285156637430191, -0.05375923216342926, -0.02466689795255661, 0.00442543625831604, 0.03351777791976929, 0.06261010468006134, 0.0917024314403534, 0.12079477310180664, 0.1498871147632599, 0.17897944152355194, 0.208071768283844, 0.23716410994529724, 0.2662564516067505, 0.29534876346588135, 0.3244411051273346, 0.35353344678878784, 0.3826257884502411, 0.41171813011169434, 0.4408104419708252, 0.46990278363227844, 0.4989951252937317, 0.5280874371528625, 0.5571798086166382, 0.586272120475769, 0.6153644323348999, 0.6444568037986755, 0.6735491156578064, 0.702641487121582, 0.7317337989807129, 0.7608261108398438, 0.7899184226989746, 0.8190107941627502]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 6.0, 12.0, 27.0, 32.0, 32.0, 36.0, 54.0, 101.0, 107.0, 186.0, 271.0, 361.0, 537.0, 790.0, 1211.0, 1682.0, 2235.0, 2804.0, 1029642.0, 2783.0, 2241.0, 1670.0, 1151.0, 813.0, 553.0, 372.0, 239.0, 190.0, 128.0, 98.0, 69.0, 49.0, 32.0, 33.0, 11.0, 15.0, 7.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.102470874786377, -1.0650981664657593, -1.0277254581451416, -0.9903526902198792, -0.9529799818992615, -0.9156072735786438, -0.8782345056533813, -0.8408617973327637, -0.803489089012146, -0.7661163806915283, -0.7287436723709106, -0.6913709044456482, -0.6539981961250305, -0.6166254878044128, -0.5792527198791504, -0.5418800115585327, -0.504507303237915, -0.46713459491729736, -0.4297618567943573, -0.39238911867141724, -0.35501641035079956, -0.3176437020301819, -0.2802709639072418, -0.24289822578430176, -0.20552551746368408, -0.1681527942419052, -0.13078007102012634, -0.09340734779834747, -0.056034624576568604, -0.018661901354789734, 0.018710821866989136, 0.0560835599899292, 0.09345626831054688, 0.13082899153232574, 0.16820171475410461, 0.20557443797588348, 0.24294716119766235, 0.28031986951828003, 0.3176926076412201, 0.35506534576416016, 0.39243805408477783, 0.4298107624053955, 0.46718350052833557, 0.5045562386512756, 0.5419289469718933, 0.579301655292511, 0.6166744232177734, 0.6540471315383911, 0.6914198398590088, 0.7287925481796265, 0.7661652565002441, 0.8035380244255066, 0.8409107327461243, 0.8782834410667419, 0.9156562089920044, 0.9530289173126221, 0.9904016256332397, 1.0277743339538574, 1.065147042274475, 1.1025197505950928, 1.139892578125, 1.1772652864456177, 1.2146379947662354, 1.252010703086853, 1.2893834114074707]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 18.0, 37.0, 35.0, 31.0, 53.0, 83.0, 174.0, 331.0, 750.0, 1650.0, 3636.0, 8640.0, 26235.0, 51376248.0, 32427.0, 11523.0, 5236.0, 2226.0, 1023.0, 457.0, 244.0, 130.0, 55.0, 38.0, 22.0, 18.0, 10.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4312098026275635, -2.3461198806762695, -2.2610301971435547, -2.1759402751922607, -2.090850353240967, -2.005760669708252, -1.920670747756958, -1.8355809450149536, -1.7504911422729492, -1.6654013395309448, -1.5803115367889404, -1.4952216148376465, -1.410131812095642, -1.3250420093536377, -1.2399520874023438, -1.1548622846603394, -1.069772481918335, -0.9846826791763306, -0.8995928168296814, -0.8145029544830322, -0.7294131517410278, -0.6443233489990234, -0.5592334866523743, -0.4741436243057251, -0.3890538215637207, -0.3039639890193939, -0.21887415647506714, -0.13378432393074036, -0.048694491386413574, 0.03639534115791321, 0.12148517370223999, 0.20657503604888916, 0.29166460037231445, 0.37675443291664124, 0.461844265460968, 0.5469341278076172, 0.6320239305496216, 0.717113733291626, 0.8022035956382751, 0.8872934579849243, 0.9723832607269287, 1.057473063468933, 1.1425628662109375, 1.2276527881622314, 1.3127425909042358, 1.3978323936462402, 1.4829223155975342, 1.5680121183395386, 1.653101921081543, 1.7381917238235474, 1.8232815265655518, 1.9083714485168457, 1.99346125125885, 2.0785510540008545, 2.1636409759521484, 2.2487306594848633, 2.3338205814361572, 2.418910503387451, 2.504000186920166, 2.58909010887146, 2.674180030822754, 2.7592697143554688, 2.8443596363067627, 2.9294495582580566, 3.0145392417907715]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 10.0, 10.0, 27.0, 16.0, 47.0, 61.0, 114.0, 177.0, 259.0, 405.0, 635.0, 1043.0, 1717.0, 2746.0, 4578.0, 7771.0, 13473.0, 23609.0, 41709.0, 72761.0, 125100.0, 201762.0, 303046.0, 443251.0, 2658529.0, 1316024.0, 384994.0, 267931.0, 174106.0, 103459.0, 60633.0, 34104.0, 19394.0, 11166.0, 6532.0, 3866.0, 2358.0, 1492.0, 916.0, 582.0, 366.0, 229.0, 168.0, 72.0, 73.0, 37.0, 25.0, 21.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.471923828125, -0.4566230773925781, -0.44132232666015625, -0.4260215759277344, -0.4107208251953125, -0.3954200744628906, -0.38011932373046875, -0.3648185729980469, -0.349517822265625, -0.3342170715332031, -0.31891632080078125, -0.3036155700683594, -0.2883148193359375, -0.2730140686035156, -0.25771331787109375, -0.24241256713867188, -0.22711181640625, -0.21181106567382812, -0.19651031494140625, -0.18120956420898438, -0.1659088134765625, -0.15060806274414062, -0.13530731201171875, -0.12000656127929688, -0.104705810546875, -0.08940505981445312, -0.07410430908203125, -0.058803558349609375, -0.0435028076171875, -0.028202056884765625, -0.01290130615234375, 0.002399444580078125, 0.0177001953125, 0.033000946044921875, 0.04830169677734375, 0.06360244750976562, 0.0789031982421875, 0.09420394897460938, 0.10950469970703125, 0.12480545043945312, 0.140106201171875, 0.15540695190429688, 0.17070770263671875, 0.18600845336914062, 0.2013092041015625, 0.21660995483398438, 0.23191070556640625, 0.24721145629882812, 0.26251220703125, 0.2778129577636719, 0.29311370849609375, 0.3084144592285156, 0.3237152099609375, 0.3390159606933594, 0.35431671142578125, 0.3696174621582031, 0.384918212890625, 0.4002189636230469, 0.41551971435546875, 0.4308204650878906, 0.4461212158203125, 0.4614219665527344, 0.47672271728515625, 0.4920234680175781, 0.50732421875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 6.0, 13.0, 9.0, 12.0, 13.0, 19.0, 28.0, 26.0, 26.0, 27.0, 34.0, 42.0, 36.0, 41.0, 40.0, 56.0, 235.0, 820.0, 82.0, 44.0, 38.0, 43.0, 45.0, 37.0, 27.0, 29.0, 29.0, 28.0, 11.0, 24.0, 15.0, 16.0, 15.0, 6.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.482086181640625, -2.38409423828125, -2.286102294921875, -2.1881103515625, -2.090118408203125, -1.99212646484375, -1.894134521484375, -1.796142578125, -1.698150634765625, -1.60015869140625, -1.502166748046875, -1.4041748046875, -1.306182861328125, -1.20819091796875, -1.110198974609375, -1.01220703125, -0.914215087890625, -0.81622314453125, -0.718231201171875, -0.6202392578125, -0.522247314453125, -0.42425537109375, -0.326263427734375, -0.228271484375, -0.130279541015625, -0.03228759765625, 0.065704345703125, 0.1636962890625, 0.261688232421875, 0.35968017578125, 0.457672119140625, 0.5556640625, 0.653656005859375, 0.75164794921875, 0.849639892578125, 0.9476318359375, 1.045623779296875, 1.14361572265625, 1.241607666015625, 1.339599609375, 1.437591552734375, 1.53558349609375, 1.633575439453125, 1.7315673828125, 1.829559326171875, 1.92755126953125, 2.025543212890625, 2.12353515625, 2.221527099609375, 2.31951904296875, 2.417510986328125, 2.5155029296875, 2.613494873046875, 2.71148681640625, 2.809478759765625, 2.907470703125, 3.005462646484375, 3.10345458984375, 3.201446533203125, 3.2994384765625, 3.397430419921875, 3.49542236328125, 3.593414306640625, 3.69140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 14.0, 17.0, 31.0, 57.0, 124.0, 197.0, 325.0, 507.0, 830.0, 1290.0, 2212.0, 3645.0, 5770.0, 9100.0, 14405.0, 21905.0, 32916.0, 48375.0, 69495.0, 96311.0, 129889.0, 166330.0, 204097.0, 243352.0, 386362.0, 1940707.0, 1571495.0, 332352.0, 236844.0, 198838.0, 160050.0, 123157.0, 91572.0, 66020.0, 45797.0, 31339.0, 20358.0, 13061.0, 8485.0, 5399.0, 3255.0, 2009.0, 1212.0, 789.0, 443.0, 274.0, 160.0, 100.0, 60.0, 47.0, 23.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.2449951171875, -0.2373199462890625, -0.229644775390625, -0.2219696044921875, -0.21429443359375, -0.2066192626953125, -0.198944091796875, -0.1912689208984375, -0.18359375, -0.1759185791015625, -0.168243408203125, -0.1605682373046875, -0.15289306640625, -0.1452178955078125, -0.137542724609375, -0.1298675537109375, -0.1221923828125, -0.1145172119140625, -0.106842041015625, -0.0991668701171875, -0.09149169921875, -0.0838165283203125, -0.076141357421875, -0.0684661865234375, -0.060791015625, -0.0531158447265625, -0.045440673828125, -0.0377655029296875, -0.03009033203125, -0.0224151611328125, -0.014739990234375, -0.0070648193359375, 0.0006103515625, 0.0082855224609375, 0.015960693359375, 0.0236358642578125, 0.03131103515625, 0.0389862060546875, 0.046661376953125, 0.0543365478515625, 0.06201171875, 0.0696868896484375, 0.077362060546875, 0.0850372314453125, 0.09271240234375, 0.1003875732421875, 0.108062744140625, 0.1157379150390625, 0.1234130859375, 0.1310882568359375, 0.138763427734375, 0.1464385986328125, 0.15411376953125, 0.1617889404296875, 0.169464111328125, 0.1771392822265625, 0.184814453125, 0.1924896240234375, 0.200164794921875, 0.2078399658203125, 0.21551513671875, 0.2231903076171875, 0.230865478515625, 0.2385406494140625, 0.2462158203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 8.0, 13.0, 13.0, 25.0, 25.0, 16.0, 34.0, 24.0, 28.0, 23.0, 29.0, 43.0, 34.0, 39.0, 45.0, 79.0, 479.0, 548.0, 62.0, 43.0, 46.0, 46.0, 29.0, 35.0, 30.0, 21.0, 27.0, 18.0, 28.0, 19.0, 8.0, 11.0, 13.0, 13.0, 11.0, 7.0, 3.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8644561767578125, -1.800201416015625, -1.7359466552734375, -1.67169189453125, -1.6074371337890625, -1.543182373046875, -1.4789276123046875, -1.4146728515625, -1.3504180908203125, -1.286163330078125, -1.2219085693359375, -1.15765380859375, -1.0933990478515625, -1.029144287109375, -0.9648895263671875, -0.900634765625, -0.8363800048828125, -0.772125244140625, -0.7078704833984375, -0.64361572265625, -0.5793609619140625, -0.515106201171875, -0.4508514404296875, -0.3865966796875, -0.3223419189453125, -0.258087158203125, -0.1938323974609375, -0.12957763671875, -0.0653228759765625, -0.001068115234375, 0.0631866455078125, 0.12744140625, 0.1916961669921875, 0.255950927734375, 0.3202056884765625, 0.38446044921875, 0.4487152099609375, 0.512969970703125, 0.5772247314453125, 0.6414794921875, 0.7057342529296875, 0.769989013671875, 0.8342437744140625, 0.89849853515625, 0.9627532958984375, 1.027008056640625, 1.0912628173828125, 1.155517578125, 1.2197723388671875, 1.284027099609375, 1.3482818603515625, 1.41253662109375, 1.4767913818359375, 1.541046142578125, 1.6053009033203125, 1.6695556640625, 1.7338104248046875, 1.798065185546875, 1.8623199462890625, 1.92657470703125, 1.9908294677734375, 2.055084228515625, 2.1193389892578125, 2.18359375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 6.0, 12.0, 8.0, 31.0, 36.0, 66.0, 79.0, 116.0, 153.0, 200.0, 305.0, 414.0, 608.0, 901.0, 1426.0, 2448.0, 4925.0, 12407.0, 37849.0, 120746.0, 342806.0, 753404.0, 3981437.0, 622313.0, 270037.0, 90345.0, 28460.0, 9984.0, 4006.0, 2036.0, 1274.0, 819.0, 559.0, 351.0, 255.0, 199.0, 105.0, 87.0, 53.0, 53.0, 38.0, 24.0, 17.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.67529296875, -0.6544342041015625, -0.633575439453125, -0.6127166748046875, -0.59185791015625, -0.5709991455078125, -0.550140380859375, -0.5292816162109375, -0.5084228515625, -0.4875640869140625, -0.466705322265625, -0.4458465576171875, -0.42498779296875, -0.4041290283203125, -0.383270263671875, -0.3624114990234375, -0.341552734375, -0.3206939697265625, -0.299835205078125, -0.2789764404296875, -0.25811767578125, -0.2372589111328125, -0.216400146484375, -0.1955413818359375, -0.1746826171875, -0.1538238525390625, -0.132965087890625, -0.1121063232421875, -0.09124755859375, -0.0703887939453125, -0.049530029296875, -0.0286712646484375, -0.0078125, 0.0130462646484375, 0.033905029296875, 0.0547637939453125, 0.07562255859375, 0.0964813232421875, 0.117340087890625, 0.1381988525390625, 0.1590576171875, 0.1799163818359375, 0.200775146484375, 0.2216339111328125, 0.24249267578125, 0.2633514404296875, 0.284210205078125, 0.3050689697265625, 0.325927734375, 0.3467864990234375, 0.367645263671875, 0.3885040283203125, 0.40936279296875, 0.4302215576171875, 0.451080322265625, 0.4719390869140625, 0.4927978515625, 0.5136566162109375, 0.534515380859375, 0.5553741455078125, 0.57623291015625, 0.5970916748046875, 0.617950439453125, 0.6388092041015625, 0.65966796875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 6.0, 11.0, 14.0, 16.0, 14.0, 18.0, 29.0, 35.0, 35.0, 25.0, 32.0, 46.0, 29.0, 40.0, 46.0, 83.0, 561.0, 495.0, 60.0, 47.0, 29.0, 29.0, 35.0, 42.0, 31.0, 35.0, 31.0, 19.0, 22.0, 17.0, 13.0, 9.0, 9.0, 12.0, 7.0, 6.0, 2.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.6647491455078125, -1.612701416015625, -1.5606536865234375, -1.50860595703125, -1.4565582275390625, -1.404510498046875, -1.3524627685546875, -1.3004150390625, -1.2483673095703125, -1.196319580078125, -1.1442718505859375, -1.09222412109375, -1.0401763916015625, -0.988128662109375, -0.9360809326171875, -0.884033203125, -0.8319854736328125, -0.779937744140625, -0.7278900146484375, -0.67584228515625, -0.6237945556640625, -0.571746826171875, -0.5196990966796875, -0.4676513671875, -0.4156036376953125, -0.363555908203125, -0.3115081787109375, -0.25946044921875, -0.2074127197265625, -0.155364990234375, -0.1033172607421875, -0.05126953125, 0.0007781982421875, 0.052825927734375, 0.1048736572265625, 0.15692138671875, 0.2089691162109375, 0.261016845703125, 0.3130645751953125, 0.3651123046875, 0.4171600341796875, 0.469207763671875, 0.5212554931640625, 0.57330322265625, 0.6253509521484375, 0.677398681640625, 0.7294464111328125, 0.781494140625, 0.8335418701171875, 0.885589599609375, 0.9376373291015625, 0.98968505859375, 1.0417327880859375, 1.093780517578125, 1.1458282470703125, 1.1978759765625, 1.2499237060546875, 1.301971435546875, 1.3540191650390625, 1.40606689453125, 1.4581146240234375, 1.510162353515625, 1.5622100830078125, 1.6142578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 10.0, 49.0, 268.0, 488.0, 157.0, 28.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.158155918121338, -3.7573583126068115, -3.356560468673706, -2.9557628631591797, -2.554965019226074, -2.154167413711548, -1.7533698081970215, -1.352571964263916, -0.9517743587493896, -0.5509766340255737, -0.1501789689064026, 0.25061869621276855, 0.6514164209365845, 1.0522141456604004, 1.4530117511749268, 1.8538095951080322, 2.2546072006225586, 2.655404806137085, 3.0562026500701904, 3.457000255584717, 3.8577980995178223, 4.2585954666137695, 4.659393310546875, 5.0601911544799805, 5.460988998413086, 5.861786842346191, 6.262584209442139, 6.663382053375244, 7.06417989730835, 7.464977264404297, 7.865775108337402, 8.266572952270508, 8.667370796203613, 9.068168640136719, 9.468966484069824, 9.86976432800293, 10.270561218261719, 10.671359062194824, 11.07215690612793, 11.472954750061035, 11.87375259399414, 12.274550437927246, 12.675348281860352, 13.07614517211914, 13.476943016052246, 13.877740859985352, 14.278538703918457, 14.679336547851562, 15.080133438110352, 15.480931282043457, 15.881729125976562, 16.28252601623535, 16.683324813842773, 17.084121704101562, 17.484920501708984, 17.885717391967773, 18.286516189575195, 18.687313079833984, 19.088111877441406, 19.488908767700195, 19.889707565307617, 20.290504455566406, 20.691303253173828, 21.092100143432617, 21.492897033691406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 12.0, 5.0, 10.0, 8.0, 12.0, 24.0, 23.0, 28.0, 29.0, 34.0, 30.0, 31.0, 33.0, 38.0, 27.0, 35.0, 48.0, 30.0, 41.0, 50.0, 36.0, 30.0, 30.0, 29.0, 39.0, 28.0, 29.0, 30.0, 23.0, 24.0, 19.0, 15.0, 17.0, 12.0, 15.0, 7.0, 13.0, 4.0, 7.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.381347894668579, -2.302940845489502, -2.224534034729004, -2.146127223968506, -2.0677201747894287, -1.9893132448196411, -1.9109063148498535, -1.832499384880066, -1.7540924549102783, -1.6756855249404907, -1.5972785949707031, -1.5188716650009155, -1.440464735031128, -1.3620578050613403, -1.2836508750915527, -1.2052439451217651, -1.1268370151519775, -1.04843008518219, -0.9700231552124023, -0.8916162252426147, -0.8132092952728271, -0.7348023653030396, -0.656395435333252, -0.5779885053634644, -0.49958157539367676, -0.42117464542388916, -0.34276771545410156, -0.26436078548431396, -0.18595385551452637, -0.10754692554473877, -0.029139995574951172, 0.049266934394836426, 0.12767410278320312, 0.20608103275299072, 0.2844879627227783, 0.3628948926925659, 0.4413018226623535, 0.5197087526321411, 0.5981156826019287, 0.6765226125717163, 0.7549295425415039, 0.8333364725112915, 0.9117434024810791, 0.9901503324508667, 1.0685572624206543, 1.146964192390442, 1.2253711223602295, 1.303778052330017, 1.3821849822998047, 1.4605919122695923, 1.5389988422393799, 1.6174057722091675, 1.695812702178955, 1.7742196321487427, 1.8526265621185303, 1.9310334920883179, 2.0094404220581055, 2.0878472328186035, 2.1662542819976807, 2.244661331176758, 2.323068141937256, 2.401474952697754, 2.479882001876831, 2.558289051055908, 2.6366958618164062]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 11.0, 16.0, 17.0, 45.0, 54.0, 87.0, 135.0, 284.0, 512.0, 1022.0, 2208.0, 4768.0, 11201.0, 29802.0, 122478.0, 1739321.0, 2061914.0, 164351.0, 33323.0, 12494.0, 5451.0, 2473.0, 1069.0, 532.0, 270.0, 164.0, 93.0, 43.0, 34.0, 21.0, 14.0, 15.0, 7.0, 6.0, 10.0, 3.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.12022686004638672, -0.11679649353027344, -0.11336612701416016, -0.10993576049804688, -0.1065053939819336, -0.10307502746582031, -0.09964466094970703, -0.09621429443359375, -0.09278392791748047, -0.08935356140136719, -0.0859231948852539, -0.08249282836914062, -0.07906246185302734, -0.07563209533691406, -0.07220172882080078, -0.0687713623046875, -0.06534099578857422, -0.06191062927246094, -0.058480262756347656, -0.055049896240234375, -0.051619529724121094, -0.04818916320800781, -0.04475879669189453, -0.04132843017578125, -0.03789806365966797, -0.03446769714355469, -0.031037330627441406, -0.027606964111328125, -0.024176597595214844, -0.020746231079101562, -0.01731586456298828, -0.013885498046875, -0.010455131530761719, -0.0070247650146484375, -0.0035943984985351562, -0.000164031982421875, 0.0032663345336914062, 0.0066967010498046875, 0.010127067565917969, 0.01355743408203125, 0.01698780059814453, 0.020418167114257812, 0.023848533630371094, 0.027278900146484375, 0.030709266662597656, 0.03413963317871094, 0.03756999969482422, 0.0410003662109375, 0.04443073272705078, 0.04786109924316406, 0.051291465759277344, 0.054721832275390625, 0.058152198791503906, 0.06158256530761719, 0.06501293182373047, 0.06844329833984375, 0.07187366485595703, 0.07530403137207031, 0.0787343978881836, 0.08216476440429688, 0.08559513092041016, 0.08902549743652344, 0.09245586395263672, 0.09588623046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 6.0, 8.0, 11.0, 16.0, 21.0, 10.0, 22.0, 25.0, 33.0, 47.0, 36.0, 49.0, 46.0, 64.0, 44.0, 54.0, 60.0, 47.0, 53.0, 50.0, 42.0, 38.0, 27.0, 26.0, 32.0, 26.0, 17.0, 21.0, 8.0, 10.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04217529296875, -0.04074430465698242, -0.039313316345214844, -0.037882328033447266, -0.03645133972167969, -0.03502035140991211, -0.03358936309814453, -0.03215837478637695, -0.030727386474609375, -0.029296398162841797, -0.02786540985107422, -0.02643442153930664, -0.025003433227539062, -0.023572444915771484, -0.022141456604003906, -0.020710468292236328, -0.01927947998046875, -0.017848491668701172, -0.016417503356933594, -0.014986515045166016, -0.013555526733398438, -0.01212453842163086, -0.010693550109863281, -0.009262561798095703, -0.007831573486328125, -0.006400585174560547, -0.004969596862792969, -0.0035386085510253906, -0.0021076202392578125, -0.0006766319274902344, 0.0007543563842773438, 0.002185344696044922, 0.0036163330078125, 0.005047321319580078, 0.006478309631347656, 0.007909297943115234, 0.009340286254882812, 0.01077127456665039, 0.012202262878417969, 0.013633251190185547, 0.015064239501953125, 0.016495227813720703, 0.01792621612548828, 0.01935720443725586, 0.020788192749023438, 0.022219181060791016, 0.023650169372558594, 0.025081157684326172, 0.02651214599609375, 0.027943134307861328, 0.029374122619628906, 0.030805110931396484, 0.03223609924316406, 0.03366708755493164, 0.03509807586669922, 0.0365290641784668, 0.037960052490234375, 0.03939104080200195, 0.04082202911376953, 0.04225301742553711, 0.04368400573730469, 0.045114994049072266, 0.046545982360839844, 0.04797697067260742, 0.049407958984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 3.0, 7.0, 8.0, 5.0, 9.0, 13.0, 18.0, 25.0, 31.0, 50.0, 67.0, 177.0, 588.0, 3074.0, 30865.0, 1265365.0, 2818255.0, 69248.0, 5159.0, 820.0, 253.0, 85.0, 41.0, 27.0, 21.0, 19.0, 4.0, 10.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.154296875, -0.15014171600341797, -0.14598655700683594, -0.1418313980102539, -0.13767623901367188, -0.13352108001708984, -0.1293659210205078, -0.12521076202392578, -0.12105560302734375, -0.11690044403076172, -0.11274528503417969, -0.10859012603759766, -0.10443496704101562, -0.1002798080444336, -0.09612464904785156, -0.09196949005126953, -0.0878143310546875, -0.08365917205810547, -0.07950401306152344, -0.0753488540649414, -0.07119369506835938, -0.06703853607177734, -0.06288337707519531, -0.05872821807861328, -0.05457305908203125, -0.05041790008544922, -0.04626274108886719, -0.042107582092285156, -0.037952423095703125, -0.033797264099121094, -0.029642105102539062, -0.02548694610595703, -0.021331787109375, -0.01717662811279297, -0.013021469116210938, -0.008866310119628906, -0.004711151123046875, -0.0005559921264648438, 0.0035991668701171875, 0.007754325866699219, 0.01190948486328125, 0.01606464385986328, 0.020219802856445312, 0.024374961853027344, 0.028530120849609375, 0.032685279846191406, 0.03684043884277344, 0.04099559783935547, 0.0451507568359375, 0.04930591583251953, 0.05346107482910156, 0.057616233825683594, 0.061771392822265625, 0.06592655181884766, 0.07008171081542969, 0.07423686981201172, 0.07839202880859375, 0.08254718780517578, 0.08670234680175781, 0.09085750579833984, 0.09501266479492188, 0.0991678237915039, 0.10332298278808594, 0.10747814178466797, 0.11163330078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 13.0, 12.0, 19.0, 15.0, 36.0, 42.0, 65.0, 82.0, 124.0, 164.0, 259.0, 356.0, 470.0, 516.0, 518.0, 381.0, 286.0, 208.0, 124.0, 93.0, 72.0, 61.0, 28.0, 19.0, 17.0, 12.0, 12.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.048919677734375, -0.04736757278442383, -0.045815467834472656, -0.044263362884521484, -0.04271125793457031, -0.04115915298461914, -0.03960704803466797, -0.0380549430847168, -0.036502838134765625, -0.03495073318481445, -0.03339862823486328, -0.03184652328491211, -0.030294418334960938, -0.028742313385009766, -0.027190208435058594, -0.025638103485107422, -0.02408599853515625, -0.022533893585205078, -0.020981788635253906, -0.019429683685302734, -0.017877578735351562, -0.01632547378540039, -0.014773368835449219, -0.013221263885498047, -0.011669158935546875, -0.010117053985595703, -0.008564949035644531, -0.007012844085693359, -0.0054607391357421875, -0.003908634185791016, -0.0023565292358398438, -0.0008044242858886719, 0.0007476806640625, 0.002299785614013672, 0.0038518905639648438, 0.005403995513916016, 0.0069561004638671875, 0.00850820541381836, 0.010060310363769531, 0.011612415313720703, 0.013164520263671875, 0.014716625213623047, 0.01626873016357422, 0.01782083511352539, 0.019372940063476562, 0.020925045013427734, 0.022477149963378906, 0.024029254913330078, 0.02558135986328125, 0.027133464813232422, 0.028685569763183594, 0.030237674713134766, 0.03178977966308594, 0.03334188461303711, 0.03489398956298828, 0.03644609451293945, 0.037998199462890625, 0.0395503044128418, 0.04110240936279297, 0.04265451431274414, 0.04420661926269531, 0.045758724212646484, 0.047310829162597656, 0.04886293411254883, 0.0504150390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 9.0, 103.0, 584.0, 289.0, 23.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17688630521297455, -0.13938170671463013, -0.1018771082162857, -0.06437250971794128, -0.026867911219596863, 0.010636687278747559, 0.04814128577709198, 0.08564586937427521, 0.12315048277378082, 0.16065508127212524, 0.19815967977046967, 0.2356642782688141, 0.2731688618659973, 0.31067347526550293, 0.34817808866500854, 0.3856826424598694, 0.423187255859375, 0.4606918692588806, 0.49819645285606384, 0.5357010364532471, 0.5732056498527527, 0.6107102632522583, 0.6482148170471191, 0.6857194304466248, 0.7232240438461304, 0.760728657245636, 0.7982332706451416, 0.8357378244400024, 0.8732424378395081, 0.9107470512390137, 0.9482516050338745, 0.9857562184333801, 1.0232608318328857, 1.0607653856277466, 1.098270058631897, 1.1357746124267578, 1.1732792854309082, 1.210783839225769, 1.2482883930206299, 1.2857930660247803, 1.3232976198196411, 1.360802173614502, 1.3983068466186523, 1.4358114004135132, 1.473315954208374, 1.5108206272125244, 1.5483251810073853, 1.585829734802246, 1.6233344078063965, 1.6608389616012573, 1.6983436346054077, 1.7358481884002686, 1.773352861404419, 1.8108574151992798, 1.8483619689941406, 1.885866641998291, 1.9233711957931519, 1.9608757495880127, 1.998380422592163, 2.0358850955963135, 2.0733895301818848, 2.110894203186035, 2.1483988761901855, 2.185903310775757, 2.2234079837799072]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 7.0, 10.0, 11.0, 23.0, 30.0, 25.0, 26.0, 34.0, 54.0, 43.0, 47.0, 52.0, 51.0, 47.0, 50.0, 60.0, 52.0, 52.0, 57.0, 37.0, 36.0, 31.0, 22.0, 23.0, 24.0, 22.0, 13.0, 10.0, 8.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18044090270996094, -0.17483706772327423, -0.16923323273658752, -0.16362939774990082, -0.1580255627632141, -0.1524217128753662, -0.1468178778886795, -0.1412140429019928, -0.1356102079153061, -0.13000637292861938, -0.12440253794193268, -0.11879869550466537, -0.11319486051797867, -0.10759102553129196, -0.10198718309402466, -0.09638334810733795, -0.09077951312065125, -0.08517567813396454, -0.07957184314727783, -0.07396800071001053, -0.06836416572332382, -0.06276033073663712, -0.05715649202466011, -0.051552653312683105, -0.0459488183259964, -0.04034498333930969, -0.03474114462733269, -0.02913730777800083, -0.023533470928668976, -0.01792963407933712, -0.012325797230005264, -0.006721958518028259, -0.0011181235313415527, 0.004485713317990303, 0.010089550167322159, 0.015693387016654015, 0.02129722386598587, 0.026901060715317726, 0.03250489756464958, 0.03810873627662659, 0.04371257126331329, 0.04931640625, 0.054920244961977005, 0.06052408367395401, 0.06612791866064072, 0.07173175364732742, 0.07733559608459473, 0.08293943107128143, 0.08854326605796814, 0.09414710104465485, 0.09975093603134155, 0.10535477846860886, 0.11095861345529556, 0.11656244844198227, 0.12216629087924957, 0.12777012586593628, 0.13337396085262299, 0.1389777958393097, 0.1445816308259964, 0.1501854658126831, 0.155789315700531, 0.1613931506872177, 0.16699698567390442, 0.17260082066059113, 0.17820465564727783]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 16.0, 19.0, 23.0, 44.0, 45.0, 60.0, 83.0, 122.0, 195.0, 297.0, 454.0, 656.0, 1090.0, 1957.0, 3563.0, 7942.0, 22141.0, 95390.0, 475330.0, 345522.0, 63344.0, 16469.0, 6324.0, 2996.0, 1648.0, 998.0, 563.0, 377.0, 235.0, 178.0, 114.0, 100.0, 49.0, 52.0, 25.0, 28.0, 13.0, 11.0, 11.0, 9.0, 7.0, 4.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.09619140625, -0.09307575225830078, -0.08996009826660156, -0.08684444427490234, -0.08372879028320312, -0.0806131362915039, -0.07749748229980469, -0.07438182830810547, -0.07126617431640625, -0.06815052032470703, -0.06503486633300781, -0.061919212341308594, -0.058803558349609375, -0.055687904357910156, -0.05257225036621094, -0.04945659637451172, -0.0463409423828125, -0.04322528839111328, -0.04010963439941406, -0.036993980407714844, -0.033878326416015625, -0.030762672424316406, -0.027647018432617188, -0.02453136444091797, -0.02141571044921875, -0.01830005645751953, -0.015184402465820312, -0.012068748474121094, -0.008953094482421875, -0.005837440490722656, -0.0027217864990234375, 0.00039386749267578125, 0.003509521484375, 0.006625175476074219, 0.009740829467773438, 0.012856483459472656, 0.015972137451171875, 0.019087791442871094, 0.022203445434570312, 0.02531909942626953, 0.02843475341796875, 0.03155040740966797, 0.03466606140136719, 0.037781715393066406, 0.040897369384765625, 0.044013023376464844, 0.04712867736816406, 0.05024433135986328, 0.0533599853515625, 0.05647563934326172, 0.05959129333496094, 0.06270694732666016, 0.06582260131835938, 0.0689382553100586, 0.07205390930175781, 0.07516956329345703, 0.07828521728515625, 0.08140087127685547, 0.08451652526855469, 0.0876321792602539, 0.09074783325195312, 0.09386348724365234, 0.09697914123535156, 0.10009479522705078, 0.10321044921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 8.0, 11.0, 19.0, 16.0, 16.0, 29.0, 35.0, 42.0, 42.0, 58.0, 63.0, 58.0, 49.0, 75.0, 55.0, 74.0, 50.0, 60.0, 38.0, 32.0, 30.0, 30.0, 27.0, 12.0, 13.0, 14.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045684814453125, -0.04401063919067383, -0.042336463928222656, -0.040662288665771484, -0.03898811340332031, -0.03731393814086914, -0.03563976287841797, -0.0339655876159668, -0.032291412353515625, -0.030617237091064453, -0.02894306182861328, -0.02726888656616211, -0.025594711303710938, -0.023920536041259766, -0.022246360778808594, -0.020572185516357422, -0.01889801025390625, -0.017223834991455078, -0.015549659729003906, -0.013875484466552734, -0.012201309204101562, -0.01052713394165039, -0.008852958679199219, -0.007178783416748047, -0.005504608154296875, -0.003830432891845703, -0.0021562576293945312, -0.0004820823669433594, 0.0011920928955078125, 0.0028662681579589844, 0.004540443420410156, 0.006214618682861328, 0.0078887939453125, 0.009562969207763672, 0.011237144470214844, 0.012911319732666016, 0.014585494995117188, 0.01625967025756836, 0.01793384552001953, 0.019608020782470703, 0.021282196044921875, 0.022956371307373047, 0.02463054656982422, 0.02630472183227539, 0.027978897094726562, 0.029653072357177734, 0.031327247619628906, 0.03300142288208008, 0.03467559814453125, 0.03634977340698242, 0.038023948669433594, 0.039698123931884766, 0.04137229919433594, 0.04304647445678711, 0.04472064971923828, 0.04639482498168945, 0.048069000244140625, 0.0497431755065918, 0.05141735076904297, 0.05309152603149414, 0.05476570129394531, 0.056439876556396484, 0.058114051818847656, 0.05978822708129883, 0.06146240234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 4.0, 7.0, 8.0, 10.0, 13.0, 21.0, 32.0, 28.0, 72.0, 111.0, 230.0, 514.0, 1075.0, 2683.0, 7195.0, 19758.0, 56288.0, 148455.0, 294363.0, 290025.0, 143298.0, 53343.0, 19305.0, 6906.0, 2635.0, 1114.0, 517.0, 218.0, 131.0, 76.0, 34.0, 24.0, 17.0, 10.0, 11.0, 7.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.054962158203125, -0.05329561233520508, -0.051629066467285156, -0.049962520599365234, -0.04829597473144531, -0.04662942886352539, -0.04496288299560547, -0.04329633712768555, -0.041629791259765625, -0.0399632453918457, -0.03829669952392578, -0.03663015365600586, -0.03496360778808594, -0.033297061920166016, -0.031630516052246094, -0.029963970184326172, -0.02829742431640625, -0.026630878448486328, -0.024964332580566406, -0.023297786712646484, -0.021631240844726562, -0.01996469497680664, -0.01829814910888672, -0.016631603240966797, -0.014965057373046875, -0.013298511505126953, -0.011631965637207031, -0.00996541976928711, -0.008298873901367188, -0.006632328033447266, -0.004965782165527344, -0.003299236297607422, -0.0016326904296875, 3.3855438232421875e-05, 0.0017004013061523438, 0.0033669471740722656, 0.0050334930419921875, 0.006700038909912109, 0.008366584777832031, 0.010033130645751953, 0.011699676513671875, 0.013366222381591797, 0.015032768249511719, 0.01669931411743164, 0.018365859985351562, 0.020032405853271484, 0.021698951721191406, 0.023365497589111328, 0.02503204345703125, 0.026698589324951172, 0.028365135192871094, 0.030031681060791016, 0.03169822692871094, 0.03336477279663086, 0.03503131866455078, 0.0366978645324707, 0.038364410400390625, 0.04003095626831055, 0.04169750213623047, 0.04336404800415039, 0.04503059387207031, 0.046697139739990234, 0.048363685607910156, 0.05003023147583008, 0.05169677734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 15.0, 8.0, 8.0, 18.0, 15.0, 14.0, 34.0, 22.0, 20.0, 28.0, 36.0, 39.0, 41.0, 42.0, 43.0, 52.0, 39.0, 45.0, 48.0, 39.0, 47.0, 29.0, 41.0, 32.0, 29.0, 31.0, 23.0, 23.0, 28.0, 18.0, 14.0, 13.0, 13.0, 5.0, 14.0, 6.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09053516387939453, -0.08719825744628906, -0.0838613510131836, -0.08052444458007812, -0.07718753814697266, -0.07385063171386719, -0.07051372528076172, -0.06717681884765625, -0.06383991241455078, -0.06050300598144531, -0.057166099548339844, -0.053829193115234375, -0.050492286682128906, -0.04715538024902344, -0.04381847381591797, -0.0404815673828125, -0.03714466094970703, -0.03380775451660156, -0.030470848083496094, -0.027133941650390625, -0.023797035217285156, -0.020460128784179688, -0.01712322235107422, -0.01378631591796875, -0.010449409484863281, -0.0071125030517578125, -0.0037755966186523438, -0.000438690185546875, 0.0028982162475585938, 0.0062351226806640625, 0.009572029113769531, 0.012908935546875, 0.01624584197998047, 0.019582748413085938, 0.022919654846191406, 0.026256561279296875, 0.029593467712402344, 0.03293037414550781, 0.03626728057861328, 0.03960418701171875, 0.04294109344482422, 0.04627799987792969, 0.049614906311035156, 0.052951812744140625, 0.056288719177246094, 0.05962562561035156, 0.06296253204345703, 0.0662994384765625, 0.06963634490966797, 0.07297325134277344, 0.0763101577758789, 0.07964706420898438, 0.08298397064208984, 0.08632087707519531, 0.08965778350830078, 0.09299468994140625, 0.09633159637451172, 0.09966850280761719, 0.10300540924072266, 0.10634231567382812, 0.1096792221069336, 0.11301612854003906, 0.11635303497314453, 0.11968994140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 16.0, 17.0, 41.0, 57.0, 97.0, 184.0, 642.0, 4212.0, 137676.0, 881934.0, 21257.0, 1707.0, 356.0, 144.0, 89.0, 52.0, 29.0, 15.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09738636016845703, -0.09436988830566406, -0.0913534164428711, -0.08833694458007812, -0.08532047271728516, -0.08230400085449219, -0.07928752899169922, -0.07627105712890625, -0.07325458526611328, -0.07023811340332031, -0.06722164154052734, -0.06420516967773438, -0.061188697814941406, -0.05817222595214844, -0.05515575408935547, -0.0521392822265625, -0.04912281036376953, -0.04610633850097656, -0.043089866638183594, -0.040073394775390625, -0.037056922912597656, -0.03404045104980469, -0.03102397918701172, -0.02800750732421875, -0.02499103546142578, -0.021974563598632812, -0.018958091735839844, -0.015941619873046875, -0.012925148010253906, -0.009908676147460938, -0.006892204284667969, -0.003875732421875, -0.0008592605590820312, 0.0021572113037109375, 0.005173683166503906, 0.008190155029296875, 0.011206626892089844, 0.014223098754882812, 0.01723957061767578, 0.02025604248046875, 0.02327251434326172, 0.026288986206054688, 0.029305458068847656, 0.032321929931640625, 0.035338401794433594, 0.03835487365722656, 0.04137134552001953, 0.0443878173828125, 0.04740428924560547, 0.05042076110839844, 0.053437232971191406, 0.056453704833984375, 0.059470176696777344, 0.06248664855957031, 0.06550312042236328, 0.06851959228515625, 0.07153606414794922, 0.07455253601074219, 0.07756900787353516, 0.08058547973632812, 0.0836019515991211, 0.08661842346191406, 0.08963489532470703, 0.0926513671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 12.0, 7.0, 13.0, 25.0, 29.0, 45.0, 47.0, 61.0, 66.0, 76.0, 83.0, 67.0, 79.0, 74.0, 56.0, 45.0, 49.0, 36.0, 26.0, 29.0, 17.0, 17.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.225440979003906e-06, -7.935799658298492e-06, -7.646158337593079e-06, -7.356517016887665e-06, -7.066875696182251e-06, -6.777234375476837e-06, -6.487593054771423e-06, -6.1979517340660095e-06, -5.908310413360596e-06, -5.618669092655182e-06, -5.329027771949768e-06, -5.039386451244354e-06, -4.7497451305389404e-06, -4.460103809833527e-06, -4.170462489128113e-06, -3.880821168422699e-06, -3.591179847717285e-06, -3.3015385270118713e-06, -3.0118972063064575e-06, -2.7222558856010437e-06, -2.43261456489563e-06, -2.142973244190216e-06, -1.8533319234848022e-06, -1.5636906027793884e-06, -1.2740492820739746e-06, -9.844079613685608e-07, -6.94766640663147e-07, -4.0512531995773315e-07, -1.1548399925231934e-07, 1.7415732145309448e-07, 4.637986421585083e-07, 7.534399628639221e-07, 1.043081283569336e-06, 1.3327226042747498e-06, 1.6223639249801636e-06, 1.9120052456855774e-06, 2.201646566390991e-06, 2.491287887096405e-06, 2.780929207801819e-06, 3.0705705285072327e-06, 3.3602118492126465e-06, 3.6498531699180603e-06, 3.939494490623474e-06, 4.229135811328888e-06, 4.518777132034302e-06, 4.8084184527397156e-06, 5.098059773445129e-06, 5.387701094150543e-06, 5.677342414855957e-06, 5.966983735561371e-06, 6.256625056266785e-06, 6.5462663769721985e-06, 6.835907697677612e-06, 7.125549018383026e-06, 7.41519033908844e-06, 7.704831659793854e-06, 7.994472980499268e-06, 8.284114301204681e-06, 8.573755621910095e-06, 8.863396942615509e-06, 9.153038263320923e-06, 9.442679584026337e-06, 9.73232090473175e-06, 1.0021962225437164e-05, 1.0311603546142578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 12.0, 17.0, 24.0, 35.0, 41.0, 69.0, 160.0, 243.0, 440.0, 783.0, 1443.0, 3369.0, 9552.0, 37552.0, 201600.0, 553671.0, 188860.0, 35200.0, 9062.0, 3173.0, 1440.0, 752.0, 413.0, 260.0, 135.0, 79.0, 51.0, 38.0, 24.0, 14.0, 6.0, 10.0, 1.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034881591796875, -0.0337371826171875, -0.0325927734375, -0.0314483642578125, -0.030303955078125, -0.0291595458984375, -0.02801513671875, -0.0268707275390625, -0.025726318359375, -0.0245819091796875, -0.0234375, -0.0222930908203125, -0.021148681640625, -0.0200042724609375, -0.01885986328125, -0.0177154541015625, -0.016571044921875, -0.0154266357421875, -0.0142822265625, -0.0131378173828125, -0.011993408203125, -0.0108489990234375, -0.00970458984375, -0.0085601806640625, -0.007415771484375, -0.0062713623046875, -0.005126953125, -0.0039825439453125, -0.002838134765625, -0.0016937255859375, -0.00054931640625, 0.0005950927734375, 0.001739501953125, 0.0028839111328125, 0.0040283203125, 0.0051727294921875, 0.006317138671875, 0.0074615478515625, 0.00860595703125, 0.0097503662109375, 0.010894775390625, 0.0120391845703125, 0.01318359375, 0.0143280029296875, 0.015472412109375, 0.0166168212890625, 0.01776123046875, 0.0189056396484375, 0.020050048828125, 0.0211944580078125, 0.0223388671875, 0.0234832763671875, 0.024627685546875, 0.0257720947265625, 0.02691650390625, 0.0280609130859375, 0.029205322265625, 0.0303497314453125, 0.031494140625, 0.0326385498046875, 0.033782958984375, 0.0349273681640625, 0.03607177734375, 0.0372161865234375, 0.038360595703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 10.0, 5.0, 15.0, 13.0, 23.0, 42.0, 50.0, 95.0, 124.0, 163.0, 145.0, 110.0, 76.0, 42.0, 27.0, 24.0, 10.0, 5.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06121826171875, -0.05950212478637695, -0.057785987854003906, -0.05606985092163086, -0.05435371398925781, -0.052637577056884766, -0.05092144012451172, -0.04920530319213867, -0.047489166259765625, -0.04577302932739258, -0.04405689239501953, -0.042340755462646484, -0.04062461853027344, -0.03890848159790039, -0.037192344665527344, -0.0354762077331543, -0.03376007080078125, -0.0320439338684082, -0.030327796936035156, -0.02861166000366211, -0.026895523071289062, -0.025179386138916016, -0.02346324920654297, -0.021747112274169922, -0.020030975341796875, -0.018314838409423828, -0.01659870147705078, -0.014882564544677734, -0.013166427612304688, -0.01145029067993164, -0.009734153747558594, -0.008018016815185547, -0.0063018798828125, -0.004585742950439453, -0.0028696060180664062, -0.0011534690856933594, 0.0005626678466796875, 0.0022788047790527344, 0.003994941711425781, 0.005711078643798828, 0.007427215576171875, 0.009143352508544922, 0.010859489440917969, 0.012575626373291016, 0.014291763305664062, 0.01600790023803711, 0.017724037170410156, 0.019440174102783203, 0.02115631103515625, 0.022872447967529297, 0.024588584899902344, 0.02630472183227539, 0.028020858764648438, 0.029736995697021484, 0.03145313262939453, 0.03316926956176758, 0.034885406494140625, 0.03660154342651367, 0.03831768035888672, 0.040033817291259766, 0.04174995422363281, 0.04346609115600586, 0.045182228088378906, 0.04689836502075195, 0.048614501953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 23.0, 36.0, 47.0, 70.0, 82.0, 103.0, 124.0, 128.0, 113.0, 78.0, 58.0, 33.0, 30.0, 20.0, 10.0, 11.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5258496999740601, -0.5134339928627014, -0.5010183453559875, -0.4886026382446289, -0.47618696093559265, -0.4637712836265564, -0.45135560631752014, -0.4389399290084839, -0.42652422189712524, -0.414108544588089, -0.40169286727905273, -0.3892771601676941, -0.37686148285865784, -0.3644458055496216, -0.3520301282405853, -0.3396144509315491, -0.3271987736225128, -0.31478309631347656, -0.3023674190044403, -0.28995174169540405, -0.2775360345840454, -0.26512035727500916, -0.2527046799659729, -0.24028900265693665, -0.2278733104467392, -0.21545763313770294, -0.2030419409275055, -0.19062626361846924, -0.17821058630943298, -0.16579489409923553, -0.15337921679019928, -0.14096352458000183, -0.12854784727096558, -0.11613216251134872, -0.10371647775173187, -0.09130080044269562, -0.07888511568307877, -0.06646943092346191, -0.05405375361442566, -0.04163806885480881, -0.029222384095191956, -0.016806701198220253, -0.00439101830124855, 0.008024662733078003, 0.020440347492694855, 0.03285603225231171, 0.04527170956134796, 0.05768739432096481, 0.07010307908058167, 0.08251876384019852, 0.09493444859981537, 0.10735012590885162, 0.11976581066846848, 0.13218149542808533, 0.14459717273712158, 0.15701285004615784, 0.16942854225635529, 0.18184421956539154, 0.194259911775589, 0.20667558908462524, 0.2190912663936615, 0.23150695860385895, 0.2439226359128952, 0.25633832812309265, 0.2687540054321289]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 8.0, 20.0, 15.0, 20.0, 25.0, 22.0, 34.0, 33.0, 34.0, 40.0, 45.0, 34.0, 41.0, 49.0, 55.0, 41.0, 56.0, 45.0, 42.0, 33.0, 45.0, 29.0, 35.0, 25.0, 26.0, 22.0, 17.0, 11.0, 15.0, 9.0, 10.0, 9.0, 6.0, 8.0, 2.0, 1.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6307061314582825, -0.6127724051475525, -0.5948386192321777, -0.5769048929214478, -0.5589711666107178, -0.541037380695343, -0.523103654384613, -0.5051698684692383, -0.4872361421585083, -0.46930238604545593, -0.45136862993240356, -0.4334349036216736, -0.4155011475086212, -0.39756739139556885, -0.37963366508483887, -0.3616999089717865, -0.34376615285873413, -0.32583239674568176, -0.3078986406326294, -0.2899649143218994, -0.27203115820884705, -0.2540974020957947, -0.2361636608839035, -0.21822991967201233, -0.20029616355895996, -0.1823624074459076, -0.16442866623401642, -0.14649492502212524, -0.12856116890907288, -0.1106274202466011, -0.09269367158412933, -0.07475993037223816, -0.056826114654541016, -0.038892365992069244, -0.020958617329597473, -0.003024868667125702, 0.01490887999534607, 0.03284262865781784, 0.05077637732028961, 0.06871011853218079, 0.08664387464523315, 0.10457762330770493, 0.1225113719701767, 0.14044511318206787, 0.15837886929512024, 0.1763126254081726, 0.19424636662006378, 0.21218010783195496, 0.23011386394500732, 0.2480476200580597, 0.26598137617111206, 0.28391510248184204, 0.3018488585948944, 0.3197826147079468, 0.33771634101867676, 0.3556500971317291, 0.3735838532447815, 0.39151760935783386, 0.40945136547088623, 0.4273850917816162, 0.4453188478946686, 0.46325260400772095, 0.4811863303184509, 0.4991200864315033, 0.5170538425445557]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 6.0, 6.0, 10.0, 10.0, 13.0, 8.0, 30.0, 41.0, 61.0, 94.0, 157.0, 326.0, 741.0, 2133.0, 8663.0, 68068.0, 3184723.0, 890319.0, 31575.0, 4998.0, 1260.0, 471.0, 210.0, 102.0, 62.0, 52.0, 31.0, 20.0, 18.0, 16.0, 7.0, 13.0, 2.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.302001953125, -0.2944221496582031, -0.28684234619140625, -0.2792625427246094, -0.2716827392578125, -0.2641029357910156, -0.25652313232421875, -0.24894332885742188, -0.241363525390625, -0.23378372192382812, -0.22620391845703125, -0.21862411499023438, -0.2110443115234375, -0.20346450805664062, -0.19588470458984375, -0.18830490112304688, -0.18072509765625, -0.17314529418945312, -0.16556549072265625, -0.15798568725585938, -0.1504058837890625, -0.14282608032226562, -0.13524627685546875, -0.12766647338867188, -0.120086669921875, -0.11250686645507812, -0.10492706298828125, -0.09734725952148438, -0.0897674560546875, -0.08218765258789062, -0.07460784912109375, -0.06702804565429688, -0.0594482421875, -0.051868438720703125, -0.04428863525390625, -0.036708831787109375, -0.0291290283203125, -0.021549224853515625, -0.01396942138671875, -0.006389617919921875, 0.001190185546875, 0.008769989013671875, 0.01634979248046875, 0.023929595947265625, 0.0315093994140625, 0.039089202880859375, 0.04666900634765625, 0.054248809814453125, 0.06182861328125, 0.06940841674804688, 0.07698822021484375, 0.08456802368164062, 0.0921478271484375, 0.09972763061523438, 0.10730743408203125, 0.11488723754882812, 0.122467041015625, 0.13004684448242188, 0.13762664794921875, 0.14520645141601562, 0.1527862548828125, 0.16036605834960938, 0.16794586181640625, 0.17552566528320312, 0.18310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 6.0, 5.0, 8.0, 9.0, 14.0, 13.0, 11.0, 28.0, 19.0, 27.0, 41.0, 49.0, 53.0, 54.0, 60.0, 70.0, 72.0, 64.0, 47.0, 64.0, 51.0, 38.0, 38.0, 16.0, 29.0, 28.0, 21.0, 15.0, 13.0, 14.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062164306640625, -0.06045818328857422, -0.05875205993652344, -0.057045936584472656, -0.055339813232421875, -0.053633689880371094, -0.05192756652832031, -0.05022144317626953, -0.04851531982421875, -0.04680919647216797, -0.04510307312011719, -0.043396949768066406, -0.041690826416015625, -0.039984703063964844, -0.03827857971191406, -0.03657245635986328, -0.0348663330078125, -0.03316020965576172, -0.03145408630371094, -0.029747962951660156, -0.028041839599609375, -0.026335716247558594, -0.024629592895507812, -0.02292346954345703, -0.02121734619140625, -0.01951122283935547, -0.017805099487304688, -0.016098976135253906, -0.014392852783203125, -0.012686729431152344, -0.010980606079101562, -0.009274482727050781, -0.007568359375, -0.005862236022949219, -0.0041561126708984375, -0.0024499893188476562, -0.000743865966796875, 0.0009622573852539062, 0.0026683807373046875, 0.004374504089355469, 0.00608062744140625, 0.007786750793457031, 0.009492874145507812, 0.011198997497558594, 0.012905120849609375, 0.014611244201660156, 0.016317367553710938, 0.01802349090576172, 0.0197296142578125, 0.02143573760986328, 0.023141860961914062, 0.024847984313964844, 0.026554107666015625, 0.028260231018066406, 0.029966354370117188, 0.03167247772216797, 0.03337860107421875, 0.03508472442626953, 0.03679084777832031, 0.038496971130371094, 0.040203094482421875, 0.041909217834472656, 0.04361534118652344, 0.04532146453857422, 0.047027587890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 1.0, 16.0, 20.0, 32.0, 32.0, 61.0, 87.0, 125.0, 219.0, 347.0, 619.0, 1189.0, 2378.0, 4607.0, 9824.0, 21931.0, 54311.0, 147117.0, 446497.0, 1409155.0, 1404466.0, 447513.0, 147810.0, 54063.0, 22373.0, 9742.0, 4533.0, 2350.0, 1247.0, 658.0, 352.0, 208.0, 148.0, 80.0, 54.0, 27.0, 27.0, 18.0, 4.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07586669921875, -0.07349586486816406, -0.07112503051757812, -0.06875419616699219, -0.06638336181640625, -0.06401252746582031, -0.061641693115234375, -0.05927085876464844, -0.0569000244140625, -0.05452919006347656, -0.052158355712890625, -0.04978752136230469, -0.04741668701171875, -0.04504585266113281, -0.042675018310546875, -0.04030418395996094, -0.037933349609375, -0.03556251525878906, -0.033191680908203125, -0.030820846557617188, -0.02845001220703125, -0.026079177856445312, -0.023708343505859375, -0.021337509155273438, -0.0189666748046875, -0.016595840454101562, -0.014225006103515625, -0.011854171752929688, -0.00948333740234375, -0.0071125030517578125, -0.004741668701171875, -0.0023708343505859375, 0.0, 0.0023708343505859375, 0.004741668701171875, 0.0071125030517578125, 0.00948333740234375, 0.011854171752929688, 0.014225006103515625, 0.016595840454101562, 0.0189666748046875, 0.021337509155273438, 0.023708343505859375, 0.026079177856445312, 0.02845001220703125, 0.030820846557617188, 0.033191680908203125, 0.03556251525878906, 0.037933349609375, 0.04030418395996094, 0.042675018310546875, 0.04504585266113281, 0.04741668701171875, 0.04978752136230469, 0.052158355712890625, 0.05452919006347656, 0.0569000244140625, 0.05927085876464844, 0.061641693115234375, 0.06401252746582031, 0.06638336181640625, 0.06875419616699219, 0.07112503051757812, 0.07349586486816406, 0.07586669921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 5.0, 9.0, 10.0, 8.0, 12.0, 25.0, 39.0, 49.0, 52.0, 85.0, 128.0, 199.0, 270.0, 372.0, 554.0, 643.0, 536.0, 344.0, 235.0, 144.0, 86.0, 76.0, 57.0, 37.0, 20.0, 25.0, 9.0, 15.0, 8.0, 7.0, 10.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07611083984375, -0.07394933700561523, -0.07178783416748047, -0.0696263313293457, -0.06746482849121094, -0.06530332565307617, -0.0631418228149414, -0.06098031997680664, -0.058818817138671875, -0.05665731430053711, -0.054495811462402344, -0.05233430862426758, -0.05017280578613281, -0.04801130294799805, -0.04584980010986328, -0.043688297271728516, -0.04152679443359375, -0.039365291595458984, -0.03720378875732422, -0.03504228591918945, -0.03288078308105469, -0.030719280242919922, -0.028557777404785156, -0.02639627456665039, -0.024234771728515625, -0.02207326889038086, -0.019911766052246094, -0.017750263214111328, -0.015588760375976562, -0.013427257537841797, -0.011265754699707031, -0.009104251861572266, -0.0069427490234375, -0.004781246185302734, -0.0026197433471679688, -0.0004582405090332031, 0.0017032623291015625, 0.003864765167236328, 0.006026268005371094, 0.00818777084350586, 0.010349273681640625, 0.01251077651977539, 0.014672279357910156, 0.016833782196044922, 0.018995285034179688, 0.021156787872314453, 0.02331829071044922, 0.025479793548583984, 0.02764129638671875, 0.029802799224853516, 0.03196430206298828, 0.03412580490112305, 0.03628730773925781, 0.03844881057739258, 0.040610313415527344, 0.04277181625366211, 0.044933319091796875, 0.04709482192993164, 0.049256324768066406, 0.05141782760620117, 0.05357933044433594, 0.0557408332824707, 0.05790233612060547, 0.060063838958740234, 0.062225341796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 7.0, 12.0, 18.0, 16.0, 25.0, 30.0, 37.0, 41.0, 57.0, 67.0, 72.0, 72.0, 74.0, 85.0, 81.0, 62.0, 66.0, 40.0, 37.0, 32.0, 15.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2082008570432663, -0.20202209055423737, -0.19584332406520844, -0.1896645724773407, -0.18348580598831177, -0.17730703949928284, -0.1711282730102539, -0.16494950652122498, -0.15877074003219604, -0.15259197354316711, -0.14641320705413818, -0.14023444056510925, -0.13405568897724152, -0.12787692248821259, -0.12169815599918365, -0.11551938951015472, -0.10934063792228699, -0.10316187143325806, -0.09698311239480972, -0.09080434590578079, -0.08462558686733246, -0.07844682037830353, -0.0722680538892746, -0.06608928740024567, -0.05991052836179733, -0.0537317655980587, -0.04755300283432007, -0.04137423634529114, -0.035195473581552505, -0.029016710817813873, -0.022837944328784943, -0.01665918156504631, -0.010480418801307678, -0.004301655106246471, 0.0018771085888147354, 0.008055873215198517, 0.014234635978937149, 0.02041339874267578, 0.026592165231704712, 0.032770927995443344, 0.038949690759181976, 0.04512845352292061, 0.05130721628665924, 0.05748598277568817, 0.0636647492647171, 0.06984350830316544, 0.07602227479219437, 0.0822010338306427, 0.08837980031967163, 0.09455856680870056, 0.1007373258471489, 0.10691609233617783, 0.11309485137462616, 0.11927361786365509, 0.12545238435268402, 0.13163115084171295, 0.1378099024295807, 0.14398866891860962, 0.15016743540763855, 0.15634620189666748, 0.16252495348453522, 0.16870371997356415, 0.17488248646259308, 0.181061252951622, 0.18724001944065094]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 4.0, 11.0, 12.0, 7.0, 10.0, 14.0, 8.0, 17.0, 26.0, 37.0, 27.0, 33.0, 36.0, 46.0, 43.0, 44.0, 43.0, 42.0, 42.0, 44.0, 47.0, 45.0, 42.0, 43.0, 40.0, 36.0, 34.0, 26.0, 25.0, 19.0, 17.0, 14.0, 9.0, 10.0, 11.0, 4.0, 8.0, 1.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1924980878829956, -0.18635408580303192, -0.18021009862422943, -0.17406609654426575, -0.16792210936546326, -0.16177810728549957, -0.1556341052055359, -0.1494901180267334, -0.14334611594676971, -0.13720211386680603, -0.13105812668800354, -0.12491412460803986, -0.11877012997865677, -0.11262613534927368, -0.10648213326931, -0.10033813863992691, -0.09419414401054382, -0.08805014938116074, -0.08190615475177765, -0.07576215267181396, -0.06961815804243088, -0.06347416341304779, -0.057330165058374405, -0.05118616670370102, -0.04504217207431793, -0.038898177444934845, -0.03275417909026146, -0.026610182598233223, -0.020466186106204987, -0.01432218961417675, -0.008178193122148514, -0.002034194767475128, 0.004109799861907959, 0.010253796353936195, 0.016397792845964432, 0.022541789337992668, 0.028685785830020905, 0.03482978045940399, 0.04097377881407738, 0.04711777716875076, 0.05326177179813385, 0.05940576642751694, 0.06554976105690002, 0.07169376313686371, 0.0778377577662468, 0.08398175239562988, 0.09012575447559357, 0.09626974910497665, 0.10241374373435974, 0.10855773836374283, 0.11470173299312592, 0.1208457350730896, 0.1269897222518921, 0.13313372433185577, 0.13927772641181946, 0.14542171359062195, 0.15156571567058563, 0.15770971775054932, 0.1638537049293518, 0.1699977070093155, 0.17614170908927917, 0.18228569626808167, 0.18842969834804535, 0.19457370042800903, 0.20071768760681152]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 17.0, 19.0, 10.0, 23.0, 31.0, 55.0, 74.0, 91.0, 145.0, 216.0, 361.0, 535.0, 797.0, 1304.0, 2139.0, 3710.0, 6796.0, 12588.0, 24994.0, 50833.0, 104519.0, 201313.0, 269186.0, 182640.0, 92756.0, 44879.0, 22442.0, 11373.0, 5891.0, 3359.0, 1984.0, 1287.0, 753.0, 421.0, 311.0, 196.0, 122.0, 102.0, 66.0, 57.0, 35.0, 27.0, 24.0, 14.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.062346458435058594, -0.06036186218261719, -0.05837726593017578, -0.056392669677734375, -0.05440807342529297, -0.05242347717285156, -0.050438880920410156, -0.04845428466796875, -0.046469688415527344, -0.04448509216308594, -0.04250049591064453, -0.040515899658203125, -0.03853130340576172, -0.03654670715332031, -0.034562110900878906, -0.0325775146484375, -0.030592918395996094, -0.028608322143554688, -0.02662372589111328, -0.024639129638671875, -0.02265453338623047, -0.020669937133789062, -0.018685340881347656, -0.01670074462890625, -0.014716148376464844, -0.012731552124023438, -0.010746955871582031, -0.008762359619140625, -0.006777763366699219, -0.0047931671142578125, -0.0028085708618164062, -0.000823974609375, 0.0011606216430664062, 0.0031452178955078125, 0.005129814147949219, 0.007114410400390625, 0.009099006652832031, 0.011083602905273438, 0.013068199157714844, 0.01505279541015625, 0.017037391662597656, 0.019021987915039062, 0.02100658416748047, 0.022991180419921875, 0.02497577667236328, 0.026960372924804688, 0.028944969177246094, 0.0309295654296875, 0.032914161682128906, 0.03489875793457031, 0.03688335418701172, 0.038867950439453125, 0.04085254669189453, 0.04283714294433594, 0.044821739196777344, 0.04680633544921875, 0.048790931701660156, 0.05077552795410156, 0.05276012420654297, 0.054744720458984375, 0.05672931671142578, 0.05871391296386719, 0.060698509216308594, 0.06268310546875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 15.0, 12.0, 12.0, 15.0, 24.0, 18.0, 30.0, 41.0, 52.0, 41.0, 51.0, 38.0, 47.0, 56.0, 53.0, 53.0, 53.0, 44.0, 46.0, 36.0, 42.0, 31.0, 27.0, 29.0, 17.0, 23.0, 21.0, 17.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0487060546875, -0.04729318618774414, -0.04588031768798828, -0.04446744918823242, -0.04305458068847656, -0.0416417121887207, -0.040228843688964844, -0.038815975189208984, -0.037403106689453125, -0.035990238189697266, -0.034577369689941406, -0.03316450119018555, -0.03175163269042969, -0.030338764190673828, -0.02892589569091797, -0.02751302719116211, -0.02610015869140625, -0.02468729019165039, -0.02327442169189453, -0.021861553192138672, -0.020448684692382812, -0.019035816192626953, -0.017622947692871094, -0.016210079193115234, -0.014797210693359375, -0.013384342193603516, -0.011971473693847656, -0.010558605194091797, -0.009145736694335938, -0.007732868194580078, -0.006319999694824219, -0.004907131195068359, -0.0034942626953125, -0.0020813941955566406, -0.0006685256958007812, 0.0007443428039550781, 0.0021572113037109375, 0.003570079803466797, 0.004982948303222656, 0.006395816802978516, 0.007808685302734375, 0.009221553802490234, 0.010634422302246094, 0.012047290802001953, 0.013460159301757812, 0.014873027801513672, 0.01628589630126953, 0.01769876480102539, 0.01911163330078125, 0.02052450180053711, 0.02193737030029297, 0.023350238800048828, 0.024763107299804688, 0.026175975799560547, 0.027588844299316406, 0.029001712799072266, 0.030414581298828125, 0.031827449798583984, 0.033240318298339844, 0.0346531867980957, 0.03606605529785156, 0.03747892379760742, 0.03889179229736328, 0.04030466079711914, 0.041717529296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 7.0, 7.0, 4.0, 14.0, 9.0, 14.0, 17.0, 15.0, 21.0, 19.0, 23.0, 37.0, 37.0, 52.0, 86.0, 142.0, 488.0, 3538.0, 80208.0, 888355.0, 71191.0, 3287.0, 473.0, 130.0, 72.0, 55.0, 25.0, 31.0, 28.0, 18.0, 31.0, 21.0, 13.0, 15.0, 11.0, 13.0, 3.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0], "bins": [-0.450927734375, -0.438568115234375, -0.42620849609375, -0.413848876953125, -0.4014892578125, -0.389129638671875, -0.37677001953125, -0.364410400390625, -0.35205078125, -0.339691162109375, -0.32733154296875, -0.314971923828125, -0.3026123046875, -0.290252685546875, -0.27789306640625, -0.265533447265625, -0.253173828125, -0.240814208984375, -0.22845458984375, -0.216094970703125, -0.2037353515625, -0.191375732421875, -0.17901611328125, -0.166656494140625, -0.154296875, -0.141937255859375, -0.12957763671875, -0.117218017578125, -0.1048583984375, -0.092498779296875, -0.08013916015625, -0.067779541015625, -0.055419921875, -0.043060302734375, -0.03070068359375, -0.018341064453125, -0.0059814453125, 0.006378173828125, 0.01873779296875, 0.031097412109375, 0.04345703125, 0.055816650390625, 0.06817626953125, 0.080535888671875, 0.0928955078125, 0.105255126953125, 0.11761474609375, 0.129974365234375, 0.142333984375, 0.154693603515625, 0.16705322265625, 0.179412841796875, 0.1917724609375, 0.204132080078125, 0.21649169921875, 0.228851318359375, 0.2412109375, 0.253570556640625, 0.26593017578125, 0.278289794921875, 0.2906494140625, 0.303009033203125, 0.31536865234375, 0.327728271484375, 0.340087890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 10.0, 3.0, 13.0, 8.0, 14.0, 17.0, 20.0, 19.0, 26.0, 30.0, 29.0, 26.0, 51.0, 40.0, 42.0, 40.0, 51.0, 50.0, 42.0, 49.0, 53.0, 35.0, 36.0, 34.0, 35.0, 27.0, 25.0, 16.0, 32.0, 19.0, 22.0, 13.0, 12.0, 9.0, 6.0, 8.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.10223388671875, -0.09938716888427734, -0.09654045104980469, -0.09369373321533203, -0.09084701538085938, -0.08800029754638672, -0.08515357971191406, -0.0823068618774414, -0.07946014404296875, -0.0766134262084961, -0.07376670837402344, -0.07091999053955078, -0.06807327270507812, -0.06522655487060547, -0.06237983703613281, -0.059533119201660156, -0.0566864013671875, -0.053839683532714844, -0.05099296569824219, -0.04814624786376953, -0.045299530029296875, -0.04245281219482422, -0.03960609436035156, -0.036759376525878906, -0.03391265869140625, -0.031065940856933594, -0.028219223022460938, -0.02537250518798828, -0.022525787353515625, -0.01967906951904297, -0.016832351684570312, -0.013985633850097656, -0.011138916015625, -0.008292198181152344, -0.0054454803466796875, -0.0025987625122070312, 0.000247955322265625, 0.0030946731567382812, 0.0059413909912109375, 0.008788108825683594, 0.01163482666015625, 0.014481544494628906, 0.017328262329101562, 0.02017498016357422, 0.023021697998046875, 0.02586841583251953, 0.028715133666992188, 0.031561851501464844, 0.0344085693359375, 0.037255287170410156, 0.04010200500488281, 0.04294872283935547, 0.045795440673828125, 0.04864215850830078, 0.05148887634277344, 0.054335594177246094, 0.05718231201171875, 0.060029029846191406, 0.06287574768066406, 0.06572246551513672, 0.06856918334960938, 0.07141590118408203, 0.07426261901855469, 0.07710933685302734, 0.0799560546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 11.0, 19.0, 26.0, 23.0, 46.0, 68.0, 125.0, 200.0, 350.0, 592.0, 1001.0, 1720.0, 3227.0, 6409.0, 13858.0, 34515.0, 99021.0, 303045.0, 369103.0, 136317.0, 44878.0, 17431.0, 7766.0, 3846.0, 2076.0, 1159.0, 651.0, 389.0, 230.0, 149.0, 84.0, 68.0, 44.0, 29.0, 21.0, 17.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0577392578125, -0.05614137649536133, -0.054543495178222656, -0.052945613861083984, -0.05134773254394531, -0.04974985122680664, -0.04815196990966797, -0.0465540885925293, -0.044956207275390625, -0.04335832595825195, -0.04176044464111328, -0.04016256332397461, -0.03856468200683594, -0.036966800689697266, -0.035368919372558594, -0.03377103805541992, -0.03217315673828125, -0.030575275421142578, -0.028977394104003906, -0.027379512786865234, -0.025781631469726562, -0.02418375015258789, -0.02258586883544922, -0.020987987518310547, -0.019390106201171875, -0.017792224884033203, -0.01619434356689453, -0.01459646224975586, -0.012998580932617188, -0.011400699615478516, -0.009802818298339844, -0.008204936981201172, -0.0066070556640625, -0.005009174346923828, -0.0034112930297851562, -0.0018134117126464844, -0.0002155303955078125, 0.0013823509216308594, 0.0029802322387695312, 0.004578113555908203, 0.006175994873046875, 0.007773876190185547, 0.009371757507324219, 0.01096963882446289, 0.012567520141601562, 0.014165401458740234, 0.015763282775878906, 0.017361164093017578, 0.01895904541015625, 0.020556926727294922, 0.022154808044433594, 0.023752689361572266, 0.025350570678710938, 0.02694845199584961, 0.02854633331298828, 0.030144214630126953, 0.031742095947265625, 0.0333399772644043, 0.03493785858154297, 0.03653573989868164, 0.03813362121582031, 0.039731502532958984, 0.041329383850097656, 0.04292726516723633, 0.044525146484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 10.0, 8.0, 9.0, 15.0, 40.0, 46.0, 61.0, 92.0, 127.0, 111.0, 128.0, 88.0, 74.0, 41.0, 38.0, 13.0, 19.0, 6.0, 4.0, 7.0, 7.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.4437904357910156e-05, -2.370774745941162e-05, -2.2977590560913086e-05, -2.224743366241455e-05, -2.1517276763916016e-05, -2.078711986541748e-05, -2.0056962966918945e-05, -1.932680606842041e-05, -1.8596649169921875e-05, -1.786649227142334e-05, -1.7136335372924805e-05, -1.640617847442627e-05, -1.5676021575927734e-05, -1.49458646774292e-05, -1.4215707778930664e-05, -1.3485550880432129e-05, -1.2755393981933594e-05, -1.2025237083435059e-05, -1.1295080184936523e-05, -1.0564923286437988e-05, -9.834766387939453e-06, -9.104609489440918e-06, -8.374452590942383e-06, -7.644295692443848e-06, -6.9141387939453125e-06, -6.183981895446777e-06, -5.453824996948242e-06, -4.723668098449707e-06, -3.993511199951172e-06, -3.2633543014526367e-06, -2.5331974029541016e-06, -1.8030405044555664e-06, -1.0728836059570312e-06, -3.427267074584961e-07, 3.8743019104003906e-07, 1.1175870895385742e-06, 1.8477439880371094e-06, 2.5779008865356445e-06, 3.3080577850341797e-06, 4.038214683532715e-06, 4.76837158203125e-06, 5.498528480529785e-06, 6.22868537902832e-06, 6.9588422775268555e-06, 7.68899917602539e-06, 8.419156074523926e-06, 9.149312973022461e-06, 9.879469871520996e-06, 1.0609626770019531e-05, 1.1339783668518066e-05, 1.2069940567016602e-05, 1.2800097465515137e-05, 1.3530254364013672e-05, 1.4260411262512207e-05, 1.4990568161010742e-05, 1.5720725059509277e-05, 1.6450881958007812e-05, 1.7181038856506348e-05, 1.7911195755004883e-05, 1.8641352653503418e-05, 1.9371509552001953e-05, 2.0101666450500488e-05, 2.0831823348999023e-05, 2.156198024749756e-05, 2.2292137145996094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 3.0, 4.0, 6.0, 6.0, 8.0, 7.0, 12.0, 12.0, 17.0, 15.0, 27.0, 31.0, 40.0, 67.0, 224.0, 1032.0, 10482.0, 248551.0, 743757.0, 40547.0, 2912.0, 433.0, 111.0, 54.0, 40.0, 32.0, 19.0, 19.0, 18.0, 12.0, 9.0, 7.0, 10.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10491943359375, -0.10144901275634766, -0.09797859191894531, -0.09450817108154297, -0.09103775024414062, -0.08756732940673828, -0.08409690856933594, -0.0806264877319336, -0.07715606689453125, -0.0736856460571289, -0.07021522521972656, -0.06674480438232422, -0.06327438354492188, -0.05980396270751953, -0.05633354187011719, -0.052863121032714844, -0.0493927001953125, -0.045922279357910156, -0.04245185852050781, -0.03898143768310547, -0.035511016845703125, -0.03204059600830078, -0.028570175170898438, -0.025099754333496094, -0.02162933349609375, -0.018158912658691406, -0.014688491821289062, -0.011218070983886719, -0.007747650146484375, -0.004277229309082031, -0.0008068084716796875, 0.0026636123657226562, 0.006134033203125, 0.009604454040527344, 0.013074874877929688, 0.01654529571533203, 0.020015716552734375, 0.02348613739013672, 0.026956558227539062, 0.030426979064941406, 0.03389739990234375, 0.037367820739746094, 0.04083824157714844, 0.04430866241455078, 0.047779083251953125, 0.05124950408935547, 0.05471992492675781, 0.058190345764160156, 0.0616607666015625, 0.06513118743896484, 0.06860160827636719, 0.07207202911376953, 0.07554244995117188, 0.07901287078857422, 0.08248329162597656, 0.0859537124633789, 0.08942413330078125, 0.0928945541381836, 0.09636497497558594, 0.09983539581298828, 0.10330581665039062, 0.10677623748779297, 0.11024665832519531, 0.11371707916259766, 0.1171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 9.0, 3.0, 3.0, 4.0, 5.0, 11.0, 2.0, 15.0, 7.0, 14.0, 19.0, 16.0, 25.0, 30.0, 45.0, 40.0, 52.0, 50.0, 76.0, 92.0, 62.0, 66.0, 57.0, 50.0, 47.0, 40.0, 28.0, 30.0, 23.0, 17.0, 12.0, 15.0, 6.0, 11.0, 6.0, 7.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.022821903228759766, -0.02208423614501953, -0.021346569061279297, -0.020608901977539062, -0.019871234893798828, -0.019133567810058594, -0.01839590072631836, -0.017658233642578125, -0.01692056655883789, -0.016182899475097656, -0.015445232391357422, -0.014707565307617188, -0.013969898223876953, -0.013232231140136719, -0.012494564056396484, -0.01175689697265625, -0.011019229888916016, -0.010281562805175781, -0.009543895721435547, -0.008806228637695312, -0.008068561553955078, -0.007330894470214844, -0.006593227386474609, -0.005855560302734375, -0.005117893218994141, -0.004380226135253906, -0.003642559051513672, -0.0029048919677734375, -0.002167224884033203, -0.0014295578002929688, -0.0006918907165527344, 4.57763671875e-05, 0.0007834434509277344, 0.0015211105346679688, 0.002258777618408203, 0.0029964447021484375, 0.003734111785888672, 0.004471778869628906, 0.005209445953369141, 0.005947113037109375, 0.006684780120849609, 0.007422447204589844, 0.008160114288330078, 0.008897781372070312, 0.009635448455810547, 0.010373115539550781, 0.011110782623291016, 0.01184844970703125, 0.012586116790771484, 0.013323783874511719, 0.014061450958251953, 0.014799118041992188, 0.015536785125732422, 0.016274452209472656, 0.01701211929321289, 0.017749786376953125, 0.01848745346069336, 0.019225120544433594, 0.019962787628173828, 0.020700454711914062, 0.021438121795654297, 0.02217578887939453, 0.022913455963134766, 0.023651123046875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 9.0, 17.0, 63.0, 184.0, 344.0, 257.0, 94.0, 27.0, 17.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072701930999756, -1.3795124292373657, -1.3517545461654663, -1.3239967823028564, -1.296238899230957, -1.2684811353683472, -1.2407233715057373, -1.212965488433838, -1.185207724571228, -1.1574499607086182, -1.1296920776367188, -1.1019343137741089, -1.074176549911499, -1.0464186668395996, -1.0186609029769897, -0.9909030795097351, -0.9631452560424805, -0.9353874325752258, -0.9076296091079712, -0.8798718452453613, -0.8521140217781067, -0.824356198310852, -0.7965984344482422, -0.7688406109809875, -0.7410827875137329, -0.7133249640464783, -0.6855671405792236, -0.6578093767166138, -0.6300515532493591, -0.6022937297821045, -0.5745359659194946, -0.54677814245224, -0.5190203785896301, -0.4912625551223755, -0.46350476145744324, -0.435746967792511, -0.40798914432525635, -0.3802313208580017, -0.35247352719306946, -0.3247157335281372, -0.29695791006088257, -0.26920008659362793, -0.24144229292869568, -0.21368448436260223, -0.1859266757965088, -0.15816886723041534, -0.1304110586643219, -0.10265325009822845, -0.07489544153213501, -0.047137632966041565, -0.01937982439994812, 0.008377984166145325, 0.03613579273223877, 0.06389360129833221, 0.09165140986442566, 0.1194092184305191, 0.14716702699661255, 0.174924835562706, 0.20268264412879944, 0.23044045269489288, 0.25819826126098633, 0.28595608472824097, 0.3137138783931732, 0.34147167205810547, 0.3692294955253601]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 13.0, 8.0, 4.0, 9.0, 14.0, 15.0, 16.0, 19.0, 22.0, 32.0, 38.0, 31.0, 35.0, 49.0, 44.0, 53.0, 53.0, 55.0, 48.0, 36.0, 53.0, 35.0, 52.0, 32.0, 39.0, 32.0, 31.0, 14.0, 14.0, 19.0, 23.0, 16.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34522736072540283, -0.3336951732635498, -0.3221629559993744, -0.31063076853752136, -0.29909858107566833, -0.2875663638114929, -0.2760341763496399, -0.26450198888778687, -0.25296980142593384, -0.24143759906291962, -0.2299054116010666, -0.21837320923805237, -0.20684102177619934, -0.19530881941318512, -0.1837766170501709, -0.17224442958831787, -0.16071221232414246, -0.14918000996112823, -0.1376478224992752, -0.126115620136261, -0.11458342522382736, -0.10305123031139374, -0.09151902794837952, -0.07998683303594589, -0.06845463812351227, -0.056922443211078644, -0.04539024457335472, -0.0338580459356308, -0.022325851023197174, -0.01079365611076355, 0.0007385462522506714, 0.012270741164684296, 0.02380293607711792, 0.035335130989551544, 0.04686732962727547, 0.05839952826499939, 0.06993172317743301, 0.08146391808986664, 0.09299612045288086, 0.10452831536531448, 0.11606051027774811, 0.12759271264076233, 0.13912490010261536, 0.15065710246562958, 0.1621893048286438, 0.17372149229049683, 0.18525369465351105, 0.19678589701652527, 0.2083180844783783, 0.21985028684139252, 0.23138247430324554, 0.24291467666625977, 0.2544468641281128, 0.2659790515899658, 0.27751126885414124, 0.28904345631599426, 0.3005756735801697, 0.3121078610420227, 0.3236400783061981, 0.33517226576805115, 0.3467044532299042, 0.3582366704940796, 0.3697688579559326, 0.38130104541778564, 0.39283323287963867]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 21.0, 28.0, 32.0, 61.0, 71.0, 122.0, 183.0, 274.0, 504.0, 811.0, 1651.0, 3306.0, 7321.0, 18232.0, 54066.0, 210263.0, 1411231.0, 2082652.0, 297392.0, 68966.0, 21884.0, 8069.0, 3427.0, 1639.0, 809.0, 449.0, 275.0, 167.0, 104.0, 69.0, 45.0, 39.0, 20.0, 11.0, 15.0, 13.0, 6.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.12384033203125, -0.12050247192382812, -0.11716461181640625, -0.11382675170898438, -0.1104888916015625, -0.10715103149414062, -0.10381317138671875, -0.10047531127929688, -0.097137451171875, -0.09379959106445312, -0.09046173095703125, -0.08712387084960938, -0.0837860107421875, -0.08044815063476562, -0.07711029052734375, -0.07377243041992188, -0.0704345703125, -0.06709671020507812, -0.06375885009765625, -0.060420989990234375, -0.0570831298828125, -0.053745269775390625, -0.05040740966796875, -0.047069549560546875, -0.043731689453125, -0.040393829345703125, -0.03705596923828125, -0.033718109130859375, -0.0303802490234375, -0.027042388916015625, -0.02370452880859375, -0.020366668701171875, -0.01702880859375, -0.013690948486328125, -0.01035308837890625, -0.007015228271484375, -0.0036773681640625, -0.000339508056640625, 0.00299835205078125, 0.006336212158203125, 0.009674072265625, 0.013011932373046875, 0.01634979248046875, 0.019687652587890625, 0.0230255126953125, 0.026363372802734375, 0.02970123291015625, 0.033039093017578125, 0.036376953125, 0.039714813232421875, 0.04305267333984375, 0.046390533447265625, 0.0497283935546875, 0.053066253662109375, 0.05640411376953125, 0.059741973876953125, 0.063079833984375, 0.06641769409179688, 0.06975555419921875, 0.07309341430664062, 0.0764312744140625, 0.07976913452148438, 0.08310699462890625, 0.08644485473632812, 0.08978271484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 4.0, 13.0, 6.0, 9.0, 11.0, 18.0, 13.0, 23.0, 20.0, 26.0, 27.0, 40.0, 38.0, 53.0, 39.0, 50.0, 64.0, 57.0, 55.0, 42.0, 44.0, 43.0, 41.0, 32.0, 40.0, 27.0, 26.0, 19.0, 16.0, 21.0, 21.0, 12.0, 8.0, 8.0, 3.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.05084228515625, -0.04945516586303711, -0.04806804656982422, -0.04668092727661133, -0.04529380798339844, -0.04390668869018555, -0.042519569396972656, -0.041132450103759766, -0.039745330810546875, -0.038358211517333984, -0.036971092224121094, -0.0355839729309082, -0.03419685363769531, -0.03280973434448242, -0.03142261505126953, -0.03003549575805664, -0.02864837646484375, -0.02726125717163086, -0.02587413787841797, -0.024487018585205078, -0.023099899291992188, -0.021712779998779297, -0.020325660705566406, -0.018938541412353516, -0.017551422119140625, -0.016164302825927734, -0.014777183532714844, -0.013390064239501953, -0.012002944946289062, -0.010615825653076172, -0.009228706359863281, -0.00784158706665039, -0.0064544677734375, -0.005067348480224609, -0.0036802291870117188, -0.002293109893798828, -0.0009059906005859375, 0.0004811286926269531, 0.0018682479858398438, 0.0032553672790527344, 0.004642486572265625, 0.006029605865478516, 0.007416725158691406, 0.008803844451904297, 0.010190963745117188, 0.011578083038330078, 0.012965202331542969, 0.01435232162475586, 0.01573944091796875, 0.01712656021118164, 0.01851367950439453, 0.019900798797607422, 0.021287918090820312, 0.022675037384033203, 0.024062156677246094, 0.025449275970458984, 0.026836395263671875, 0.028223514556884766, 0.029610633850097656, 0.030997753143310547, 0.03238487243652344, 0.03377199172973633, 0.03515911102294922, 0.03654623031616211, 0.037933349609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 8.0, 9.0, 9.0, 18.0, 31.0, 41.0, 61.0, 107.0, 160.0, 334.0, 603.0, 1513.0, 3646.0, 10227.0, 31997.0, 108981.0, 405240.0, 1567906.0, 1515862.0, 394262.0, 105690.0, 31001.0, 10102.0, 3698.0, 1409.0, 573.0, 349.0, 174.0, 95.0, 44.0, 36.0, 34.0, 17.0, 12.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11212158203125, -0.10850334167480469, -0.10488510131835938, -0.10126686096191406, -0.09764862060546875, -0.09403038024902344, -0.09041213989257812, -0.08679389953613281, -0.0831756591796875, -0.07955741882324219, -0.07593917846679688, -0.07232093811035156, -0.06870269775390625, -0.06508445739746094, -0.061466217041015625, -0.05784797668457031, -0.054229736328125, -0.05061149597167969, -0.046993255615234375, -0.04337501525878906, -0.03975677490234375, -0.03613853454589844, -0.032520294189453125, -0.028902053833007812, -0.0252838134765625, -0.021665573120117188, -0.018047332763671875, -0.014429092407226562, -0.01081085205078125, -0.0071926116943359375, -0.003574371337890625, 4.38690185546875e-05, 0.003662109375, 0.0072803497314453125, 0.010898590087890625, 0.014516830444335938, 0.01813507080078125, 0.021753311157226562, 0.025371551513671875, 0.028989791870117188, 0.0326080322265625, 0.03622627258300781, 0.039844512939453125, 0.04346275329589844, 0.04708099365234375, 0.05069923400878906, 0.054317474365234375, 0.05793571472167969, 0.061553955078125, 0.06517219543457031, 0.06879043579101562, 0.07240867614746094, 0.07602691650390625, 0.07964515686035156, 0.08326339721679688, 0.08688163757324219, 0.0904998779296875, 0.09411811828613281, 0.09773635864257812, 0.10135459899902344, 0.10497283935546875, 0.10859107971191406, 0.11220932006835938, 0.11582756042480469, 0.11944580078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 13.0, 11.0, 25.0, 29.0, 37.0, 54.0, 91.0, 110.0, 148.0, 222.0, 335.0, 474.0, 630.0, 555.0, 380.0, 284.0, 199.0, 145.0, 99.0, 68.0, 56.0, 27.0, 13.0, 26.0, 15.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08203125, -0.0791788101196289, -0.07632637023925781, -0.07347393035888672, -0.07062149047851562, -0.06776905059814453, -0.06491661071777344, -0.062064170837402344, -0.05921173095703125, -0.056359291076660156, -0.05350685119628906, -0.05065441131591797, -0.047801971435546875, -0.04494953155517578, -0.04209709167480469, -0.039244651794433594, -0.0363922119140625, -0.033539772033691406, -0.030687332153320312, -0.02783489227294922, -0.024982452392578125, -0.02213001251220703, -0.019277572631835938, -0.016425132751464844, -0.01357269287109375, -0.010720252990722656, -0.007867813110351562, -0.005015373229980469, -0.002162933349609375, 0.0006895065307617188, 0.0035419464111328125, 0.006394386291503906, 0.009246826171875, 0.012099266052246094, 0.014951705932617188, 0.01780414581298828, 0.020656585693359375, 0.02350902557373047, 0.026361465454101562, 0.029213905334472656, 0.03206634521484375, 0.034918785095214844, 0.03777122497558594, 0.04062366485595703, 0.043476104736328125, 0.04632854461669922, 0.04918098449707031, 0.052033424377441406, 0.0548858642578125, 0.057738304138183594, 0.06059074401855469, 0.06344318389892578, 0.06629562377929688, 0.06914806365966797, 0.07200050354003906, 0.07485294342041016, 0.07770538330078125, 0.08055782318115234, 0.08341026306152344, 0.08626270294189453, 0.08911514282226562, 0.09196758270263672, 0.09482002258300781, 0.0976724624633789, 0.10052490234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 18.0, 45.0, 96.0, 220.0, 259.0, 196.0, 104.0, 45.0, 10.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33952879905700684, -0.3144300580024719, -0.2893312871456146, -0.2642325162887573, -0.2391337752342224, -0.2140350192785263, -0.1889362633228302, -0.1638375073671341, -0.138738751411438, -0.11363999545574188, -0.08854123950004578, -0.06344248354434967, -0.038343727588653564, -0.013244971632957458, 0.011853784322738647, 0.03695254027843475, 0.06205129623413086, 0.08715005218982697, 0.11224880814552307, 0.13734756410121918, 0.16244632005691528, 0.1875450760126114, 0.2126438319683075, 0.2377425879240036, 0.2628413438796997, 0.2879400849342346, 0.3130388557910919, 0.3381376266479492, 0.36323636770248413, 0.38833510875701904, 0.41343387961387634, 0.43853265047073364, 0.46363139152526855, 0.48873013257980347, 0.5138288736343384, 0.5389276742935181, 0.564026415348053, 0.5891251564025879, 0.6142239570617676, 0.6393226981163025, 0.6644214391708374, 0.6895201802253723, 0.7146189212799072, 0.7397177219390869, 0.7648164629936218, 0.7899152040481567, 0.8150140047073364, 0.8401127457618713, 0.8652114868164062, 0.8903102278709412, 0.9154089689254761, 0.9405077695846558, 0.9656065106391907, 0.9907052516937256, 1.0158040523529053, 1.0409027338027954, 1.066001534461975, 1.0911003351211548, 1.116199016571045, 1.1412978172302246, 1.1663966178894043, 1.1914952993392944, 1.2165940999984741, 1.2416927814483643, 1.266791582107544]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 10.0, 6.0, 10.0, 9.0, 6.0, 16.0, 15.0, 22.0, 20.0, 23.0, 24.0, 29.0, 26.0, 36.0, 30.0, 41.0, 40.0, 42.0, 35.0, 34.0, 31.0, 56.0, 39.0, 44.0, 33.0, 31.0, 32.0, 34.0, 33.0, 22.0, 14.0, 14.0, 19.0, 16.0, 14.0, 12.0, 10.0, 13.0, 8.0, 10.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.20630133152008057, -0.19990728795528412, -0.19351324439048767, -0.18711921572685242, -0.18072517216205597, -0.17433112859725952, -0.16793709993362427, -0.16154305636882782, -0.15514901280403137, -0.14875496923923492, -0.14236092567443848, -0.13596689701080322, -0.12957285344600677, -0.12317880988121033, -0.11678477376699448, -0.11039073765277863, -0.10399669408798218, -0.09760265052318573, -0.09120861440896988, -0.08481457829475403, -0.07842053472995758, -0.07202649116516113, -0.06563245505094528, -0.05923841521143913, -0.05284437537193298, -0.046450335532426834, -0.040056295692920685, -0.033662255853414536, -0.027268216013908386, -0.020874176174402237, -0.014480136334896088, -0.008086096495389938, -0.001692056655883789, 0.00470198318362236, 0.01109602302312851, 0.01749006286263466, 0.023884102702140808, 0.030278142541646957, 0.03667218238115311, 0.043066222220659256, 0.049460262060165405, 0.055854301899671555, 0.062248341739177704, 0.06864237785339355, 0.07503642141819, 0.08143046498298645, 0.0878245010972023, 0.09421853721141815, 0.1006125807762146, 0.10700662434101105, 0.1134006604552269, 0.11979469656944275, 0.1261887401342392, 0.13258278369903564, 0.1389768123626709, 0.14537085592746735, 0.1517648994922638, 0.15815894305706024, 0.1645529866218567, 0.17094701528549194, 0.1773410588502884, 0.18373510241508484, 0.1901291310787201, 0.19652317464351654, 0.202917218208313]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 14.0, 18.0, 18.0, 29.0, 35.0, 73.0, 103.0, 149.0, 289.0, 490.0, 844.0, 1400.0, 2477.0, 4513.0, 8561.0, 18199.0, 45336.0, 128168.0, 316820.0, 314264.0, 125534.0, 44238.0, 17987.0, 8471.0, 4592.0, 2541.0, 1378.0, 826.0, 470.0, 282.0, 156.0, 105.0, 57.0, 41.0, 26.0, 18.0, 9.0, 5.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.1245107650756836, -0.12084770202636719, -0.11718463897705078, -0.11352157592773438, -0.10985851287841797, -0.10619544982910156, -0.10253238677978516, -0.09886932373046875, -0.09520626068115234, -0.09154319763183594, -0.08788013458251953, -0.08421707153320312, -0.08055400848388672, -0.07689094543457031, -0.0732278823852539, -0.0695648193359375, -0.0659017562866211, -0.06223869323730469, -0.05857563018798828, -0.054912567138671875, -0.05124950408935547, -0.04758644104003906, -0.043923377990722656, -0.04026031494140625, -0.036597251892089844, -0.03293418884277344, -0.02927112579345703, -0.025608062744140625, -0.02194499969482422, -0.018281936645507812, -0.014618873596191406, -0.010955810546875, -0.007292747497558594, -0.0036296844482421875, 3.337860107421875e-05, 0.003696441650390625, 0.007359504699707031, 0.011022567749023438, 0.014685630798339844, 0.01834869384765625, 0.022011756896972656, 0.025674819946289062, 0.02933788299560547, 0.033000946044921875, 0.03666400909423828, 0.04032707214355469, 0.043990135192871094, 0.0476531982421875, 0.051316261291503906, 0.05497932434082031, 0.05864238739013672, 0.062305450439453125, 0.06596851348876953, 0.06963157653808594, 0.07329463958740234, 0.07695770263671875, 0.08062076568603516, 0.08428382873535156, 0.08794689178466797, 0.09160995483398438, 0.09527301788330078, 0.09893608093261719, 0.1025991439819336, 0.10626220703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 8.0, 10.0, 13.0, 13.0, 16.0, 14.0, 24.0, 24.0, 29.0, 40.0, 38.0, 48.0, 44.0, 44.0, 53.0, 50.0, 55.0, 46.0, 51.0, 43.0, 33.0, 40.0, 35.0, 26.0, 35.0, 22.0, 26.0, 12.0, 18.0, 8.0, 13.0, 15.0, 5.0, 10.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.044708251953125, -0.04349851608276367, -0.042288780212402344, -0.041079044342041016, -0.03986930847167969, -0.03865957260131836, -0.03744983673095703, -0.0362401008605957, -0.035030364990234375, -0.03382062911987305, -0.03261089324951172, -0.03140115737915039, -0.030191421508789062, -0.028981685638427734, -0.027771949768066406, -0.026562213897705078, -0.02535247802734375, -0.024142742156982422, -0.022933006286621094, -0.021723270416259766, -0.020513534545898438, -0.01930379867553711, -0.01809406280517578, -0.016884326934814453, -0.015674591064453125, -0.014464855194091797, -0.013255119323730469, -0.01204538345336914, -0.010835647583007812, -0.009625911712646484, -0.008416175842285156, -0.007206439971923828, -0.0059967041015625, -0.004786968231201172, -0.0035772323608398438, -0.0023674964904785156, -0.0011577606201171875, 5.1975250244140625e-05, 0.0012617111206054688, 0.002471446990966797, 0.003681182861328125, 0.004890918731689453, 0.006100654602050781, 0.007310390472412109, 0.008520126342773438, 0.009729862213134766, 0.010939598083496094, 0.012149333953857422, 0.01335906982421875, 0.014568805694580078, 0.015778541564941406, 0.016988277435302734, 0.018198013305664062, 0.01940774917602539, 0.02061748504638672, 0.021827220916748047, 0.023036956787109375, 0.024246692657470703, 0.02545642852783203, 0.02666616439819336, 0.027875900268554688, 0.029085636138916016, 0.030295372009277344, 0.03150510787963867, 0.03271484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 32.0, 37.0, 51.0, 72.0, 94.0, 197.0, 319.0, 655.0, 1376.0, 3172.0, 8050.0, 22677.0, 78568.0, 327299.0, 434600.0, 120960.0, 31765.0, 10922.0, 4181.0, 1742.0, 769.0, 391.0, 217.0, 140.0, 75.0, 59.0, 34.0, 32.0, 20.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1825714111328125, -0.177520751953125, -0.1724700927734375, -0.16741943359375, -0.1623687744140625, -0.157318115234375, -0.1522674560546875, -0.147216796875, -0.1421661376953125, -0.137115478515625, -0.1320648193359375, -0.12701416015625, -0.1219635009765625, -0.116912841796875, -0.1118621826171875, -0.1068115234375, -0.1017608642578125, -0.096710205078125, -0.0916595458984375, -0.08660888671875, -0.0815582275390625, -0.076507568359375, -0.0714569091796875, -0.06640625, -0.0613555908203125, -0.056304931640625, -0.0512542724609375, -0.04620361328125, -0.0411529541015625, -0.036102294921875, -0.0310516357421875, -0.0260009765625, -0.0209503173828125, -0.015899658203125, -0.0108489990234375, -0.00579833984375, -0.0007476806640625, 0.004302978515625, 0.0093536376953125, 0.014404296875, 0.0194549560546875, 0.024505615234375, 0.0295562744140625, 0.03460693359375, 0.0396575927734375, 0.044708251953125, 0.0497589111328125, 0.0548095703125, 0.0598602294921875, 0.064910888671875, 0.0699615478515625, 0.07501220703125, 0.0800628662109375, 0.085113525390625, 0.0901641845703125, 0.09521484375, 0.1002655029296875, 0.105316162109375, 0.1103668212890625, 0.11541748046875, 0.1204681396484375, 0.125518798828125, 0.1305694580078125, 0.1356201171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 10.0, 4.0, 11.0, 11.0, 11.0, 22.0, 26.0, 16.0, 35.0, 54.0, 45.0, 44.0, 48.0, 55.0, 51.0, 62.0, 55.0, 61.0, 49.0, 58.0, 48.0, 49.0, 34.0, 35.0, 17.0, 16.0, 18.0, 16.0, 12.0, 4.0, 7.0, 5.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.127197265625, -0.12374687194824219, -0.12029647827148438, -0.11684608459472656, -0.11339569091796875, -0.10994529724121094, -0.10649490356445312, -0.10304450988769531, -0.0995941162109375, -0.09614372253417969, -0.09269332885742188, -0.08924293518066406, -0.08579254150390625, -0.08234214782714844, -0.07889175415039062, -0.07544136047363281, -0.071990966796875, -0.06854057312011719, -0.06509017944335938, -0.06163978576660156, -0.05818939208984375, -0.05473899841308594, -0.051288604736328125, -0.04783821105957031, -0.0443878173828125, -0.04093742370605469, -0.037487030029296875, -0.03403663635253906, -0.03058624267578125, -0.027135848999023438, -0.023685455322265625, -0.020235061645507812, -0.01678466796875, -0.013334274291992188, -0.009883880615234375, -0.0064334869384765625, -0.00298309326171875, 0.0004673004150390625, 0.003917694091796875, 0.0073680877685546875, 0.0108184814453125, 0.014268875122070312, 0.017719268798828125, 0.021169662475585938, 0.02462005615234375, 0.028070449829101562, 0.031520843505859375, 0.03497123718261719, 0.038421630859375, 0.04187202453613281, 0.045322418212890625, 0.04877281188964844, 0.05222320556640625, 0.05567359924316406, 0.059123992919921875, 0.06257438659667969, 0.0660247802734375, 0.06947517395019531, 0.07292556762695312, 0.07637596130371094, 0.07982635498046875, 0.08327674865722656, 0.08672714233398438, 0.09017753601074219, 0.0936279296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 16.0, 7.0, 17.0, 34.0, 40.0, 54.0, 68.0, 125.0, 165.0, 204.0, 368.0, 482.0, 777.0, 1147.0, 2080.0, 4843.0, 14228.0, 60108.0, 438473.0, 440532.0, 59931.0, 14427.0, 4876.0, 2093.0, 1129.0, 698.0, 437.0, 307.0, 253.0, 155.0, 126.0, 101.0, 72.0, 43.0, 36.0, 31.0, 17.0, 14.0, 7.0, 6.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10711669921875, -0.1034231185913086, -0.09972953796386719, -0.09603595733642578, -0.09234237670898438, -0.08864879608154297, -0.08495521545410156, -0.08126163482666016, -0.07756805419921875, -0.07387447357177734, -0.07018089294433594, -0.06648731231689453, -0.06279373168945312, -0.05910015106201172, -0.05540657043457031, -0.051712989807128906, -0.0480194091796875, -0.044325828552246094, -0.04063224792480469, -0.03693866729736328, -0.033245086669921875, -0.02955150604248047, -0.025857925415039062, -0.022164344787597656, -0.01847076416015625, -0.014777183532714844, -0.011083602905273438, -0.007390022277832031, -0.003696441650390625, -2.86102294921875e-06, 0.0036907196044921875, 0.007384300231933594, 0.011077880859375, 0.014771461486816406, 0.018465042114257812, 0.02215862274169922, 0.025852203369140625, 0.02954578399658203, 0.03323936462402344, 0.036932945251464844, 0.04062652587890625, 0.044320106506347656, 0.04801368713378906, 0.05170726776123047, 0.055400848388671875, 0.05909442901611328, 0.06278800964355469, 0.0664815902709961, 0.0701751708984375, 0.0738687515258789, 0.07756233215332031, 0.08125591278076172, 0.08494949340820312, 0.08864307403564453, 0.09233665466308594, 0.09603023529052734, 0.09972381591796875, 0.10341739654541016, 0.10711097717285156, 0.11080455780029297, 0.11449813842773438, 0.11819171905517578, 0.12188529968261719, 0.1255788803100586, 0.1292724609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 11.0, 29.0, 90.0, 164.0, 258.0, 213.0, 117.0, 44.0, 18.0, 14.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8252601623535156e-05, -2.6946887373924255e-05, -2.5641173124313354e-05, -2.4335458874702454e-05, -2.3029744625091553e-05, -2.1724030375480652e-05, -2.041831612586975e-05, -1.911260187625885e-05, -1.780688762664795e-05, -1.650117337703705e-05, -1.5195459127426147e-05, -1.3889744877815247e-05, -1.2584030628204346e-05, -1.1278316378593445e-05, -9.972602128982544e-06, -8.666887879371643e-06, -7.361173629760742e-06, -6.055459380149841e-06, -4.7497451305389404e-06, -3.4440308809280396e-06, -2.1383166313171387e-06, -8.326023817062378e-07, 4.731118679046631e-07, 1.778826117515564e-06, 3.084540367126465e-06, 4.390254616737366e-06, 5.695968866348267e-06, 7.0016831159591675e-06, 8.307397365570068e-06, 9.61311161518097e-06, 1.091882586479187e-05, 1.2224540114402771e-05, 1.3530254364013672e-05, 1.4835968613624573e-05, 1.6141682863235474e-05, 1.7447397112846375e-05, 1.8753111362457275e-05, 2.0058825612068176e-05, 2.1364539861679077e-05, 2.2670254111289978e-05, 2.397596836090088e-05, 2.528168261051178e-05, 2.658739686012268e-05, 2.789311110973358e-05, 2.9198825359344482e-05, 3.0504539608955383e-05, 3.1810253858566284e-05, 3.3115968108177185e-05, 3.4421682357788086e-05, 3.572739660739899e-05, 3.703311085700989e-05, 3.833882510662079e-05, 3.964453935623169e-05, 4.095025360584259e-05, 4.225596785545349e-05, 4.356168210506439e-05, 4.486739635467529e-05, 4.6173110604286194e-05, 4.7478824853897095e-05, 4.8784539103507996e-05, 5.0090253353118896e-05, 5.13959676027298e-05, 5.27016818523407e-05, 5.40073961019516e-05, 5.53131103515625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 10.0, 18.0, 21.0, 27.0, 47.0, 70.0, 92.0, 152.0, 277.0, 375.0, 662.0, 1087.0, 2081.0, 3879.0, 7337.0, 15135.0, 34104.0, 89681.0, 230091.0, 334898.0, 197561.0, 74384.0, 29148.0, 12933.0, 6500.0, 3409.0, 1883.0, 1043.0, 612.0, 340.0, 223.0, 143.0, 96.0, 73.0, 46.0, 33.0, 18.0, 16.0, 9.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.044647216796875, -0.04312896728515625, -0.0416107177734375, -0.04009246826171875, -0.03857421875, -0.03705596923828125, -0.0355377197265625, -0.03401947021484375, -0.032501220703125, -0.03098297119140625, -0.0294647216796875, -0.02794647216796875, -0.02642822265625, -0.02490997314453125, -0.0233917236328125, -0.02187347412109375, -0.020355224609375, -0.01883697509765625, -0.0173187255859375, -0.01580047607421875, -0.0142822265625, -0.01276397705078125, -0.0112457275390625, -0.00972747802734375, -0.008209228515625, -0.00669097900390625, -0.0051727294921875, -0.00365447998046875, -0.00213623046875, -0.00061798095703125, 0.0009002685546875, 0.00241851806640625, 0.003936767578125, 0.00545501708984375, 0.0069732666015625, 0.00849151611328125, 0.010009765625, 0.01152801513671875, 0.0130462646484375, 0.01456451416015625, 0.016082763671875, 0.01760101318359375, 0.0191192626953125, 0.02063751220703125, 0.02215576171875, 0.02367401123046875, 0.0251922607421875, 0.02671051025390625, 0.028228759765625, 0.02974700927734375, 0.0312652587890625, 0.03278350830078125, 0.0343017578125, 0.03582000732421875, 0.0373382568359375, 0.03885650634765625, 0.040374755859375, 0.04189300537109375, 0.0434112548828125, 0.04492950439453125, 0.04644775390625, 0.04796600341796875, 0.0494842529296875, 0.05100250244140625, 0.052520751953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 7.0, 9.0, 10.0, 6.0, 12.0, 18.0, 19.0, 16.0, 23.0, 34.0, 46.0, 47.0, 58.0, 68.0, 67.0, 68.0, 58.0, 81.0, 69.0, 48.0, 42.0, 41.0, 36.0, 31.0, 18.0, 16.0, 9.0, 11.0, 8.0, 2.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0284881591796875, -0.02749323844909668, -0.02649831771850586, -0.02550339698791504, -0.02450847625732422, -0.0235135555267334, -0.022518634796142578, -0.021523714065551758, -0.020528793334960938, -0.019533872604370117, -0.018538951873779297, -0.017544031143188477, -0.016549110412597656, -0.015554189682006836, -0.014559268951416016, -0.013564348220825195, -0.012569427490234375, -0.011574506759643555, -0.010579586029052734, -0.009584665298461914, -0.008589744567871094, -0.0075948238372802734, -0.006599903106689453, -0.005604982376098633, -0.0046100616455078125, -0.003615140914916992, -0.002620220184326172, -0.0016252994537353516, -0.0006303787231445312, 0.00036454200744628906, 0.0013594627380371094, 0.0023543834686279297, 0.00334930419921875, 0.00434422492980957, 0.005339145660400391, 0.006334066390991211, 0.007328987121582031, 0.008323907852172852, 0.009318828582763672, 0.010313749313354492, 0.011308670043945312, 0.012303590774536133, 0.013298511505126953, 0.014293432235717773, 0.015288352966308594, 0.016283273696899414, 0.017278194427490234, 0.018273115158081055, 0.019268035888671875, 0.020262956619262695, 0.021257877349853516, 0.022252798080444336, 0.023247718811035156, 0.024242639541625977, 0.025237560272216797, 0.026232481002807617, 0.027227401733398438, 0.028222322463989258, 0.029217243194580078, 0.0302121639251709, 0.03120708465576172, 0.03220200538635254, 0.03319692611694336, 0.03419184684753418, 0.035186767578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 10.0, 31.0, 37.0, 71.0, 90.0, 128.0, 155.0, 152.0, 137.0, 75.0, 48.0, 25.0, 14.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4316258728504181, -0.4184246063232422, -0.4052233397960663, -0.3920220732688904, -0.37882083654403687, -0.3656195402145386, -0.35241830348968506, -0.33921703696250916, -0.32601577043533325, -0.31281450390815735, -0.29961323738098145, -0.28641197085380554, -0.27321070432662964, -0.2600094676017761, -0.24680820107460022, -0.23360693454742432, -0.2204056680202484, -0.2072044014930725, -0.1940031349658966, -0.1808018833398819, -0.167600616812706, -0.1543993502855301, -0.14119809865951538, -0.12799683213233948, -0.11479556560516357, -0.10159429907798767, -0.08839304000139236, -0.07519178092479706, -0.061990514397621155, -0.04878924787044525, -0.035587988793849945, -0.02238672971725464, -0.009185463190078735, 0.0040157996118068695, 0.017217062413692474, 0.03041832521557808, 0.043619588017463684, 0.05682085454463959, 0.0700221136212349, 0.0832233726978302, 0.0964246392250061, 0.109625905752182, 0.12282716482877731, 0.13602842390537262, 0.14922969043254852, 0.16243095695972443, 0.17563220858573914, 0.18883347511291504, 0.20203474164009094, 0.21523600816726685, 0.22843727469444275, 0.24163852632045746, 0.25483977794647217, 0.26804107427597046, 0.281242311000824, 0.2944435775279999, 0.3076448440551758, 0.3208461105823517, 0.3340473771095276, 0.3472486436367035, 0.3604499101638794, 0.3736511468887329, 0.3868524134159088, 0.4000536799430847, 0.4132549464702606]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 5.0, 7.0, 7.0, 9.0, 8.0, 8.0, 12.0, 16.0, 19.0, 26.0, 22.0, 24.0, 28.0, 30.0, 37.0, 46.0, 28.0, 38.0, 38.0, 37.0, 35.0, 22.0, 41.0, 45.0, 23.0, 44.0, 31.0, 33.0, 34.0, 27.0, 31.0, 22.0, 25.0, 23.0, 23.0, 17.0, 7.0, 8.0, 10.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.20474779605865479, -0.19832244515419006, -0.19189709424972534, -0.18547174334526062, -0.1790463924407959, -0.17262104153633118, -0.16619569063186646, -0.15977033972740173, -0.153344988822937, -0.1469196379184723, -0.14049428701400757, -0.13406893610954285, -0.12764358520507812, -0.1212182343006134, -0.11479289084672928, -0.10836753994226456, -0.10194219648838043, -0.09551684558391571, -0.08909149467945099, -0.08266614377498627, -0.07624079287052155, -0.06981544196605682, -0.0633900985121727, -0.05696474760770798, -0.050539396703243256, -0.044114045798778534, -0.03768869489431381, -0.03126334771513939, -0.024837996810674667, -0.018412645906209946, -0.011987298727035522, -0.005561947822570801, 0.0008634030818939209, 0.007288753055036068, 0.013714103028178215, 0.020139452069997787, 0.02656480297446251, 0.03299015387892723, 0.039415501058101654, 0.045840851962566376, 0.0522662028670311, 0.05869155377149582, 0.06511690467596054, 0.07154224812984467, 0.07796759903430939, 0.08439294993877411, 0.09081830084323883, 0.09724365174770355, 0.10366900265216827, 0.110094353556633, 0.11651970446109772, 0.12294505536556244, 0.12937040627002716, 0.13579575717449188, 0.1422210931777954, 0.14864644408226013, 0.15507179498672485, 0.16149714589118958, 0.1679224967956543, 0.17434784770011902, 0.18077319860458374, 0.18719854950904846, 0.19362390041351318, 0.2000492513179779, 0.20647460222244263]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 15.0, 16.0, 26.0, 29.0, 79.0, 111.0, 211.0, 383.0, 752.0, 1493.0, 3115.0, 7764.0, 21374.0, 68605.0, 278434.0, 1339936.0, 1836931.0, 479453.0, 107693.0, 30455.0, 10188.0, 3922.0, 1698.0, 752.0, 365.0, 211.0, 94.0, 71.0, 47.0, 14.0, 10.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08074951171875, -0.07815837860107422, -0.07556724548339844, -0.07297611236572266, -0.07038497924804688, -0.0677938461303711, -0.06520271301269531, -0.06261157989501953, -0.06002044677734375, -0.05742931365966797, -0.05483818054199219, -0.052247047424316406, -0.049655914306640625, -0.047064781188964844, -0.04447364807128906, -0.04188251495361328, -0.0392913818359375, -0.03670024871826172, -0.03410911560058594, -0.031517982482910156, -0.028926849365234375, -0.026335716247558594, -0.023744583129882812, -0.02115345001220703, -0.01856231689453125, -0.01597118377685547, -0.013380050659179688, -0.010788917541503906, -0.008197784423828125, -0.005606651306152344, -0.0030155181884765625, -0.00042438507080078125, 0.002166748046875, 0.004757881164550781, 0.0073490142822265625, 0.009940147399902344, 0.012531280517578125, 0.015122413635253906, 0.017713546752929688, 0.02030467987060547, 0.02289581298828125, 0.02548694610595703, 0.028078079223632812, 0.030669212341308594, 0.033260345458984375, 0.035851478576660156, 0.03844261169433594, 0.04103374481201172, 0.0436248779296875, 0.04621601104736328, 0.04880714416503906, 0.051398277282714844, 0.053989410400390625, 0.056580543518066406, 0.05917167663574219, 0.06176280975341797, 0.06435394287109375, 0.06694507598876953, 0.06953620910644531, 0.0721273422241211, 0.07471847534179688, 0.07730960845947266, 0.07990074157714844, 0.08249187469482422, 0.0850830078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 8.0, 10.0, 9.0, 10.0, 23.0, 14.0, 14.0, 28.0, 31.0, 32.0, 33.0, 42.0, 39.0, 46.0, 61.0, 42.0, 54.0, 35.0, 53.0, 59.0, 45.0, 40.0, 29.0, 32.0, 26.0, 26.0, 24.0, 18.0, 20.0, 20.0, 12.0, 10.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.044525146484375, -0.04327392578125, -0.042022705078125, -0.040771484375, -0.039520263671875, -0.03826904296875, -0.037017822265625, -0.0357666015625, -0.034515380859375, -0.03326416015625, -0.032012939453125, -0.03076171875, -0.029510498046875, -0.02825927734375, -0.027008056640625, -0.0257568359375, -0.024505615234375, -0.02325439453125, -0.022003173828125, -0.020751953125, -0.019500732421875, -0.01824951171875, -0.016998291015625, -0.0157470703125, -0.014495849609375, -0.01324462890625, -0.011993408203125, -0.0107421875, -0.009490966796875, -0.00823974609375, -0.006988525390625, -0.0057373046875, -0.004486083984375, -0.00323486328125, -0.001983642578125, -0.000732421875, 0.000518798828125, 0.00177001953125, 0.003021240234375, 0.0042724609375, 0.005523681640625, 0.00677490234375, 0.008026123046875, 0.00927734375, 0.010528564453125, 0.01177978515625, 0.013031005859375, 0.0142822265625, 0.015533447265625, 0.01678466796875, 0.018035888671875, 0.019287109375, 0.020538330078125, 0.02178955078125, 0.023040771484375, 0.0242919921875, 0.025543212890625, 0.02679443359375, 0.028045654296875, 0.029296875, 0.030548095703125, 0.03179931640625, 0.033050537109375, 0.0343017578125, 0.035552978515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 13.0, 18.0, 21.0, 38.0, 47.0, 81.0, 113.0, 177.0, 243.0, 401.0, 703.0, 1554.0, 3410.0, 8394.0, 23308.0, 69637.0, 215409.0, 643214.0, 1414415.0, 1153033.0, 440886.0, 144087.0, 47406.0, 16237.0, 6043.0, 2529.0, 1196.0, 599.0, 359.0, 210.0, 136.0, 88.0, 69.0, 44.0, 35.0, 25.0, 19.0, 17.0, 14.0, 7.0, 9.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.08203125, -0.0794534683227539, -0.07687568664550781, -0.07429790496826172, -0.07172012329101562, -0.06914234161376953, -0.06656455993652344, -0.06398677825927734, -0.06140899658203125, -0.058831214904785156, -0.05625343322753906, -0.05367565155029297, -0.051097869873046875, -0.04852008819580078, -0.04594230651855469, -0.043364524841308594, -0.0407867431640625, -0.038208961486816406, -0.03563117980957031, -0.03305339813232422, -0.030475616455078125, -0.02789783477783203, -0.025320053100585938, -0.022742271423339844, -0.02016448974609375, -0.017586708068847656, -0.015008926391601562, -0.012431144714355469, -0.009853363037109375, -0.007275581359863281, -0.0046977996826171875, -0.0021200180053710938, 0.000457763671875, 0.0030355453491210938, 0.0056133270263671875, 0.008191108703613281, 0.010768890380859375, 0.013346672058105469, 0.015924453735351562, 0.018502235412597656, 0.02108001708984375, 0.023657798767089844, 0.026235580444335938, 0.02881336212158203, 0.031391143798828125, 0.03396892547607422, 0.03654670715332031, 0.039124488830566406, 0.0417022705078125, 0.044280052185058594, 0.04685783386230469, 0.04943561553955078, 0.052013397216796875, 0.05459117889404297, 0.05716896057128906, 0.059746742248535156, 0.06232452392578125, 0.06490230560302734, 0.06748008728027344, 0.07005786895751953, 0.07263565063476562, 0.07521343231201172, 0.07779121398925781, 0.0803689956665039, 0.08294677734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 10.0, 10.0, 11.0, 16.0, 12.0, 13.0, 13.0, 29.0, 34.0, 57.0, 84.0, 77.0, 96.0, 136.0, 163.0, 188.0, 230.0, 292.0, 325.0, 337.0, 327.0, 296.0, 225.0, 211.0, 179.0, 156.0, 119.0, 100.0, 80.0, 54.0, 53.0, 28.0, 26.0, 16.0, 20.0, 16.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0760498046875, -0.0739140510559082, -0.0717782974243164, -0.06964254379272461, -0.06750679016113281, -0.06537103652954102, -0.06323528289794922, -0.06109952926635742, -0.058963775634765625, -0.05682802200317383, -0.05469226837158203, -0.052556514739990234, -0.05042076110839844, -0.04828500747680664, -0.046149253845214844, -0.04401350021362305, -0.04187774658203125, -0.03974199295043945, -0.037606239318847656, -0.03547048568725586, -0.03333473205566406, -0.031198978424072266, -0.02906322479248047, -0.026927471160888672, -0.024791717529296875, -0.022655963897705078, -0.02052021026611328, -0.018384456634521484, -0.016248703002929688, -0.01411294937133789, -0.011977195739746094, -0.009841442108154297, -0.0077056884765625, -0.005569934844970703, -0.0034341812133789062, -0.0012984275817871094, 0.0008373260498046875, 0.0029730796813964844, 0.005108833312988281, 0.007244586944580078, 0.009380340576171875, 0.011516094207763672, 0.013651847839355469, 0.015787601470947266, 0.017923355102539062, 0.02005910873413086, 0.022194862365722656, 0.024330615997314453, 0.02646636962890625, 0.028602123260498047, 0.030737876892089844, 0.03287363052368164, 0.03500938415527344, 0.037145137786865234, 0.03928089141845703, 0.04141664505004883, 0.043552398681640625, 0.04568815231323242, 0.04782390594482422, 0.049959659576416016, 0.05209541320800781, 0.05423116683959961, 0.056366920471191406, 0.0585026741027832, 0.060638427734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 14.0, 22.0, 55.0, 69.0, 107.0, 133.0, 142.0, 142.0, 116.0, 76.0, 39.0, 34.0, 17.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5496717095375061, -0.5310545563697815, -0.5124374628067017, -0.49382030963897705, -0.47520315647125244, -0.4565860331058502, -0.437968909740448, -0.4193517565727234, -0.40073463320732117, -0.38211750984191895, -0.36350035667419434, -0.3448832333087921, -0.3262661099433899, -0.3076489567756653, -0.28903183341026306, -0.27041471004486084, -0.25179755687713623, -0.23318041861057281, -0.2145632803440094, -0.19594615697860718, -0.17732901871204376, -0.15871188044548035, -0.14009475708007812, -0.12147761881351471, -0.1028604805469513, -0.08424334228038788, -0.06562621146440506, -0.04700907692313194, -0.028391942381858826, -0.00977480411529541, 0.008842326700687408, 0.027459457516670227, 0.04607665538787842, 0.06469379365444183, 0.08331092447042465, 0.10192805528640747, 0.12054519355297089, 0.1391623318195343, 0.15777945518493652, 0.17639659345149994, 0.19501373171806335, 0.21363086998462677, 0.23224800825119019, 0.2508651316165924, 0.26948225498199463, 0.28809940814971924, 0.30671653151512146, 0.3253336548805237, 0.3439508080482483, 0.3625679314136505, 0.3811850845813751, 0.39980220794677734, 0.41841936111450195, 0.4370364844799042, 0.4556536078453064, 0.474270761013031, 0.4928878843784332, 0.5115050077438354, 0.5301221609115601, 0.5487393140792847, 0.5673564076423645, 0.5859735608100891, 0.6045907139778137, 0.6232078075408936, 0.6418249607086182]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 5.0, 7.0, 7.0, 7.0, 13.0, 6.0, 10.0, 13.0, 18.0, 11.0, 16.0, 18.0, 24.0, 18.0, 30.0, 21.0, 31.0, 29.0, 25.0, 30.0, 35.0, 34.0, 31.0, 41.0, 29.0, 29.0, 51.0, 28.0, 35.0, 33.0, 27.0, 34.0, 29.0, 23.0, 24.0, 17.0, 23.0, 21.0, 13.0, 14.0, 16.0, 18.0, 12.0, 9.0, 11.0, 3.0, 5.0, 5.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.24280864000320435, -0.23558522760868073, -0.2283618003129959, -0.2211383879184723, -0.21391497552394867, -0.20669156312942505, -0.19946813583374023, -0.1922447234392166, -0.185021311044693, -0.17779789865016937, -0.17057447135448456, -0.16335105895996094, -0.15612764656543732, -0.1489042341709137, -0.14168080687522888, -0.13445739448070526, -0.12723396718502045, -0.12001054733991623, -0.11278713494539261, -0.10556371510028839, -0.09834030270576477, -0.09111688286066055, -0.08389346301555634, -0.07667005062103271, -0.0694466307759285, -0.06222321465611458, -0.05499979853630066, -0.04777637869119644, -0.04055296257138252, -0.033329546451568604, -0.026106126606464386, -0.018882710486650467, -0.011659294366836548, -0.004435877315700054, 0.0027875397354364395, 0.010010957717895508, 0.017234373837709427, 0.024457789957523346, 0.031681209802627563, 0.03890462592244148, 0.0461280420422554, 0.05335145816206932, 0.06057487428188324, 0.06779829412698746, 0.07502171397209167, 0.0822451263666153, 0.08946854621171951, 0.09669196605682373, 0.10391537845134735, 0.11113879829645157, 0.11836221069097519, 0.1255856305360794, 0.13280904293060303, 0.14003247022628784, 0.14725588262081146, 0.15447929501533508, 0.1617027223110199, 0.16892613470554352, 0.17614956200122833, 0.18337297439575195, 0.19059638679027557, 0.1978197991847992, 0.205043226480484, 0.21226663887500763, 0.21949005126953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 14.0, 12.0, 18.0, 27.0, 46.0, 61.0, 83.0, 143.0, 205.0, 353.0, 619.0, 1051.0, 1837.0, 3140.0, 5760.0, 10514.0, 19188.0, 35001.0, 62607.0, 107882.0, 163502.0, 196616.0, 170720.0, 115306.0, 68468.0, 38153.0, 21049.0, 11543.0, 6270.0, 3542.0, 1915.0, 1132.0, 657.0, 401.0, 245.0, 150.0, 91.0, 66.0, 55.0, 33.0, 25.0, 18.0, 8.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07240009307861328, -0.07003211975097656, -0.06766414642333984, -0.06529617309570312, -0.0629281997680664, -0.06056022644042969, -0.05819225311279297, -0.05582427978515625, -0.05345630645751953, -0.05108833312988281, -0.048720359802246094, -0.046352386474609375, -0.043984413146972656, -0.04161643981933594, -0.03924846649169922, -0.0368804931640625, -0.03451251983642578, -0.03214454650878906, -0.029776573181152344, -0.027408599853515625, -0.025040626525878906, -0.022672653198242188, -0.02030467987060547, -0.01793670654296875, -0.015568733215332031, -0.013200759887695312, -0.010832786560058594, -0.008464813232421875, -0.006096839904785156, -0.0037288665771484375, -0.0013608932495117188, 0.001007080078125, 0.0033750534057617188, 0.0057430267333984375, 0.008111000061035156, 0.010478973388671875, 0.012846946716308594, 0.015214920043945312, 0.01758289337158203, 0.01995086669921875, 0.02231884002685547, 0.024686813354492188, 0.027054786682128906, 0.029422760009765625, 0.031790733337402344, 0.03415870666503906, 0.03652667999267578, 0.0388946533203125, 0.04126262664794922, 0.04363059997558594, 0.045998573303222656, 0.048366546630859375, 0.050734519958496094, 0.05310249328613281, 0.05547046661376953, 0.05783843994140625, 0.06020641326904297, 0.06257438659667969, 0.0649423599243164, 0.06731033325195312, 0.06967830657958984, 0.07204627990722656, 0.07441425323486328, 0.0767822265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 4.0, 12.0, 10.0, 13.0, 15.0, 17.0, 16.0, 10.0, 23.0, 28.0, 38.0, 37.0, 33.0, 46.0, 55.0, 54.0, 59.0, 40.0, 50.0, 55.0, 47.0, 44.0, 46.0, 45.0, 30.0, 22.0, 31.0, 17.0, 19.0, 16.0, 9.0, 9.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.046875, -0.045644283294677734, -0.04441356658935547, -0.0431828498840332, -0.04195213317871094, -0.04072141647338867, -0.039490699768066406, -0.03825998306274414, -0.037029266357421875, -0.03579854965209961, -0.034567832946777344, -0.03333711624145508, -0.03210639953613281, -0.030875682830810547, -0.02964496612548828, -0.028414249420166016, -0.02718353271484375, -0.025952816009521484, -0.02472209930419922, -0.023491382598876953, -0.022260665893554688, -0.021029949188232422, -0.019799232482910156, -0.01856851577758789, -0.017337799072265625, -0.01610708236694336, -0.014876365661621094, -0.013645648956298828, -0.012414932250976562, -0.011184215545654297, -0.009953498840332031, -0.008722782135009766, -0.0074920654296875, -0.006261348724365234, -0.005030632019042969, -0.003799915313720703, -0.0025691986083984375, -0.0013384819030761719, -0.00010776519775390625, 0.0011229515075683594, 0.002353668212890625, 0.0035843849182128906, 0.004815101623535156, 0.006045818328857422, 0.0072765350341796875, 0.008507251739501953, 0.009737968444824219, 0.010968685150146484, 0.01219940185546875, 0.013430118560791016, 0.014660835266113281, 0.015891551971435547, 0.017122268676757812, 0.018352985382080078, 0.019583702087402344, 0.02081441879272461, 0.022045135498046875, 0.02327585220336914, 0.024506568908691406, 0.025737285614013672, 0.026968002319335938, 0.028198719024658203, 0.02942943572998047, 0.030660152435302734, 0.031890869140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 11.0, 6.0, 8.0, 10.0, 21.0, 28.0, 47.0, 55.0, 70.0, 132.0, 146.0, 213.0, 399.0, 593.0, 1002.0, 1817.0, 3277.0, 6537.0, 12724.0, 24356.0, 46703.0, 87353.0, 153298.0, 217110.0, 202733.0, 132638.0, 74276.0, 39328.0, 20592.0, 10528.0, 5423.0, 3000.0, 1609.0, 925.0, 570.0, 335.0, 227.0, 130.0, 96.0, 62.0, 43.0, 43.0, 21.0, 16.0, 13.0, 7.0, 4.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.099853515625, -0.09681415557861328, -0.09377479553222656, -0.09073543548583984, -0.08769607543945312, -0.0846567153930664, -0.08161735534667969, -0.07857799530029297, -0.07553863525390625, -0.07249927520751953, -0.06945991516113281, -0.0664205551147461, -0.06338119506835938, -0.060341835021972656, -0.05730247497558594, -0.05426311492919922, -0.0512237548828125, -0.04818439483642578, -0.04514503479003906, -0.042105674743652344, -0.039066314697265625, -0.036026954650878906, -0.03298759460449219, -0.02994823455810547, -0.02690887451171875, -0.02386951446533203, -0.020830154418945312, -0.017790794372558594, -0.014751434326171875, -0.011712074279785156, -0.008672714233398438, -0.005633354187011719, -0.002593994140625, 0.00044536590576171875, 0.0034847259521484375, 0.006524085998535156, 0.009563446044921875, 0.012602806091308594, 0.015642166137695312, 0.01868152618408203, 0.02172088623046875, 0.02476024627685547, 0.027799606323242188, 0.030838966369628906, 0.033878326416015625, 0.036917686462402344, 0.03995704650878906, 0.04299640655517578, 0.0460357666015625, 0.04907512664794922, 0.05211448669433594, 0.055153846740722656, 0.058193206787109375, 0.061232566833496094, 0.06427192687988281, 0.06731128692626953, 0.07035064697265625, 0.07339000701904297, 0.07642936706542969, 0.0794687271118164, 0.08250808715820312, 0.08554744720458984, 0.08858680725097656, 0.09162616729736328, 0.09466552734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 12.0, 7.0, 12.0, 9.0, 14.0, 14.0, 23.0, 16.0, 17.0, 15.0, 28.0, 30.0, 35.0, 26.0, 40.0, 38.0, 33.0, 34.0, 37.0, 49.0, 35.0, 39.0, 48.0, 34.0, 35.0, 32.0, 34.0, 38.0, 24.0, 31.0, 24.0, 18.0, 18.0, 11.0, 14.0, 14.0, 10.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0], "bins": [-0.093017578125, -0.09022998809814453, -0.08744239807128906, -0.0846548080444336, -0.08186721801757812, -0.07907962799072266, -0.07629203796386719, -0.07350444793701172, -0.07071685791015625, -0.06792926788330078, -0.06514167785644531, -0.062354087829589844, -0.059566497802734375, -0.056778907775878906, -0.05399131774902344, -0.05120372772216797, -0.0484161376953125, -0.04562854766845703, -0.04284095764160156, -0.040053367614746094, -0.037265777587890625, -0.034478187561035156, -0.03169059753417969, -0.02890300750732422, -0.02611541748046875, -0.02332782745361328, -0.020540237426757812, -0.017752647399902344, -0.014965057373046875, -0.012177467346191406, -0.009389877319335938, -0.006602287292480469, -0.003814697265625, -0.0010271072387695312, 0.0017604827880859375, 0.004548072814941406, 0.007335662841796875, 0.010123252868652344, 0.012910842895507812, 0.01569843292236328, 0.01848602294921875, 0.02127361297607422, 0.024061203002929688, 0.026848793029785156, 0.029636383056640625, 0.032423973083496094, 0.03521156311035156, 0.03799915313720703, 0.0407867431640625, 0.04357433319091797, 0.04636192321777344, 0.049149513244628906, 0.051937103271484375, 0.054724693298339844, 0.05751228332519531, 0.06029987335205078, 0.06308746337890625, 0.06587505340576172, 0.06866264343261719, 0.07145023345947266, 0.07423782348632812, 0.0770254135131836, 0.07981300354003906, 0.08260059356689453, 0.08538818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 14.0, 9.0, 6.0, 14.0, 26.0, 34.0, 33.0, 61.0, 69.0, 105.0, 145.0, 193.0, 277.0, 431.0, 617.0, 1034.0, 1761.0, 3183.0, 8269.0, 182342.0, 795908.0, 42398.0, 5075.0, 2474.0, 1429.0, 861.0, 559.0, 355.0, 254.0, 166.0, 110.0, 85.0, 63.0, 49.0, 26.0, 27.0, 19.0, 13.0, 12.0, 13.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.211181640625, -0.20484161376953125, -0.1985015869140625, -0.19216156005859375, -0.185821533203125, -0.17948150634765625, -0.1731414794921875, -0.16680145263671875, -0.16046142578125, -0.15412139892578125, -0.1477813720703125, -0.14144134521484375, -0.135101318359375, -0.12876129150390625, -0.1224212646484375, -0.11608123779296875, -0.1097412109375, -0.10340118408203125, -0.0970611572265625, -0.09072113037109375, -0.084381103515625, -0.07804107666015625, -0.0717010498046875, -0.06536102294921875, -0.05902099609375, -0.05268096923828125, -0.0463409423828125, -0.04000091552734375, -0.033660888671875, -0.02732086181640625, -0.0209808349609375, -0.01464080810546875, -0.00830078125, -0.00196075439453125, 0.0043792724609375, 0.01071929931640625, 0.017059326171875, 0.02339935302734375, 0.0297393798828125, 0.03607940673828125, 0.04241943359375, 0.04875946044921875, 0.0550994873046875, 0.06143951416015625, 0.067779541015625, 0.07411956787109375, 0.0804595947265625, 0.08679962158203125, 0.0931396484375, 0.09947967529296875, 0.1058197021484375, 0.11215972900390625, 0.118499755859375, 0.12483978271484375, 0.1311798095703125, 0.13751983642578125, 0.14385986328125, 0.15019989013671875, 0.1565399169921875, 0.16287994384765625, 0.169219970703125, 0.17555999755859375, 0.1819000244140625, 0.18824005126953125, 0.194580078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 23.0, 128.0, 445.0, 320.0, 56.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00013036932796239853, -0.00012650899589061737, -0.0001226486638188362, -0.00011878833174705505, -0.0001149279996752739, -0.00011106766760349274, -0.00010720733553171158, -0.00010334700345993042, -9.948667138814926e-05, -9.56263393163681e-05, -9.176600724458694e-05, -8.790567517280579e-05, -8.404534310102463e-05, -8.018501102924347e-05, -7.632467895746231e-05, -7.246434688568115e-05, -6.86040148139e-05, -6.474368274211884e-05, -6.088335067033768e-05, -5.702301859855652e-05, -5.316268652677536e-05, -4.93023544549942e-05, -4.544202238321304e-05, -4.1581690311431885e-05, -3.7721358239650726e-05, -3.386102616786957e-05, -3.000069409608841e-05, -2.614036202430725e-05, -2.2280029952526093e-05, -1.8419697880744934e-05, -1.4559365808963776e-05, -1.0699033737182617e-05, -6.838701665401459e-06, -2.9783695936203003e-06, 8.819624781608582e-07, 4.742294549942017e-06, 8.602626621723175e-06, 1.2462958693504333e-05, 1.6323290765285492e-05, 2.018362283706665e-05, 2.404395490884781e-05, 2.7904286980628967e-05, 3.1764619052410126e-05, 3.5624951124191284e-05, 3.948528319597244e-05, 4.33456152677536e-05, 4.720594733953476e-05, 5.106627941131592e-05, 5.4926611483097076e-05, 5.8786943554878235e-05, 6.26472756266594e-05, 6.650760769844055e-05, 7.036793977022171e-05, 7.422827184200287e-05, 7.808860391378403e-05, 8.194893598556519e-05, 8.580926805734634e-05, 8.96696001291275e-05, 9.352993220090866e-05, 9.739026427268982e-05, 0.00010125059634447098, 0.00010511092841625214, 0.0001089712604880333, 0.00011283159255981445]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 9.0, 11.0, 25.0, 32.0, 38.0, 58.0, 97.0, 126.0, 229.0, 364.0, 650.0, 1100.0, 2076.0, 4444.0, 9199.0, 19643.0, 41248.0, 83458.0, 148945.0, 208755.0, 209934.0, 150858.0, 85517.0, 42625.0, 20053.0, 9434.0, 4503.0, 2287.0, 1161.0, 659.0, 379.0, 218.0, 129.0, 93.0, 50.0, 45.0, 29.0, 22.0, 14.0, 15.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.033026695251464844, -0.03202629089355469, -0.03102588653564453, -0.030025482177734375, -0.02902507781982422, -0.028024673461914062, -0.027024269104003906, -0.02602386474609375, -0.025023460388183594, -0.024023056030273438, -0.02302265167236328, -0.022022247314453125, -0.02102184295654297, -0.020021438598632812, -0.019021034240722656, -0.0180206298828125, -0.017020225524902344, -0.016019821166992188, -0.015019416809082031, -0.014019012451171875, -0.013018608093261719, -0.012018203735351562, -0.011017799377441406, -0.01001739501953125, -0.009016990661621094, -0.008016586303710938, -0.007016181945800781, -0.006015777587890625, -0.005015373229980469, -0.0040149688720703125, -0.0030145645141601562, -0.00201416015625, -0.0010137557983398438, -1.33514404296875e-05, 0.0009870529174804688, 0.001987457275390625, 0.0029878616333007812, 0.0039882659912109375, 0.004988670349121094, 0.00598907470703125, 0.006989479064941406, 0.007989883422851562, 0.008990287780761719, 0.009990692138671875, 0.010991096496582031, 0.011991500854492188, 0.012991905212402344, 0.0139923095703125, 0.014992713928222656, 0.015993118286132812, 0.01699352264404297, 0.017993927001953125, 0.01899433135986328, 0.019994735717773438, 0.020995140075683594, 0.02199554443359375, 0.022995948791503906, 0.023996353149414062, 0.02499675750732422, 0.025997161865234375, 0.02699756622314453, 0.027997970581054688, 0.028998374938964844, 0.029998779296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 11.0, 9.0, 7.0, 16.0, 22.0, 22.0, 19.0, 21.0, 27.0, 34.0, 40.0, 55.0, 43.0, 54.0, 49.0, 64.0, 51.0, 47.0, 56.0, 53.0, 42.0, 45.0, 38.0, 26.0, 35.0, 24.0, 10.0, 13.0, 18.0, 13.0, 6.0, 8.0, 2.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026840686798095703, -0.026032447814941406, -0.02522420883178711, -0.024415969848632812, -0.023607730865478516, -0.02279949188232422, -0.021991252899169922, -0.021183013916015625, -0.020374774932861328, -0.01956653594970703, -0.018758296966552734, -0.017950057983398438, -0.01714181900024414, -0.016333580017089844, -0.015525341033935547, -0.01471710205078125, -0.013908863067626953, -0.013100624084472656, -0.01229238510131836, -0.011484146118164062, -0.010675907135009766, -0.009867668151855469, -0.009059429168701172, -0.008251190185546875, -0.007442951202392578, -0.006634712219238281, -0.005826473236083984, -0.0050182342529296875, -0.004209995269775391, -0.0034017562866210938, -0.002593517303466797, -0.0017852783203125, -0.0009770393371582031, -0.00016880035400390625, 0.0006394386291503906, 0.0014476776123046875, 0.0022559165954589844, 0.0030641555786132812, 0.003872394561767578, 0.004680633544921875, 0.005488872528076172, 0.006297111511230469, 0.007105350494384766, 0.007913589477539062, 0.00872182846069336, 0.009530067443847656, 0.010338306427001953, 0.01114654541015625, 0.011954784393310547, 0.012763023376464844, 0.01357126235961914, 0.014379501342773438, 0.015187740325927734, 0.01599597930908203, 0.016804218292236328, 0.017612457275390625, 0.018420696258544922, 0.01922893524169922, 0.020037174224853516, 0.020845413208007812, 0.02165365219116211, 0.022461891174316406, 0.023270130157470703, 0.024078369140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 8.0, 12.0, 10.0, 13.0, 24.0, 38.0, 45.0, 52.0, 60.0, 82.0, 82.0, 74.0, 86.0, 75.0, 68.0, 59.0, 36.0, 41.0, 30.0, 23.0, 17.0, 15.0, 8.0, 3.0, 6.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25172969698905945, -0.24300813674926758, -0.2342865765094757, -0.22556501626968384, -0.21684345602989197, -0.2081218957901001, -0.19940032064914703, -0.19067876040935516, -0.1819572001695633, -0.17323563992977142, -0.16451407968997955, -0.15579251945018768, -0.14707094430923462, -0.13834938406944275, -0.12962782382965088, -0.12090626358985901, -0.11218470335006714, -0.10346314311027527, -0.0947415828704834, -0.08602001518011093, -0.07729845494031906, -0.06857689470052719, -0.05985533073544502, -0.051133766770362854, -0.042412206530570984, -0.033690646290779114, -0.024969082325696945, -0.016247520223259926, -0.0075259581208229065, 0.0011956021189689636, 0.009917166084051132, 0.0186387300491333, 0.02736032009124756, 0.03608188033103943, 0.0448034442961216, 0.053525008261203766, 0.062246568500995636, 0.0709681287407875, 0.07968969643115997, 0.08841125667095184, 0.09713281691074371, 0.10585437715053558, 0.11457593739032745, 0.12329750508069992, 0.1320190727710724, 0.14074063301086426, 0.14946219325065613, 0.158183753490448, 0.16690531373023987, 0.17562687397003174, 0.1843484342098236, 0.19306999444961548, 0.20179155468940735, 0.21051311492919922, 0.21923469007015228, 0.22795625030994415, 0.23667781054973602, 0.2453993707895279, 0.25412094593048096, 0.2628425061702728, 0.2715640664100647, 0.28028562664985657, 0.28900718688964844, 0.2977287471294403, 0.3064503073692322]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 6.0, 8.0, 17.0, 16.0, 34.0, 28.0, 31.0, 37.0, 45.0, 46.0, 51.0, 58.0, 44.0, 53.0, 60.0, 59.0, 48.0, 46.0, 40.0, 46.0, 31.0, 39.0, 22.0, 17.0, 19.0, 23.0, 12.0, 16.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.43676120042800903, -0.4260993003845215, -0.41543740034103394, -0.4047755002975464, -0.39411357045173645, -0.3834516704082489, -0.37278977036476135, -0.3621278703212738, -0.35146597027778625, -0.3408040702342987, -0.33014217019081116, -0.3194802403450012, -0.30881834030151367, -0.2981564402580261, -0.2874945402145386, -0.276832640171051, -0.2661707401275635, -0.2555088400840759, -0.24484692513942719, -0.23418502509593964, -0.2235231250524521, -0.21286121010780334, -0.2021993100643158, -0.19153741002082825, -0.1808754801750183, -0.17021358013153076, -0.15955166518688202, -0.14888976514339447, -0.13822786509990692, -0.12756595015525818, -0.11690405011177063, -0.10624215006828308, -0.09558025002479553, -0.08491834253072739, -0.07425644248723984, -0.06359453499317169, -0.052932631224393845, -0.042270727455616, -0.03160881996154785, -0.020946919918060303, -0.010285012423992157, 0.0003768922761082649, 0.011038796976208687, 0.021700702607631683, 0.03236260637640953, 0.04302451014518738, 0.053686417639255524, 0.06434831768274307, 0.07501022517681122, 0.08567213267087936, 0.09633403271436691, 0.10699594020843506, 0.11765784025192261, 0.12831974029541016, 0.1389816552400589, 0.14964355528354645, 0.1603054702281952, 0.17096737027168274, 0.18162928521633148, 0.19229118525981903, 0.20295308530330658, 0.21361500024795532, 0.22427690029144287, 0.23493880033493042, 0.24560070037841797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 7.0, 8.0, 15.0, 16.0, 23.0, 29.0, 48.0, 55.0, 108.0, 185.0, 374.0, 843.0, 1986.0, 6021.0, 22634.0, 114769.0, 1026546.0, 2518813.0, 423278.0, 59209.0, 13124.0, 3712.0, 1254.0, 550.0, 243.0, 125.0, 81.0, 60.0, 36.0, 25.0, 16.0, 15.0, 14.0, 11.0, 5.0, 10.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.11057186126708984, -0.10725212097167969, -0.10393238067626953, -0.10061264038085938, -0.09729290008544922, -0.09397315979003906, -0.0906534194946289, -0.08733367919921875, -0.0840139389038086, -0.08069419860839844, -0.07737445831298828, -0.07405471801757812, -0.07073497772216797, -0.06741523742675781, -0.06409549713134766, -0.0607757568359375, -0.057456016540527344, -0.05413627624511719, -0.05081653594970703, -0.047496795654296875, -0.04417705535888672, -0.04085731506347656, -0.037537574768066406, -0.03421783447265625, -0.030898094177246094, -0.027578353881835938, -0.02425861358642578, -0.020938873291015625, -0.01761913299560547, -0.014299392700195312, -0.010979652404785156, -0.007659912109375, -0.004340171813964844, -0.0010204315185546875, 0.0022993087768554688, 0.005619049072265625, 0.008938789367675781, 0.012258529663085938, 0.015578269958496094, 0.01889801025390625, 0.022217750549316406, 0.025537490844726562, 0.02885723114013672, 0.032176971435546875, 0.03549671173095703, 0.03881645202636719, 0.042136192321777344, 0.0454559326171875, 0.048775672912597656, 0.05209541320800781, 0.05541515350341797, 0.058734893798828125, 0.06205463409423828, 0.06537437438964844, 0.0686941146850586, 0.07201385498046875, 0.0753335952758789, 0.07865333557128906, 0.08197307586669922, 0.08529281616210938, 0.08861255645751953, 0.09193229675292969, 0.09525203704833984, 0.09857177734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 1.0, 5.0, 6.0, 6.0, 10.0, 6.0, 15.0, 19.0, 15.0, 28.0, 22.0, 24.0, 34.0, 35.0, 40.0, 53.0, 47.0, 46.0, 52.0, 45.0, 52.0, 56.0, 42.0, 42.0, 49.0, 45.0, 30.0, 30.0, 26.0, 17.0, 20.0, 16.0, 18.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.045493125915527344, -0.04417228698730469, -0.04285144805908203, -0.041530609130859375, -0.04020977020263672, -0.03888893127441406, -0.037568092346191406, -0.03624725341796875, -0.034926414489746094, -0.03360557556152344, -0.03228473663330078, -0.030963897705078125, -0.02964305877685547, -0.028322219848632812, -0.027001380920410156, -0.0256805419921875, -0.024359703063964844, -0.023038864135742188, -0.02171802520751953, -0.020397186279296875, -0.01907634735107422, -0.017755508422851562, -0.016434669494628906, -0.01511383056640625, -0.013792991638183594, -0.012472152709960938, -0.011151313781738281, -0.009830474853515625, -0.008509635925292969, -0.0071887969970703125, -0.005867958068847656, -0.004547119140625, -0.0032262802124023438, -0.0019054412841796875, -0.0005846023559570312, 0.000736236572265625, 0.0020570755004882812, 0.0033779144287109375, 0.004698753356933594, 0.00601959228515625, 0.007340431213378906, 0.008661270141601562, 0.009982109069824219, 0.011302947998046875, 0.012623786926269531, 0.013944625854492188, 0.015265464782714844, 0.0165863037109375, 0.017907142639160156, 0.019227981567382812, 0.02054882049560547, 0.021869659423828125, 0.02319049835205078, 0.024511337280273438, 0.025832176208496094, 0.02715301513671875, 0.028473854064941406, 0.029794692993164062, 0.03111553192138672, 0.032436370849609375, 0.03375720977783203, 0.03507804870605469, 0.036398887634277344, 0.0377197265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 14.0, 17.0, 44.0, 52.0, 106.0, 175.0, 329.0, 742.0, 2094.0, 7148.0, 31566.0, 160958.0, 894114.0, 2233615.0, 702367.0, 126765.0, 25190.0, 5865.0, 1771.0, 673.0, 294.0, 155.0, 79.0, 48.0, 30.0, 19.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1368408203125, -0.13327980041503906, -0.12971878051757812, -0.1261577606201172, -0.12259674072265625, -0.11903572082519531, -0.11547470092773438, -0.11191368103027344, -0.1083526611328125, -0.10479164123535156, -0.10123062133789062, -0.09766960144042969, -0.09410858154296875, -0.09054756164550781, -0.08698654174804688, -0.08342552185058594, -0.079864501953125, -0.07630348205566406, -0.07274246215820312, -0.06918144226074219, -0.06562042236328125, -0.06205940246582031, -0.058498382568359375, -0.05493736267089844, -0.0513763427734375, -0.04781532287597656, -0.044254302978515625, -0.04069328308105469, -0.03713226318359375, -0.03357124328613281, -0.030010223388671875, -0.026449203491210938, -0.02288818359375, -0.019327163696289062, -0.015766143798828125, -0.012205123901367188, -0.00864410400390625, -0.0050830841064453125, -0.001522064208984375, 0.0020389556884765625, 0.0055999755859375, 0.009160995483398438, 0.012722015380859375, 0.016283035278320312, 0.01984405517578125, 0.023405075073242188, 0.026966094970703125, 0.030527114868164062, 0.034088134765625, 0.03764915466308594, 0.041210174560546875, 0.04477119445800781, 0.04833221435546875, 0.05189323425292969, 0.055454254150390625, 0.05901527404785156, 0.0625762939453125, 0.06613731384277344, 0.06969833374023438, 0.07325935363769531, 0.07682037353515625, 0.08038139343261719, 0.08394241333007812, 0.08750343322753906, 0.091064453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 1.0, 6.0, 5.0, 17.0, 17.0, 27.0, 34.0, 50.0, 62.0, 73.0, 114.0, 179.0, 223.0, 295.0, 360.0, 476.0, 497.0, 411.0, 335.0, 220.0, 186.0, 121.0, 80.0, 75.0, 53.0, 39.0, 42.0, 28.0, 16.0, 12.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.1009521484375, -0.09832763671875, -0.095703125, -0.09307861328125, -0.0904541015625, -0.08782958984375, -0.085205078125, -0.08258056640625, -0.0799560546875, -0.07733154296875, -0.07470703125, -0.07208251953125, -0.0694580078125, -0.06683349609375, -0.064208984375, -0.06158447265625, -0.0589599609375, -0.05633544921875, -0.0537109375, -0.05108642578125, -0.0484619140625, -0.04583740234375, -0.043212890625, -0.04058837890625, -0.0379638671875, -0.03533935546875, -0.03271484375, -0.03009033203125, -0.0274658203125, -0.02484130859375, -0.022216796875, -0.01959228515625, -0.0169677734375, -0.01434326171875, -0.01171875, -0.00909423828125, -0.0064697265625, -0.00384521484375, -0.001220703125, 0.00140380859375, 0.0040283203125, 0.00665283203125, 0.00927734375, 0.01190185546875, 0.0145263671875, 0.01715087890625, 0.019775390625, 0.02239990234375, 0.0250244140625, 0.02764892578125, 0.0302734375, 0.03289794921875, 0.0355224609375, 0.03814697265625, 0.040771484375, 0.04339599609375, 0.0460205078125, 0.04864501953125, 0.05126953125, 0.05389404296875, 0.0565185546875, 0.05914306640625, 0.061767578125, 0.06439208984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 14.0, 20.0, 44.0, 68.0, 78.0, 115.0, 111.0, 105.0, 115.0, 93.0, 67.0, 50.0, 45.0, 27.0, 18.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31187447905540466, -0.2980983853340149, -0.2843222916126251, -0.27054619789123535, -0.25677013397216797, -0.2429940402507782, -0.22921794652938843, -0.21544185280799866, -0.20166577398777008, -0.1878896802663803, -0.17411360144615173, -0.16033750772476196, -0.1465614140033722, -0.13278533518314362, -0.11900924146175385, -0.10523315519094467, -0.0914570689201355, -0.07768098264932632, -0.06390489637851715, -0.05012880265712738, -0.03635271638631821, -0.022576630115509033, -0.008800536394119263, 0.004975549876689911, 0.018751636147499084, 0.03252772241830826, 0.04630381241440773, 0.0600799024105072, 0.07385598868131638, 0.08763207495212555, 0.10140816867351532, 0.1151842549443245, 0.12896037101745605, 0.14273646473884583, 0.1565125435590744, 0.17028863728046417, 0.18406471610069275, 0.19784080982208252, 0.2116169035434723, 0.22539299726486206, 0.23916907608509064, 0.2529451549053192, 0.266721248626709, 0.28049734234809875, 0.2942734360694885, 0.3080494999885559, 0.32182562351226807, 0.33560168743133545, 0.3493777811527252, 0.363153874874115, 0.37692996859550476, 0.39070606231689453, 0.4044821262359619, 0.4182582199573517, 0.43203431367874146, 0.4458104074001312, 0.459586501121521, 0.47336259484291077, 0.48713868856430054, 0.5009147524833679, 0.5146908760070801, 0.5284669399261475, 0.5422430038452148, 0.556019127368927, 0.5697951912879944]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 10.0, 7.0, 9.0, 11.0, 12.0, 16.0, 21.0, 19.0, 26.0, 26.0, 17.0, 29.0, 39.0, 33.0, 31.0, 42.0, 35.0, 33.0, 40.0, 44.0, 34.0, 39.0, 44.0, 41.0, 39.0, 32.0, 34.0, 42.0, 27.0, 32.0, 19.0, 17.0, 23.0, 13.0, 16.0, 15.0, 14.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24989545345306396, -0.24242407083511353, -0.23495268821716309, -0.22748130559921265, -0.2200099378824234, -0.21253855526447296, -0.20506717264652252, -0.19759579002857208, -0.19012442231178284, -0.1826530396938324, -0.17518165707588196, -0.16771027445793152, -0.16023890674114227, -0.15276752412319183, -0.1452961415052414, -0.13782475888729095, -0.13035337626934052, -0.12288199365139008, -0.11541061848402023, -0.1079392358660698, -0.10046786069869995, -0.09299647808074951, -0.08552509546279907, -0.07805371284484863, -0.07058233767747879, -0.06311095505952835, -0.05563957989215851, -0.04816819727420807, -0.04069681838154793, -0.03322543948888779, -0.025754056870937347, -0.018282677978277206, -0.010811299085617065, -0.00333991926163435, 0.004131460562348366, 0.011602841317653656, 0.019074220210313797, 0.026545599102973938, 0.03401698172092438, 0.04148836061358452, 0.04895973950624466, 0.0564311183989048, 0.06390249729156494, 0.07137387990951538, 0.07884526252746582, 0.08631663769483566, 0.0937880203127861, 0.10125939548015594, 0.10873077809810638, 0.11620216071605682, 0.12367353588342667, 0.1311449110507965, 0.13861629366874695, 0.1460876762866974, 0.15355905890464783, 0.16103044152259827, 0.1685018241405487, 0.17597320675849915, 0.18344458937644958, 0.19091597199440002, 0.19838733971118927, 0.2058587223291397, 0.21333010494709015, 0.2208014875650406, 0.22827285528182983]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 10.0, 22.0, 35.0, 45.0, 68.0, 91.0, 154.0, 253.0, 438.0, 732.0, 1278.0, 2189.0, 3805.0, 6846.0, 12401.0, 22156.0, 41314.0, 77375.0, 133179.0, 193843.0, 203862.0, 150526.0, 89909.0, 49080.0, 25884.0, 14427.0, 8021.0, 4464.0, 2567.0, 1417.0, 837.0, 515.0, 290.0, 174.0, 114.0, 73.0, 46.0, 33.0, 26.0, 11.0, 18.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08837890625, -0.08571147918701172, -0.08304405212402344, -0.08037662506103516, -0.07770919799804688, -0.0750417709350586, -0.07237434387207031, -0.06970691680908203, -0.06703948974609375, -0.06437206268310547, -0.06170463562011719, -0.059037208557128906, -0.056369781494140625, -0.053702354431152344, -0.05103492736816406, -0.04836750030517578, -0.0457000732421875, -0.04303264617919922, -0.04036521911621094, -0.037697792053222656, -0.035030364990234375, -0.032362937927246094, -0.029695510864257812, -0.02702808380126953, -0.02436065673828125, -0.02169322967529297, -0.019025802612304688, -0.016358375549316406, -0.013690948486328125, -0.011023521423339844, -0.008356094360351562, -0.005688667297363281, -0.003021240234375, -0.00035381317138671875, 0.0023136138916015625, 0.004981040954589844, 0.007648468017578125, 0.010315895080566406, 0.012983322143554688, 0.01565074920654297, 0.01831817626953125, 0.02098560333251953, 0.023653030395507812, 0.026320457458496094, 0.028987884521484375, 0.031655311584472656, 0.03432273864746094, 0.03699016571044922, 0.0396575927734375, 0.04232501983642578, 0.04499244689941406, 0.047659873962402344, 0.050327301025390625, 0.052994728088378906, 0.05566215515136719, 0.05832958221435547, 0.06099700927734375, 0.06366443634033203, 0.06633186340332031, 0.0689992904663086, 0.07166671752929688, 0.07433414459228516, 0.07700157165527344, 0.07966899871826172, 0.08233642578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 4.0, 4.0, 7.0, 13.0, 14.0, 18.0, 20.0, 21.0, 34.0, 26.0, 24.0, 37.0, 56.0, 48.0, 36.0, 70.0, 51.0, 37.0, 58.0, 52.0, 49.0, 37.0, 37.0, 38.0, 29.0, 28.0, 31.0, 15.0, 20.0, 14.0, 11.0, 10.0, 13.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043731689453125, -0.04251241683959961, -0.04129314422607422, -0.04007387161254883, -0.03885459899902344, -0.03763532638549805, -0.036416053771972656, -0.035196781158447266, -0.033977508544921875, -0.032758235931396484, -0.031538963317871094, -0.030319690704345703, -0.029100418090820312, -0.027881145477294922, -0.02666187286376953, -0.02544260025024414, -0.02422332763671875, -0.02300405502319336, -0.02178478240966797, -0.020565509796142578, -0.019346237182617188, -0.018126964569091797, -0.016907691955566406, -0.015688419342041016, -0.014469146728515625, -0.013249874114990234, -0.012030601501464844, -0.010811328887939453, -0.009592056274414062, -0.008372783660888672, -0.007153511047363281, -0.005934238433837891, -0.0047149658203125, -0.0034956932067871094, -0.0022764205932617188, -0.0010571479797363281, 0.0001621246337890625, 0.0013813972473144531, 0.0026006698608398438, 0.0038199424743652344, 0.005039215087890625, 0.006258487701416016, 0.007477760314941406, 0.008697032928466797, 0.009916305541992188, 0.011135578155517578, 0.012354850769042969, 0.01357412338256836, 0.01479339599609375, 0.01601266860961914, 0.01723194122314453, 0.018451213836669922, 0.019670486450195312, 0.020889759063720703, 0.022109031677246094, 0.023328304290771484, 0.024547576904296875, 0.025766849517822266, 0.026986122131347656, 0.028205394744873047, 0.029424667358398438, 0.030643939971923828, 0.03186321258544922, 0.03308248519897461, 0.0343017578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 14.0, 11.0, 15.0, 25.0, 35.0, 42.0, 59.0, 92.0, 118.0, 180.0, 236.0, 384.0, 570.0, 918.0, 1758.0, 3578.0, 8263.0, 19130.0, 45782.0, 101179.0, 195412.0, 268607.0, 205057.0, 109275.0, 49423.0, 20917.0, 8786.0, 3966.0, 1856.0, 1009.0, 576.0, 395.0, 242.0, 184.0, 129.0, 110.0, 46.0, 59.0, 32.0, 23.0, 14.0, 12.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10272216796875, -0.09935951232910156, -0.09599685668945312, -0.09263420104980469, -0.08927154541015625, -0.08590888977050781, -0.08254623413085938, -0.07918357849121094, -0.0758209228515625, -0.07245826721191406, -0.06909561157226562, -0.06573295593261719, -0.06237030029296875, -0.05900764465332031, -0.055644989013671875, -0.05228233337402344, -0.048919677734375, -0.04555702209472656, -0.042194366455078125, -0.03883171081542969, -0.03546905517578125, -0.03210639953613281, -0.028743743896484375, -0.025381088256835938, -0.0220184326171875, -0.018655776977539062, -0.015293121337890625, -0.011930465698242188, -0.00856781005859375, -0.0052051544189453125, -0.001842498779296875, 0.0015201568603515625, 0.0048828125, 0.008245468139648438, 0.011608123779296875, 0.014970779418945312, 0.01833343505859375, 0.021696090698242188, 0.025058746337890625, 0.028421401977539062, 0.0317840576171875, 0.03514671325683594, 0.038509368896484375, 0.04187202453613281, 0.04523468017578125, 0.04859733581542969, 0.051959991455078125, 0.05532264709472656, 0.058685302734375, 0.06204795837402344, 0.06541061401367188, 0.06877326965332031, 0.07213592529296875, 0.07549858093261719, 0.07886123657226562, 0.08222389221191406, 0.0855865478515625, 0.08894920349121094, 0.09231185913085938, 0.09567451477050781, 0.09903717041015625, 0.10239982604980469, 0.10576248168945312, 0.10912513732910156, 0.11248779296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 13.0, 13.0, 6.0, 12.0, 7.0, 15.0, 15.0, 24.0, 15.0, 23.0, 25.0, 34.0, 33.0, 32.0, 39.0, 37.0, 38.0, 35.0, 37.0, 37.0, 35.0, 50.0, 38.0, 44.0, 38.0, 26.0, 33.0, 31.0, 24.0, 29.0, 26.0, 13.0, 9.0, 20.0, 12.0, 14.0, 13.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.09173583984375, -0.08884143829345703, -0.08594703674316406, -0.0830526351928711, -0.08015823364257812, -0.07726383209228516, -0.07436943054199219, -0.07147502899169922, -0.06858062744140625, -0.06568622589111328, -0.06279182434082031, -0.059897422790527344, -0.057003021240234375, -0.054108619689941406, -0.05121421813964844, -0.04831981658935547, -0.0454254150390625, -0.04253101348876953, -0.03963661193847656, -0.036742210388183594, -0.033847808837890625, -0.030953407287597656, -0.028059005737304688, -0.02516460418701172, -0.02227020263671875, -0.01937580108642578, -0.016481399536132812, -0.013586997985839844, -0.010692596435546875, -0.007798194885253906, -0.0049037933349609375, -0.0020093917846679688, 0.000885009765625, 0.0037794113159179688, 0.0066738128662109375, 0.009568214416503906, 0.012462615966796875, 0.015357017517089844, 0.018251419067382812, 0.02114582061767578, 0.02404022216796875, 0.02693462371826172, 0.029829025268554688, 0.032723426818847656, 0.035617828369140625, 0.038512229919433594, 0.04140663146972656, 0.04430103302001953, 0.0471954345703125, 0.05008983612060547, 0.05298423767089844, 0.055878639221191406, 0.058773040771484375, 0.061667442321777344, 0.06456184387207031, 0.06745624542236328, 0.07035064697265625, 0.07324504852294922, 0.07613945007324219, 0.07903385162353516, 0.08192825317382812, 0.0848226547241211, 0.08771705627441406, 0.09061145782470703, 0.093505859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 12.0, 15.0, 24.0, 45.0, 68.0, 127.0, 228.0, 394.0, 738.0, 1460.0, 3302.0, 8187.0, 22199.0, 63755.0, 174713.0, 327843.0, 268751.0, 113107.0, 39102.0, 14210.0, 5545.0, 2378.0, 1070.0, 569.0, 279.0, 150.0, 100.0, 64.0, 36.0, 26.0, 18.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04669189453125, -0.04538679122924805, -0.044081687927246094, -0.04277658462524414, -0.04147148132324219, -0.040166378021240234, -0.03886127471923828, -0.03755617141723633, -0.036251068115234375, -0.03494596481323242, -0.03364086151123047, -0.032335758209228516, -0.031030654907226562, -0.02972555160522461, -0.028420448303222656, -0.027115345001220703, -0.02581024169921875, -0.024505138397216797, -0.023200035095214844, -0.02189493179321289, -0.020589828491210938, -0.019284725189208984, -0.01797962188720703, -0.016674518585205078, -0.015369415283203125, -0.014064311981201172, -0.012759208679199219, -0.011454105377197266, -0.010149002075195312, -0.00884389877319336, -0.007538795471191406, -0.006233692169189453, -0.0049285888671875, -0.003623485565185547, -0.0023183822631835938, -0.0010132789611816406, 0.0002918243408203125, 0.0015969276428222656, 0.0029020309448242188, 0.004207134246826172, 0.005512237548828125, 0.006817340850830078, 0.008122444152832031, 0.009427547454833984, 0.010732650756835938, 0.01203775405883789, 0.013342857360839844, 0.014647960662841797, 0.01595306396484375, 0.017258167266845703, 0.018563270568847656, 0.01986837387084961, 0.021173477172851562, 0.022478580474853516, 0.02378368377685547, 0.025088787078857422, 0.026393890380859375, 0.027698993682861328, 0.02900409698486328, 0.030309200286865234, 0.03161430358886719, 0.03291940689086914, 0.034224510192871094, 0.03552961349487305, 0.036834716796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 3.0, 5.0, 8.0, 7.0, 13.0, 13.0, 13.0, 12.0, 23.0, 20.0, 30.0, 24.0, 34.0, 41.0, 43.0, 60.0, 44.0, 62.0, 61.0, 65.0, 48.0, 40.0, 60.0, 36.0, 45.0, 31.0, 27.0, 21.0, 16.0, 17.0, 16.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1411495506763458e-05, -1.1021271347999573e-05, -1.0631047189235687e-05, -1.0240823030471802e-05, -9.850598871707916e-06, -9.46037471294403e-06, -9.070150554180145e-06, -8.67992639541626e-06, -8.289702236652374e-06, -7.899478077888489e-06, -7.509253919124603e-06, -7.119029760360718e-06, -6.728805601596832e-06, -6.338581442832947e-06, -5.948357284069061e-06, -5.558133125305176e-06, -5.16790896654129e-06, -4.777684807777405e-06, -4.387460649013519e-06, -3.997236490249634e-06, -3.6070123314857483e-06, -3.216788172721863e-06, -2.8265640139579773e-06, -2.436339855194092e-06, -2.0461156964302063e-06, -1.6558915376663208e-06, -1.2656673789024353e-06, -8.754432201385498e-07, -4.852190613746643e-07, -9.499490261077881e-08, 2.952292561531067e-07, 6.854534149169922e-07, 1.0756775736808777e-06, 1.4659017324447632e-06, 1.8561258912086487e-06, 2.246350049972534e-06, 2.6365742087364197e-06, 3.026798367500305e-06, 3.4170225262641907e-06, 3.807246685028076e-06, 4.197470843791962e-06, 4.587695002555847e-06, 4.977919161319733e-06, 5.368143320083618e-06, 5.758367478847504e-06, 6.148591637611389e-06, 6.538815796375275e-06, 6.92903995513916e-06, 7.319264113903046e-06, 7.709488272666931e-06, 8.099712431430817e-06, 8.489936590194702e-06, 8.880160748958588e-06, 9.270384907722473e-06, 9.660609066486359e-06, 1.0050833225250244e-05, 1.044105738401413e-05, 1.0831281542778015e-05, 1.12215057015419e-05, 1.1611729860305786e-05, 1.2001954019069672e-05, 1.2392178177833557e-05, 1.2782402336597443e-05, 1.3172626495361328e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 7.0, 9.0, 18.0, 21.0, 33.0, 58.0, 58.0, 79.0, 126.0, 231.0, 372.0, 769.0, 1359.0, 2972.0, 7128.0, 17455.0, 47734.0, 132935.0, 293345.0, 308245.0, 148234.0, 53425.0, 19585.0, 7728.0, 3262.0, 1461.0, 755.0, 408.0, 266.0, 165.0, 102.0, 59.0, 53.0, 26.0, 17.0, 20.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.04840087890625, -0.04716157913208008, -0.045922279357910156, -0.044682979583740234, -0.04344367980957031, -0.04220438003540039, -0.04096508026123047, -0.03972578048706055, -0.038486480712890625, -0.0372471809387207, -0.03600788116455078, -0.03476858139038086, -0.03352928161621094, -0.032289981842041016, -0.031050682067871094, -0.029811382293701172, -0.02857208251953125, -0.027332782745361328, -0.026093482971191406, -0.024854183197021484, -0.023614883422851562, -0.02237558364868164, -0.02113628387451172, -0.019896984100341797, -0.018657684326171875, -0.017418384552001953, -0.01617908477783203, -0.01493978500366211, -0.013700485229492188, -0.012461185455322266, -0.011221885681152344, -0.009982585906982422, -0.0087432861328125, -0.007503986358642578, -0.006264686584472656, -0.005025386810302734, -0.0037860870361328125, -0.0025467872619628906, -0.0013074874877929688, -6.818771362304688e-05, 0.001171112060546875, 0.002410411834716797, 0.0036497116088867188, 0.004889011383056641, 0.0061283111572265625, 0.007367610931396484, 0.008606910705566406, 0.009846210479736328, 0.01108551025390625, 0.012324810028076172, 0.013564109802246094, 0.014803409576416016, 0.016042709350585938, 0.01728200912475586, 0.01852130889892578, 0.019760608673095703, 0.020999908447265625, 0.022239208221435547, 0.02347850799560547, 0.02471780776977539, 0.025957107543945312, 0.027196407318115234, 0.028435707092285156, 0.029675006866455078, 0.030914306640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 8.0, 9.0, 8.0, 12.0, 20.0, 31.0, 28.0, 27.0, 32.0, 39.0, 47.0, 47.0, 45.0, 55.0, 61.0, 58.0, 62.0, 57.0, 53.0, 40.0, 45.0, 41.0, 23.0, 19.0, 23.0, 29.0, 14.0, 8.0, 11.0, 8.0, 7.0, 2.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0205535888671875, -0.019805431365966797, -0.019057273864746094, -0.01830911636352539, -0.017560958862304688, -0.016812801361083984, -0.01606464385986328, -0.015316486358642578, -0.014568328857421875, -0.013820171356201172, -0.013072013854980469, -0.012323856353759766, -0.011575698852539062, -0.01082754135131836, -0.010079383850097656, -0.009331226348876953, -0.00858306884765625, -0.007834911346435547, -0.007086753845214844, -0.006338596343994141, -0.0055904388427734375, -0.004842281341552734, -0.004094123840332031, -0.003345966339111328, -0.002597808837890625, -0.0018496513366699219, -0.0011014938354492188, -0.0003533363342285156, 0.0003948211669921875, 0.0011429786682128906, 0.0018911361694335938, 0.002639293670654297, 0.003387451171875, 0.004135608673095703, 0.004883766174316406, 0.005631923675537109, 0.0063800811767578125, 0.007128238677978516, 0.007876396179199219, 0.008624553680419922, 0.009372711181640625, 0.010120868682861328, 0.010869026184082031, 0.011617183685302734, 0.012365341186523438, 0.01311349868774414, 0.013861656188964844, 0.014609813690185547, 0.01535797119140625, 0.016106128692626953, 0.016854286193847656, 0.01760244369506836, 0.018350601196289062, 0.019098758697509766, 0.01984691619873047, 0.020595073699951172, 0.021343231201171875, 0.022091388702392578, 0.02283954620361328, 0.023587703704833984, 0.024335861206054688, 0.02508401870727539, 0.025832176208496094, 0.026580333709716797, 0.0273284912109375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 9.0, 24.0, 50.0, 101.0, 157.0, 196.0, 185.0, 128.0, 75.0, 40.0, 17.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653367161750793, -0.8430077433586121, -0.8206787109375, -0.7983497381210327, -0.7760207653045654, -0.7536917924880981, -0.7313628196716309, -0.7090337872505188, -0.6867048144340515, -0.6643758416175842, -0.6420468091964722, -0.6197178363800049, -0.5973888635635376, -0.5750598907470703, -0.552730917930603, -0.530401885509491, -0.5080729126930237, -0.4857439398765564, -0.4634149372577667, -0.44108593463897705, -0.41875696182250977, -0.3964279890060425, -0.3740989863872528, -0.35176998376846313, -0.32944101095199585, -0.30711203813552856, -0.2847830355167389, -0.2624540328979492, -0.24012506008148193, -0.21779607236385345, -0.19546708464622498, -0.1731380969285965, -0.1508091688156128, -0.12848018109798431, -0.10615119338035583, -0.08382220566272736, -0.06149321794509888, -0.0391642302274704, -0.01683524250984192, 0.00549374520778656, 0.02782273292541504, 0.05015172064304352, 0.072480708360672, 0.09480969607830048, 0.11713868379592896, 0.13946767151355743, 0.1617966592311859, 0.1841256469488144, 0.20645463466644287, 0.22878362238407135, 0.25111261010169983, 0.2734416127204895, 0.2957705855369568, 0.3180995583534241, 0.34042856097221375, 0.3627575635910034, 0.3850865364074707, 0.407415509223938, 0.42974451184272766, 0.45207351446151733, 0.4744024872779846, 0.4967314600944519, 0.519060492515564, 0.5413894653320312, 0.5637184381484985]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 9.0, 11.0, 11.0, 18.0, 16.0, 25.0, 24.0, 25.0, 23.0, 37.0, 45.0, 40.0, 33.0, 34.0, 41.0, 56.0, 46.0, 45.0, 43.0, 46.0, 41.0, 43.0, 28.0, 34.0, 24.0, 21.0, 30.0, 23.0, 16.0, 10.0, 13.0, 16.0, 20.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.33001846075057983, -0.3204707205295563, -0.3109229803085327, -0.30137524008750916, -0.2918274998664856, -0.28227975964546204, -0.2727320194244385, -0.26318424940109253, -0.25363653898239136, -0.2440887987613678, -0.23454105854034424, -0.22499331831932068, -0.21544557809829712, -0.20589783787727356, -0.1963500827550888, -0.18680234253406525, -0.1772545874118805, -0.16770684719085693, -0.15815910696983337, -0.14861136674880981, -0.13906362652778625, -0.1295158863067627, -0.11996813118457794, -0.11042039096355438, -0.10087265074253082, -0.09132491052150726, -0.0817771703004837, -0.07222942262887955, -0.06268168240785599, -0.05313394218683243, -0.04358619824051857, -0.03403845429420471, -0.024490714073181152, -0.014942971989512444, -0.005395229905843735, 0.004152512177824974, 0.013700254261493683, 0.023247994482517242, 0.0327957384288311, 0.04234348237514496, 0.05189122259616852, 0.06143896281719208, 0.07098670303821564, 0.0805344507098198, 0.09008219093084335, 0.09962993115186691, 0.10917767882347107, 0.11872541904449463, 0.1282731592655182, 0.13782089948654175, 0.1473686397075653, 0.15691637992858887, 0.16646412014961243, 0.176011860370636, 0.18555961549282074, 0.1951073557138443, 0.20465509593486786, 0.21420283615589142, 0.22375057637691498, 0.23329831659793854, 0.2428460717201233, 0.25239381194114685, 0.2619415521621704, 0.27148929238319397, 0.28103703260421753]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 11.0, 14.0, 17.0, 19.0, 35.0, 48.0, 78.0, 133.0, 150.0, 253.0, 383.0, 569.0, 994.0, 1682.0, 3007.0, 5685.0, 11397.0, 24499.0, 56268.0, 147742.0, 492049.0, 1398125.0, 1349762.0, 456210.0, 142611.0, 54724.0, 24038.0, 11148.0, 5567.0, 2942.0, 1683.0, 943.0, 515.0, 339.0, 225.0, 153.0, 84.0, 49.0, 40.0, 17.0, 14.0, 12.0, 5.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.06341552734375, -0.06170034408569336, -0.05998516082763672, -0.05826997756958008, -0.05655479431152344, -0.0548396110534668, -0.053124427795410156, -0.051409244537353516, -0.049694061279296875, -0.047978878021240234, -0.046263694763183594, -0.04454851150512695, -0.04283332824707031, -0.04111814498901367, -0.03940296173095703, -0.03768777847290039, -0.03597259521484375, -0.03425741195678711, -0.03254222869873047, -0.030827045440673828, -0.029111862182617188, -0.027396678924560547, -0.025681495666503906, -0.023966312408447266, -0.022251129150390625, -0.020535945892333984, -0.018820762634277344, -0.017105579376220703, -0.015390396118164062, -0.013675212860107422, -0.011960029602050781, -0.01024484634399414, -0.0085296630859375, -0.006814479827880859, -0.005099296569824219, -0.003384113311767578, -0.0016689300537109375, 4.6253204345703125e-05, 0.0017614364624023438, 0.0034766197204589844, 0.005191802978515625, 0.006906986236572266, 0.008622169494628906, 0.010337352752685547, 0.012052536010742188, 0.013767719268798828, 0.015482902526855469, 0.01719808578491211, 0.01891326904296875, 0.02062845230102539, 0.02234363555908203, 0.024058818817138672, 0.025774002075195312, 0.027489185333251953, 0.029204368591308594, 0.030919551849365234, 0.032634735107421875, 0.034349918365478516, 0.036065101623535156, 0.0377802848815918, 0.03949546813964844, 0.04121065139770508, 0.04292583465576172, 0.04464101791381836, 0.046356201171875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 16.0, 9.0, 15.0, 18.0, 32.0, 30.0, 36.0, 35.0, 49.0, 41.0, 57.0, 44.0, 56.0, 49.0, 58.0, 39.0, 50.0, 49.0, 45.0, 38.0, 29.0, 38.0, 29.0, 19.0, 16.0, 12.0, 10.0, 14.0, 10.0, 12.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.05072021484375, -0.049408912658691406, -0.04809761047363281, -0.04678630828857422, -0.045475006103515625, -0.04416370391845703, -0.04285240173339844, -0.041541099548339844, -0.04022979736328125, -0.038918495178222656, -0.03760719299316406, -0.03629589080810547, -0.034984588623046875, -0.03367328643798828, -0.03236198425292969, -0.031050682067871094, -0.0297393798828125, -0.028428077697753906, -0.027116775512695312, -0.02580547332763672, -0.024494171142578125, -0.02318286895751953, -0.021871566772460938, -0.020560264587402344, -0.01924896240234375, -0.017937660217285156, -0.016626358032226562, -0.015315055847167969, -0.014003753662109375, -0.012692451477050781, -0.011381149291992188, -0.010069847106933594, -0.008758544921875, -0.007447242736816406, -0.0061359405517578125, -0.004824638366699219, -0.003513336181640625, -0.0022020339965820312, -0.0008907318115234375, 0.00042057037353515625, 0.00173187255859375, 0.0030431747436523438, 0.0043544769287109375, 0.005665779113769531, 0.006977081298828125, 0.008288383483886719, 0.009599685668945312, 0.010910987854003906, 0.0122222900390625, 0.013533592224121094, 0.014844894409179688, 0.01615619659423828, 0.017467498779296875, 0.01877880096435547, 0.020090103149414062, 0.021401405334472656, 0.02271270751953125, 0.024024009704589844, 0.025335311889648438, 0.02664661407470703, 0.027957916259765625, 0.02926921844482422, 0.030580520629882812, 0.031891822814941406, 0.033203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 10.0, 10.0, 18.0, 27.0, 40.0, 52.0, 105.0, 178.0, 366.0, 776.0, 2188.0, 8325.0, 45144.0, 313791.0, 2123281.0, 1468622.0, 193623.0, 29037.0, 5702.0, 1679.0, 650.0, 266.0, 151.0, 95.0, 45.0, 35.0, 24.0, 14.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11793994903564453, -0.11399269104003906, -0.1100454330444336, -0.10609817504882812, -0.10215091705322266, -0.09820365905761719, -0.09425640106201172, -0.09030914306640625, -0.08636188507080078, -0.08241462707519531, -0.07846736907958984, -0.07452011108398438, -0.0705728530883789, -0.06662559509277344, -0.06267833709716797, -0.0587310791015625, -0.05478382110595703, -0.05083656311035156, -0.046889305114746094, -0.042942047119140625, -0.038994789123535156, -0.03504753112792969, -0.03110027313232422, -0.02715301513671875, -0.02320575714111328, -0.019258499145507812, -0.015311241149902344, -0.011363983154296875, -0.007416725158691406, -0.0034694671630859375, 0.00047779083251953125, 0.004425048828125, 0.008372306823730469, 0.012319564819335938, 0.016266822814941406, 0.020214080810546875, 0.024161338806152344, 0.028108596801757812, 0.03205585479736328, 0.03600311279296875, 0.03995037078857422, 0.04389762878417969, 0.047844886779785156, 0.051792144775390625, 0.055739402770996094, 0.05968666076660156, 0.06363391876220703, 0.0675811767578125, 0.07152843475341797, 0.07547569274902344, 0.0794229507446289, 0.08337020874023438, 0.08731746673583984, 0.09126472473144531, 0.09521198272705078, 0.09915924072265625, 0.10310649871826172, 0.10705375671386719, 0.11100101470947266, 0.11494827270507812, 0.1188955307006836, 0.12284278869628906, 0.12679004669189453, 0.1307373046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 10.0, 10.0, 8.0, 16.0, 24.0, 27.0, 38.0, 65.0, 99.0, 92.0, 153.0, 215.0, 289.0, 402.0, 495.0, 470.0, 465.0, 337.0, 238.0, 163.0, 135.0, 103.0, 57.0, 43.0, 29.0, 31.0, 15.0, 11.0, 9.0, 11.0, 8.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.0786886215209961, -0.07607841491699219, -0.07346820831298828, -0.07085800170898438, -0.06824779510498047, -0.06563758850097656, -0.06302738189697266, -0.06041717529296875, -0.057806968688964844, -0.05519676208496094, -0.05258655548095703, -0.049976348876953125, -0.04736614227294922, -0.04475593566894531, -0.042145729064941406, -0.0395355224609375, -0.036925315856933594, -0.03431510925292969, -0.03170490264892578, -0.029094696044921875, -0.02648448944091797, -0.023874282836914062, -0.021264076232910156, -0.01865386962890625, -0.016043663024902344, -0.013433456420898438, -0.010823249816894531, -0.008213043212890625, -0.005602836608886719, -0.0029926300048828125, -0.00038242340087890625, 0.002227783203125, 0.004837989807128906, 0.0074481964111328125, 0.010058403015136719, 0.012668609619140625, 0.015278816223144531, 0.017889022827148438, 0.020499229431152344, 0.02310943603515625, 0.025719642639160156, 0.028329849243164062, 0.03094005584716797, 0.033550262451171875, 0.03616046905517578, 0.03877067565917969, 0.041380882263183594, 0.0439910888671875, 0.046601295471191406, 0.04921150207519531, 0.05182170867919922, 0.054431915283203125, 0.05704212188720703, 0.05965232849121094, 0.062262535095214844, 0.06487274169921875, 0.06748294830322266, 0.07009315490722656, 0.07270336151123047, 0.07531356811523438, 0.07792377471923828, 0.08053398132324219, 0.0831441879272461, 0.08575439453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 24.0, 19.0, 44.0, 61.0, 86.0, 104.0, 99.0, 112.0, 123.0, 87.0, 83.0, 58.0, 34.0, 23.0, 20.0, 5.0, 1.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5702563524246216, -0.5564194321632385, -0.5425825119018555, -0.5287455320358276, -0.5149086117744446, -0.5010716915130615, -0.48723477125167847, -0.4733978509902954, -0.45956093072891235, -0.4457240104675293, -0.43188706040382385, -0.4180501401424408, -0.40421321988105774, -0.3903762698173523, -0.37653934955596924, -0.3627024292945862, -0.34886547923088074, -0.3350285589694977, -0.32119160890579224, -0.3073546886444092, -0.2935177683830261, -0.27968084812164307, -0.2658438980579376, -0.25200697779655457, -0.23817004263401031, -0.22433310747146606, -0.210496187210083, -0.19665925204753876, -0.1828223168849945, -0.16898539662361145, -0.1551484614610672, -0.14131152629852295, -0.1274745762348175, -0.11363764852285385, -0.0998007208108902, -0.08596378564834595, -0.0721268579363823, -0.05828993022441864, -0.04445299506187439, -0.030616067349910736, -0.016779139637947083, -0.0029422100633382797, 0.010894719511270523, 0.024731650948524475, 0.03856857866048813, 0.05240550637245178, 0.06624244153499603, 0.08007936924695969, 0.09391629695892334, 0.107753224670887, 0.12159015238285065, 0.1354270875453949, 0.14926400780677795, 0.1631009429693222, 0.17693787813186646, 0.1907747983932495, 0.20461173355579376, 0.218448668718338, 0.23228558897972107, 0.24612252414226532, 0.25995945930480957, 0.2737963795661926, 0.2876332998275757, 0.30147024989128113, 0.3153071701526642]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 17.0, 17.0, 15.0, 19.0, 34.0, 29.0, 26.0, 45.0, 34.0, 33.0, 39.0, 38.0, 43.0, 53.0, 38.0, 41.0, 42.0, 41.0, 41.0, 38.0, 28.0, 28.0, 30.0, 29.0, 21.0, 27.0, 20.0, 19.0, 22.0, 10.0, 11.0, 10.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.27998483180999756, -0.2722688615322113, -0.26455286145210266, -0.2568368911743164, -0.24912090599536896, -0.2414049208164215, -0.23368893563747406, -0.2259729504585266, -0.21825698018074036, -0.2105409950017929, -0.20282500982284546, -0.1951090395450592, -0.18739305436611176, -0.1796770691871643, -0.17196108400821686, -0.1642450988292694, -0.15652911365032196, -0.1488131284713745, -0.14109714329242706, -0.13338115811347961, -0.12566518783569336, -0.11794920265674591, -0.11023321747779846, -0.10251723229885101, -0.09480125457048416, -0.08708526939153671, -0.07936929166316986, -0.07165330648422241, -0.06393732130527496, -0.05622134357690811, -0.04850535839796066, -0.04078937694430351, -0.03307339549064636, -0.025357414036989212, -0.017641430720686913, -0.009925447404384613, -0.0022094659507274628, 0.0055065155029296875, 0.013222500681877136, 0.020938482135534286, 0.028654463589191437, 0.03637044504284859, 0.04408642649650574, 0.051802411675453186, 0.059518393129110336, 0.06723437458276749, 0.07495035976171494, 0.08266633749008179, 0.09038232266902924, 0.09809830784797668, 0.10581428557634354, 0.11353027075529099, 0.12124624848365784, 0.12896223366260529, 0.13667821884155273, 0.14439420402050018, 0.15211018919944763, 0.15982617437839508, 0.16754215955734253, 0.17525812983512878, 0.18297411501407623, 0.19069010019302368, 0.19840608537197113, 0.20612207055091858, 0.21383804082870483]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 20.0, 37.0, 35.0, 50.0, 69.0, 135.0, 195.0, 320.0, 510.0, 829.0, 1380.0, 2557.0, 4573.0, 8223.0, 14979.0, 27473.0, 49324.0, 85547.0, 137722.0, 189006.0, 188602.0, 138572.0, 86715.0, 49381.0, 27885.0, 15006.0, 8508.0, 4527.0, 2662.0, 1428.0, 865.0, 489.0, 319.0, 192.0, 142.0, 76.0, 57.0, 42.0, 33.0, 14.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.075439453125, -0.07322120666503906, -0.07100296020507812, -0.06878471374511719, -0.06656646728515625, -0.06434822082519531, -0.062129974365234375, -0.05991172790527344, -0.0576934814453125, -0.05547523498535156, -0.053256988525390625, -0.05103874206542969, -0.04882049560546875, -0.04660224914550781, -0.044384002685546875, -0.04216575622558594, -0.039947509765625, -0.03772926330566406, -0.035511016845703125, -0.03329277038574219, -0.03107452392578125, -0.028856277465820312, -0.026638031005859375, -0.024419784545898438, -0.0222015380859375, -0.019983291625976562, -0.017765045166015625, -0.015546798706054688, -0.01332855224609375, -0.011110305786132812, -0.008892059326171875, -0.0066738128662109375, -0.00445556640625, -0.0022373199462890625, -1.9073486328125e-05, 0.0021991729736328125, 0.00441741943359375, 0.0066356658935546875, 0.008853912353515625, 0.011072158813476562, 0.0132904052734375, 0.015508651733398438, 0.017726898193359375, 0.019945144653320312, 0.02216339111328125, 0.024381637573242188, 0.026599884033203125, 0.028818130493164062, 0.031036376953125, 0.03325462341308594, 0.035472869873046875, 0.03769111633300781, 0.03990936279296875, 0.04212760925292969, 0.044345855712890625, 0.04656410217285156, 0.0487823486328125, 0.05100059509277344, 0.053218841552734375, 0.05543708801269531, 0.05765533447265625, 0.05987358093261719, 0.062091827392578125, 0.06431007385253906, 0.0665283203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 14.0, 12.0, 19.0, 39.0, 25.0, 30.0, 35.0, 34.0, 42.0, 41.0, 42.0, 52.0, 58.0, 51.0, 47.0, 44.0, 44.0, 36.0, 42.0, 40.0, 27.0, 26.0, 27.0, 18.0, 18.0, 18.0, 15.0, 9.0, 10.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0], "bins": [-0.04632568359375, -0.04516935348510742, -0.044013023376464844, -0.042856693267822266, -0.04170036315917969, -0.04054403305053711, -0.03938770294189453, -0.03823137283325195, -0.037075042724609375, -0.0359187126159668, -0.03476238250732422, -0.03360605239868164, -0.03244972229003906, -0.031293392181396484, -0.030137062072753906, -0.028980731964111328, -0.02782440185546875, -0.026668071746826172, -0.025511741638183594, -0.024355411529541016, -0.023199081420898438, -0.02204275131225586, -0.02088642120361328, -0.019730091094970703, -0.018573760986328125, -0.017417430877685547, -0.01626110076904297, -0.01510477066040039, -0.013948440551757812, -0.012792110443115234, -0.011635780334472656, -0.010479450225830078, -0.0093231201171875, -0.008166790008544922, -0.007010459899902344, -0.005854129791259766, -0.0046977996826171875, -0.0035414695739746094, -0.0023851394653320312, -0.0012288093566894531, -7.2479248046875e-05, 0.0010838508605957031, 0.0022401809692382812, 0.0033965110778808594, 0.0045528411865234375, 0.005709171295166016, 0.006865501403808594, 0.008021831512451172, 0.00917816162109375, 0.010334491729736328, 0.011490821838378906, 0.012647151947021484, 0.013803482055664062, 0.01495981216430664, 0.01611614227294922, 0.017272472381591797, 0.018428802490234375, 0.019585132598876953, 0.02074146270751953, 0.02189779281616211, 0.023054122924804688, 0.024210453033447266, 0.025366783142089844, 0.026523113250732422, 0.027679443359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 20.0, 14.0, 40.0, 46.0, 76.0, 126.0, 199.0, 395.0, 774.0, 1663.0, 3706.0, 8710.0, 20909.0, 47577.0, 103344.0, 196096.0, 262832.0, 203557.0, 108853.0, 50479.0, 21955.0, 9462.0, 4117.0, 1742.0, 816.0, 417.0, 216.0, 149.0, 102.0, 39.0, 34.0, 17.0, 17.0, 13.0, 10.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.0878143310546875, -0.084625244140625, -0.0814361572265625, -0.0782470703125, -0.0750579833984375, -0.071868896484375, -0.0686798095703125, -0.06549072265625, -0.0623016357421875, -0.059112548828125, -0.0559234619140625, -0.052734375, -0.0495452880859375, -0.046356201171875, -0.0431671142578125, -0.03997802734375, -0.0367889404296875, -0.033599853515625, -0.0304107666015625, -0.0272216796875, -0.0240325927734375, -0.020843505859375, -0.0176544189453125, -0.01446533203125, -0.0112762451171875, -0.008087158203125, -0.0048980712890625, -0.001708984375, 0.0014801025390625, 0.004669189453125, 0.0078582763671875, 0.01104736328125, 0.0142364501953125, 0.017425537109375, 0.0206146240234375, 0.0238037109375, 0.0269927978515625, 0.030181884765625, 0.0333709716796875, 0.03656005859375, 0.0397491455078125, 0.042938232421875, 0.0461273193359375, 0.04931640625, 0.0525054931640625, 0.055694580078125, 0.0588836669921875, 0.06207275390625, 0.0652618408203125, 0.068450927734375, 0.0716400146484375, 0.0748291015625, 0.0780181884765625, 0.081207275390625, 0.0843963623046875, 0.08758544921875, 0.0907745361328125, 0.093963623046875, 0.0971527099609375, 0.100341796875, 0.1035308837890625, 0.106719970703125, 0.1099090576171875, 0.11309814453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 6.0, 6.0, 12.0, 12.0, 16.0, 17.0, 18.0, 33.0, 34.0, 30.0, 34.0, 36.0, 33.0, 52.0, 58.0, 56.0, 53.0, 49.0, 50.0, 49.0, 48.0, 38.0, 43.0, 36.0, 30.0, 36.0, 22.0, 25.0, 14.0, 8.0, 7.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.12659263610839844, -0.12281417846679688, -0.11903572082519531, -0.11525726318359375, -0.11147880554199219, -0.10770034790039062, -0.10392189025878906, -0.1001434326171875, -0.09636497497558594, -0.09258651733398438, -0.08880805969238281, -0.08502960205078125, -0.08125114440917969, -0.07747268676757812, -0.07369422912597656, -0.069915771484375, -0.06613731384277344, -0.062358856201171875, -0.05858039855957031, -0.05480194091796875, -0.05102348327636719, -0.047245025634765625, -0.04346656799316406, -0.0396881103515625, -0.03590965270996094, -0.032131195068359375, -0.028352737426757812, -0.02457427978515625, -0.020795822143554688, -0.017017364501953125, -0.013238906860351562, -0.00946044921875, -0.0056819915771484375, -0.001903533935546875, 0.0018749237060546875, 0.00565338134765625, 0.009431838989257812, 0.013210296630859375, 0.016988754272460938, 0.0207672119140625, 0.024545669555664062, 0.028324127197265625, 0.03210258483886719, 0.03588104248046875, 0.03965950012207031, 0.043437957763671875, 0.04721641540527344, 0.050994873046875, 0.05477333068847656, 0.058551788330078125, 0.06233024597167969, 0.06610870361328125, 0.06988716125488281, 0.07366561889648438, 0.07744407653808594, 0.0812225341796875, 0.08500099182128906, 0.08877944946289062, 0.09255790710449219, 0.09633636474609375, 0.10011482238769531, 0.10389328002929688, 0.10767173767089844, 0.1114501953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 14.0, 9.0, 12.0, 28.0, 59.0, 108.0, 186.0, 375.0, 770.0, 1869.0, 4690.0, 12608.0, 36239.0, 98933.0, 219045.0, 301225.0, 217600.0, 98587.0, 35570.0, 12605.0, 4644.0, 1805.0, 806.0, 342.0, 194.0, 86.0, 48.0, 30.0, 19.0, 8.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.034271240234375, -0.03318309783935547, -0.03209495544433594, -0.031006813049316406, -0.029918670654296875, -0.028830528259277344, -0.027742385864257812, -0.02665424346923828, -0.02556610107421875, -0.02447795867919922, -0.023389816284179688, -0.022301673889160156, -0.021213531494140625, -0.020125389099121094, -0.019037246704101562, -0.01794910430908203, -0.0168609619140625, -0.01577281951904297, -0.014684677124023438, -0.013596534729003906, -0.012508392333984375, -0.011420249938964844, -0.010332107543945312, -0.009243965148925781, -0.00815582275390625, -0.007067680358886719, -0.0059795379638671875, -0.004891395568847656, -0.003803253173828125, -0.0027151107788085938, -0.0016269683837890625, -0.0005388259887695312, 0.00054931640625, 0.0016374588012695312, 0.0027256011962890625, 0.0038137435913085938, 0.004901885986328125, 0.005990028381347656, 0.0070781707763671875, 0.008166313171386719, 0.00925445556640625, 0.010342597961425781, 0.011430740356445312, 0.012518882751464844, 0.013607025146484375, 0.014695167541503906, 0.015783309936523438, 0.01687145233154297, 0.0179595947265625, 0.01904773712158203, 0.020135879516601562, 0.021224021911621094, 0.022312164306640625, 0.023400306701660156, 0.024488449096679688, 0.02557659149169922, 0.02666473388671875, 0.02775287628173828, 0.028841018676757812, 0.029929161071777344, 0.031017303466796875, 0.032105445861816406, 0.03319358825683594, 0.03428173065185547, 0.035369873046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 7.0, 4.0, 12.0, 10.0, 11.0, 13.0, 24.0, 19.0, 27.0, 33.0, 34.0, 64.0, 48.0, 64.0, 65.0, 57.0, 70.0, 48.0, 63.0, 40.0, 46.0, 40.0, 18.0, 38.0, 26.0, 20.0, 13.0, 14.0, 8.0, 5.0, 9.0, 5.0, 5.0, 2.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.3530254364013672e-05, -1.3130716979503632e-05, -1.2731179594993591e-05, -1.2331642210483551e-05, -1.193210482597351e-05, -1.153256744146347e-05, -1.113303005695343e-05, -1.073349267244339e-05, -1.033395528793335e-05, -9.93441790342331e-06, -9.534880518913269e-06, -9.135343134403229e-06, -8.735805749893188e-06, -8.336268365383148e-06, -7.936730980873108e-06, -7.537193596363068e-06, -7.137656211853027e-06, -6.738118827342987e-06, -6.338581442832947e-06, -5.9390440583229065e-06, -5.539506673812866e-06, -5.139969289302826e-06, -4.740431904792786e-06, -4.340894520282745e-06, -3.941357135772705e-06, -3.541819751262665e-06, -3.1422823667526245e-06, -2.7427449822425842e-06, -2.343207597732544e-06, -1.9436702132225037e-06, -1.5441328287124634e-06, -1.144595444202423e-06, -7.450580596923828e-07, -3.4552067518234253e-07, 5.4016709327697754e-08, 4.5355409383773804e-07, 8.530914783477783e-07, 1.2526288628578186e-06, 1.6521662473678589e-06, 2.051703631877899e-06, 2.4512410163879395e-06, 2.8507784008979797e-06, 3.25031578540802e-06, 3.6498531699180603e-06, 4.049390554428101e-06, 4.448927938938141e-06, 4.848465323448181e-06, 5.2480027079582214e-06, 5.647540092468262e-06, 6.047077476978302e-06, 6.446614861488342e-06, 6.8461522459983826e-06, 7.245689630508423e-06, 7.645227015018463e-06, 8.044764399528503e-06, 8.444301784038544e-06, 8.843839168548584e-06, 9.243376553058624e-06, 9.642913937568665e-06, 1.0042451322078705e-05, 1.0441988706588745e-05, 1.0841526091098785e-05, 1.1241063475608826e-05, 1.1640600860118866e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 9.0, 16.0, 15.0, 19.0, 31.0, 57.0, 109.0, 138.0, 252.0, 435.0, 774.0, 1307.0, 2493.0, 4708.0, 9779.0, 20147.0, 42099.0, 82541.0, 144786.0, 204090.0, 207898.0, 151064.0, 87676.0, 44880.0, 21816.0, 10489.0, 5029.0, 2611.0, 1385.0, 767.0, 449.0, 295.0, 142.0, 84.0, 58.0, 38.0, 17.0, 14.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.02630615234375, -0.02561473846435547, -0.024923324584960938, -0.024231910705566406, -0.023540496826171875, -0.022849082946777344, -0.022157669067382812, -0.02146625518798828, -0.02077484130859375, -0.02008342742919922, -0.019392013549804688, -0.018700599670410156, -0.018009185791015625, -0.017317771911621094, -0.016626358032226562, -0.01593494415283203, -0.0152435302734375, -0.014552116394042969, -0.013860702514648438, -0.013169288635253906, -0.012477874755859375, -0.011786460876464844, -0.011095046997070312, -0.010403633117675781, -0.00971221923828125, -0.009020805358886719, -0.008329391479492188, -0.007637977600097656, -0.006946563720703125, -0.006255149841308594, -0.0055637359619140625, -0.004872322082519531, -0.004180908203125, -0.0034894943237304688, -0.0027980804443359375, -0.0021066665649414062, -0.001415252685546875, -0.0007238388061523438, -3.24249267578125e-05, 0.0006589889526367188, 0.00135040283203125, 0.0020418167114257812, 0.0027332305908203125, 0.0034246444702148438, 0.004116058349609375, 0.004807472229003906, 0.0054988861083984375, 0.006190299987792969, 0.0068817138671875, 0.007573127746582031, 0.008264541625976562, 0.008955955505371094, 0.009647369384765625, 0.010338783264160156, 0.011030197143554688, 0.011721611022949219, 0.01241302490234375, 0.013104438781738281, 0.013795852661132812, 0.014487266540527344, 0.015178680419921875, 0.015870094299316406, 0.016561508178710938, 0.01725292205810547, 0.0179443359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 5.0, 13.0, 7.0, 15.0, 18.0, 16.0, 36.0, 30.0, 48.0, 53.0, 53.0, 57.0, 63.0, 62.0, 68.0, 52.0, 51.0, 56.0, 48.0, 28.0, 40.0, 29.0, 30.0, 17.0, 20.0, 16.0, 19.0, 7.0, 4.0, 4.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01983642578125, -0.019155263900756836, -0.018474102020263672, -0.017792940139770508, -0.017111778259277344, -0.01643061637878418, -0.015749454498291016, -0.015068292617797852, -0.014387130737304688, -0.013705968856811523, -0.01302480697631836, -0.012343645095825195, -0.011662483215332031, -0.010981321334838867, -0.010300159454345703, -0.009618997573852539, -0.008937835693359375, -0.008256673812866211, -0.007575511932373047, -0.006894350051879883, -0.006213188171386719, -0.005532026290893555, -0.004850864410400391, -0.0041697025299072266, -0.0034885406494140625, -0.0028073787689208984, -0.0021262168884277344, -0.0014450550079345703, -0.0007638931274414062, -8.273124694824219e-05, 0.0005984306335449219, 0.001279592514038086, 0.00196075439453125, 0.002641916275024414, 0.003323078155517578, 0.004004240036010742, 0.004685401916503906, 0.00536656379699707, 0.006047725677490234, 0.0067288875579833984, 0.0074100494384765625, 0.008091211318969727, 0.00877237319946289, 0.009453535079956055, 0.010134696960449219, 0.010815858840942383, 0.011497020721435547, 0.012178182601928711, 0.012859344482421875, 0.013540506362915039, 0.014221668243408203, 0.014902830123901367, 0.015583992004394531, 0.016265153884887695, 0.01694631576538086, 0.017627477645874023, 0.018308639526367188, 0.01898980140686035, 0.019670963287353516, 0.02035212516784668, 0.021033287048339844, 0.021714448928833008, 0.022395610809326172, 0.023076772689819336, 0.0237579345703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 11.0, 11.0, 17.0, 45.0, 71.0, 78.0, 99.0, 130.0, 128.0, 113.0, 101.0, 78.0, 41.0, 26.0, 15.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6395614147186279, -0.6244599223136902, -0.6093584895133972, -0.5942569971084595, -0.5791555047035217, -0.564054012298584, -0.548952579498291, -0.5338510870933533, -0.5187495946884155, -0.5036481022834778, -0.4885466396808624, -0.47344517707824707, -0.4583436846733093, -0.44324222207069397, -0.4281407594680786, -0.41303926706314087, -0.3979378342628479, -0.38283637166023254, -0.3677348792552948, -0.35263341665267944, -0.3375319242477417, -0.32243046164512634, -0.307328999042511, -0.29222750663757324, -0.2771260142326355, -0.26202455163002014, -0.2469230592250824, -0.23182159662246704, -0.2167201191186905, -0.20161864161491394, -0.1865171641111374, -0.17141568660736084, -0.15631422400474548, -0.14121274650096893, -0.12611126899719238, -0.11100979894399643, -0.09590832889080048, -0.08080685138702393, -0.06570537388324738, -0.05060390383005142, -0.03550242632627487, -0.02040095254778862, -0.005299476906657219, 0.009801998734474182, 0.024903472512960434, 0.040004946291446686, 0.055106423795223236, 0.07020789384841919, 0.08530937135219574, 0.10041084885597229, 0.11551231890916824, 0.1306138038635254, 0.14571526646614075, 0.1608167439699173, 0.17591822147369385, 0.1910196840763092, 0.20612117648124695, 0.2212226539850235, 0.23632413148880005, 0.2514255940914154, 0.26652708649635315, 0.2816285490989685, 0.29673004150390625, 0.3118315041065216, 0.32693296670913696]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 8.0, 9.0, 8.0, 12.0, 11.0, 11.0, 15.0, 20.0, 23.0, 19.0, 24.0, 37.0, 47.0, 39.0, 27.0, 40.0, 38.0, 47.0, 53.0, 43.0, 38.0, 39.0, 41.0, 39.0, 35.0, 27.0, 26.0, 35.0, 23.0, 33.0, 28.0, 13.0, 17.0, 10.0, 17.0, 11.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.29893815517425537, -0.28897735476493835, -0.2790165841579437, -0.2690557837486267, -0.2590950131416321, -0.24913421273231506, -0.23917342722415924, -0.22921264171600342, -0.2192518413066864, -0.20929105579853058, -0.19933027029037476, -0.18936946988105774, -0.17940868437290192, -0.1694478988647461, -0.15948711335659027, -0.14952632784843445, -0.13956554234027863, -0.1296047568321228, -0.11964396387338638, -0.10968317836523056, -0.09972238540649414, -0.08976159989833832, -0.0798008143901825, -0.06984002143144608, -0.05987923592329025, -0.04991844668984413, -0.03995765745639801, -0.029996871948242188, -0.020036082714796066, -0.010075293481349945, -0.00011450797319412231, 0.009846284985542297, 0.01980707049369812, 0.02976785972714424, 0.03972864896059036, 0.049689434468746185, 0.059650223702192307, 0.06961101293563843, 0.07957179844379425, 0.08953259140253067, 0.09949337691068649, 0.10945416241884232, 0.11941495537757874, 0.12937574088573456, 0.13933652639389038, 0.1492973268032074, 0.15925809741020203, 0.16921889781951904, 0.17917968332767487, 0.1891404688358307, 0.1991012543439865, 0.20906203985214233, 0.21902284026145935, 0.22898362576961517, 0.238944411277771, 0.248905211687088, 0.25886598229408264, 0.26882678270339966, 0.2787875533103943, 0.2887483537197113, 0.29870912432670593, 0.30866992473602295, 0.3186306953430176, 0.3285914957523346, 0.3385522961616516]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 8.0, 13.0, 21.0, 22.0, 32.0, 62.0, 93.0, 144.0, 225.0, 418.0, 789.0, 1614.0, 3422.0, 8149.0, 20763.0, 62480.0, 234725.0, 1214593.0, 1974058.0, 501861.0, 113283.0, 35294.0, 12743.0, 5251.0, 2181.0, 964.0, 488.0, 267.0, 119.0, 84.0, 35.0, 20.0, 17.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08966064453125, -0.08731555938720703, -0.08497047424316406, -0.0826253890991211, -0.08028030395507812, -0.07793521881103516, -0.07559013366699219, -0.07324504852294922, -0.07089996337890625, -0.06855487823486328, -0.06620979309082031, -0.06386470794677734, -0.061519622802734375, -0.059174537658691406, -0.05682945251464844, -0.05448436737060547, -0.0521392822265625, -0.04979419708251953, -0.04744911193847656, -0.045104026794433594, -0.042758941650390625, -0.040413856506347656, -0.03806877136230469, -0.03572368621826172, -0.03337860107421875, -0.03103351593017578, -0.028688430786132812, -0.026343345642089844, -0.023998260498046875, -0.021653175354003906, -0.019308090209960938, -0.01696300506591797, -0.014617919921875, -0.012272834777832031, -0.009927749633789062, -0.007582664489746094, -0.005237579345703125, -0.0028924942016601562, -0.0005474090576171875, 0.0017976760864257812, 0.00414276123046875, 0.006487846374511719, 0.008832931518554688, 0.011178016662597656, 0.013523101806640625, 0.015868186950683594, 0.018213272094726562, 0.02055835723876953, 0.0229034423828125, 0.02524852752685547, 0.027593612670898438, 0.029938697814941406, 0.032283782958984375, 0.034628868103027344, 0.03697395324707031, 0.03931903839111328, 0.04166412353515625, 0.04400920867919922, 0.04635429382324219, 0.048699378967285156, 0.051044464111328125, 0.053389549255371094, 0.05573463439941406, 0.05807971954345703, 0.0604248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 2.0, 8.0, 8.0, 15.0, 15.0, 20.0, 23.0, 25.0, 30.0, 20.0, 36.0, 34.0, 50.0, 49.0, 53.0, 58.0, 30.0, 48.0, 48.0, 44.0, 50.0, 38.0, 43.0, 29.0, 22.0, 30.0, 18.0, 24.0, 23.0, 18.0, 15.0, 16.0, 11.0, 8.0, 8.0, 10.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04766845703125, -0.046422481536865234, -0.04517650604248047, -0.0439305305480957, -0.04268455505371094, -0.04143857955932617, -0.040192604064941406, -0.03894662857055664, -0.037700653076171875, -0.03645467758178711, -0.035208702087402344, -0.03396272659301758, -0.03271675109863281, -0.03147077560424805, -0.03022480010986328, -0.028978824615478516, -0.02773284912109375, -0.026486873626708984, -0.02524089813232422, -0.023994922637939453, -0.022748947143554688, -0.021502971649169922, -0.020256996154785156, -0.01901102066040039, -0.017765045166015625, -0.01651906967163086, -0.015273094177246094, -0.014027118682861328, -0.012781143188476562, -0.011535167694091797, -0.010289192199707031, -0.009043216705322266, -0.0077972412109375, -0.006551265716552734, -0.005305290222167969, -0.004059314727783203, -0.0028133392333984375, -0.0015673637390136719, -0.00032138824462890625, 0.0009245872497558594, 0.002170562744140625, 0.0034165382385253906, 0.004662513732910156, 0.005908489227294922, 0.0071544647216796875, 0.008400440216064453, 0.009646415710449219, 0.010892391204833984, 0.01213836669921875, 0.013384342193603516, 0.014630317687988281, 0.015876293182373047, 0.017122268676757812, 0.018368244171142578, 0.019614219665527344, 0.02086019515991211, 0.022106170654296875, 0.02335214614868164, 0.024598121643066406, 0.025844097137451172, 0.027090072631835938, 0.028336048126220703, 0.02958202362060547, 0.030827999114990234, 0.032073974609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 13.0, 6.0, 22.0, 24.0, 41.0, 54.0, 97.0, 156.0, 248.0, 556.0, 1175.0, 2878.0, 7378.0, 20507.0, 61909.0, 202184.0, 711277.0, 1831496.0, 960081.0, 270256.0, 81606.0, 26631.0, 9280.0, 3445.0, 1432.0, 708.0, 316.0, 188.0, 93.0, 79.0, 44.0, 28.0, 16.0, 16.0, 9.0, 7.0, 6.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0740966796875, -0.07182502746582031, -0.06955337524414062, -0.06728172302246094, -0.06501007080078125, -0.06273841857910156, -0.060466766357421875, -0.05819511413574219, -0.0559234619140625, -0.05365180969238281, -0.051380157470703125, -0.04910850524902344, -0.04683685302734375, -0.04456520080566406, -0.042293548583984375, -0.04002189636230469, -0.037750244140625, -0.03547859191894531, -0.033206939697265625, -0.030935287475585938, -0.02866363525390625, -0.026391983032226562, -0.024120330810546875, -0.021848678588867188, -0.0195770263671875, -0.017305374145507812, -0.015033721923828125, -0.012762069702148438, -0.01049041748046875, -0.008218765258789062, -0.005947113037109375, -0.0036754608154296875, -0.00140380859375, 0.0008678436279296875, 0.003139495849609375, 0.0054111480712890625, 0.00768280029296875, 0.009954452514648438, 0.012226104736328125, 0.014497756958007812, 0.0167694091796875, 0.019041061401367188, 0.021312713623046875, 0.023584365844726562, 0.02585601806640625, 0.028127670288085938, 0.030399322509765625, 0.03267097473144531, 0.034942626953125, 0.03721427917480469, 0.039485931396484375, 0.04175758361816406, 0.04402923583984375, 0.04630088806152344, 0.048572540283203125, 0.05084419250488281, 0.0531158447265625, 0.05538749694824219, 0.057659149169921875, 0.05993080139160156, 0.06220245361328125, 0.06447410583496094, 0.06674575805664062, 0.06901741027832031, 0.0712890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 6.0, 12.0, 14.0, 17.0, 20.0, 32.0, 43.0, 56.0, 78.0, 99.0, 144.0, 225.0, 285.0, 367.0, 500.0, 544.0, 447.0, 324.0, 225.0, 164.0, 144.0, 81.0, 67.0, 48.0, 36.0, 21.0, 17.0, 21.0, 10.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0885009765625, -0.0861215591430664, -0.08374214172363281, -0.08136272430419922, -0.07898330688476562, -0.07660388946533203, -0.07422447204589844, -0.07184505462646484, -0.06946563720703125, -0.06708621978759766, -0.06470680236816406, -0.06232738494873047, -0.059947967529296875, -0.05756855010986328, -0.05518913269042969, -0.052809715270996094, -0.0504302978515625, -0.048050880432128906, -0.04567146301269531, -0.04329204559326172, -0.040912628173828125, -0.03853321075439453, -0.03615379333496094, -0.033774375915527344, -0.03139495849609375, -0.029015541076660156, -0.026636123657226562, -0.02425670623779297, -0.021877288818359375, -0.01949787139892578, -0.017118453979492188, -0.014739036560058594, -0.012359619140625, -0.009980201721191406, -0.0076007843017578125, -0.005221366882324219, -0.002841949462890625, -0.00046253204345703125, 0.0019168853759765625, 0.004296302795410156, 0.00667572021484375, 0.009055137634277344, 0.011434555053710938, 0.013813972473144531, 0.016193389892578125, 0.01857280731201172, 0.020952224731445312, 0.023331642150878906, 0.0257110595703125, 0.028090476989746094, 0.030469894409179688, 0.03284931182861328, 0.035228729248046875, 0.03760814666748047, 0.03998756408691406, 0.042366981506347656, 0.04474639892578125, 0.047125816345214844, 0.04950523376464844, 0.05188465118408203, 0.054264068603515625, 0.05664348602294922, 0.05902290344238281, 0.061402320861816406, 0.06378173828125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 3.0, 8.0, 17.0, 23.0, 34.0, 40.0, 49.0, 59.0, 67.0, 105.0, 90.0, 93.0, 86.0, 81.0, 65.0, 61.0, 36.0, 21.0, 23.0, 11.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35886165499687195, -0.34757113456726074, -0.33628058433532715, -0.32499006390571594, -0.31369954347610474, -0.30240899324417114, -0.29111847281455994, -0.27982795238494873, -0.26853740215301514, -0.25724688172340393, -0.24595634639263153, -0.23466581106185913, -0.22337529063224792, -0.21208475530147552, -0.20079421997070312, -0.18950369954109192, -0.1782131791114807, -0.1669226437807083, -0.1556321233510971, -0.1443415880203247, -0.1330510675907135, -0.1217605322599411, -0.1104699969291687, -0.0991794690489769, -0.0878889411687851, -0.07659841328859329, -0.06530788540840149, -0.05401735007762909, -0.042726822197437286, -0.03143629431724548, -0.020145758986473083, -0.00885523110628128, 0.0024352967739105225, 0.013725826516747475, 0.025016356259584427, 0.03630688786506653, 0.04759741574525833, 0.058887943625450134, 0.07017847895622253, 0.08146900683641434, 0.09275953471660614, 0.10405006259679794, 0.11534059047698975, 0.12663112580776215, 0.13792166113853455, 0.14921218156814575, 0.16050271689891815, 0.17179325222969055, 0.18308377265930176, 0.19437430799007416, 0.20566482841968536, 0.21695536375045776, 0.22824588418006897, 0.23953641951084137, 0.25082695484161377, 0.262117475271225, 0.2734079957008362, 0.2846985161304474, 0.295989066362381, 0.3072795867919922, 0.3185701072216034, 0.3298606276512146, 0.3411511778831482, 0.3524416983127594, 0.363732248544693]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 5.0, 6.0, 14.0, 16.0, 14.0, 24.0, 26.0, 24.0, 29.0, 32.0, 40.0, 37.0, 52.0, 40.0, 41.0, 41.0, 39.0, 39.0, 43.0, 50.0, 35.0, 44.0, 38.0, 39.0, 33.0, 27.0, 23.0, 32.0, 19.0, 21.0, 9.0, 8.0, 12.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.24597465991973877, -0.23880283534526825, -0.23163102567195892, -0.2244592010974884, -0.21728739142417908, -0.21011556684970856, -0.20294374227523804, -0.1957719326019287, -0.1886001080274582, -0.18142828345298767, -0.17425647377967834, -0.16708464920520782, -0.1599128246307373, -0.15274101495742798, -0.14556919038295746, -0.13839736580848694, -0.1312255561351776, -0.12405373901128769, -0.11688192188739777, -0.10971009731292725, -0.10253828018903732, -0.0953664630651474, -0.08819463849067688, -0.08102282136678696, -0.07385100424289703, -0.06667918711900711, -0.05950736626982689, -0.05233554542064667, -0.045163728296756744, -0.03799191117286682, -0.0308200903236866, -0.023648269474506378, -0.016476452350616455, -0.009304633364081383, -0.0021328143775463104, 0.005039004608988762, 0.012210823595523834, 0.019382640719413757, 0.02655446156859398, 0.0337262824177742, 0.040898099541664124, 0.04806991666555405, 0.05524173751473427, 0.06241355836391449, 0.06958537548780441, 0.07675719261169434, 0.08392901718616486, 0.09110083431005478, 0.0982726514339447, 0.10544446855783463, 0.11261628568172455, 0.11978811025619507, 0.1269599199295044, 0.13413174450397491, 0.14130356907844543, 0.14847537875175476, 0.15564720332622528, 0.1628190279006958, 0.16999083757400513, 0.17716266214847565, 0.18433448672294617, 0.1915062963962555, 0.198678120970726, 0.20584994554519653, 0.21302175521850586]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 6.0, 7.0, 6.0, 8.0, 20.0, 20.0, 31.0, 32.0, 67.0, 96.0, 146.0, 237.0, 402.0, 639.0, 1128.0, 1909.0, 3342.0, 6110.0, 11042.0, 21008.0, 38793.0, 70942.0, 121601.0, 179047.0, 200711.0, 161341.0, 102651.0, 58180.0, 31306.0, 16867.0, 9123.0, 5011.0, 2826.0, 1554.0, 921.0, 547.0, 315.0, 183.0, 126.0, 86.0, 50.0, 33.0, 29.0, 17.0, 15.0, 10.0, 3.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08261680603027344, -0.07947921752929688, -0.07634162902832031, -0.07320404052734375, -0.07006645202636719, -0.06692886352539062, -0.06379127502441406, -0.0606536865234375, -0.05751609802246094, -0.054378509521484375, -0.05124092102050781, -0.04810333251953125, -0.04496574401855469, -0.041828155517578125, -0.03869056701660156, -0.035552978515625, -0.03241539001464844, -0.029277801513671875, -0.026140213012695312, -0.02300262451171875, -0.019865036010742188, -0.016727447509765625, -0.013589859008789062, -0.0104522705078125, -0.0073146820068359375, -0.004177093505859375, -0.0010395050048828125, 0.00209808349609375, 0.0052356719970703125, 0.008373260498046875, 0.011510848999023438, 0.0146484375, 0.017786026000976562, 0.020923614501953125, 0.024061203002929688, 0.02719879150390625, 0.030336380004882812, 0.033473968505859375, 0.03661155700683594, 0.0397491455078125, 0.04288673400878906, 0.046024322509765625, 0.04916191101074219, 0.05229949951171875, 0.05543708801269531, 0.058574676513671875, 0.06171226501464844, 0.064849853515625, 0.06798744201660156, 0.07112503051757812, 0.07426261901855469, 0.07740020751953125, 0.08053779602050781, 0.08367538452148438, 0.08681297302246094, 0.0899505615234375, 0.09308815002441406, 0.09622573852539062, 0.09936332702636719, 0.10250091552734375, 0.10563850402832031, 0.10877609252929688, 0.11191368103027344, 0.11505126953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 10.0, 20.0, 14.0, 15.0, 20.0, 26.0, 36.0, 45.0, 39.0, 42.0, 52.0, 38.0, 46.0, 53.0, 45.0, 53.0, 42.0, 49.0, 40.0, 39.0, 28.0, 34.0, 39.0, 27.0, 24.0, 14.0, 11.0, 21.0, 13.0, 9.0, 6.0, 10.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.042616844177246094, -0.04141044616699219, -0.04020404815673828, -0.038997650146484375, -0.03779125213623047, -0.03658485412597656, -0.035378456115722656, -0.03417205810546875, -0.032965660095214844, -0.03175926208496094, -0.03055286407470703, -0.029346466064453125, -0.02814006805419922, -0.026933670043945312, -0.025727272033691406, -0.0245208740234375, -0.023314476013183594, -0.022108078002929688, -0.02090167999267578, -0.019695281982421875, -0.01848888397216797, -0.017282485961914062, -0.016076087951660156, -0.01486968994140625, -0.013663291931152344, -0.012456893920898438, -0.011250495910644531, -0.010044097900390625, -0.008837699890136719, -0.0076313018798828125, -0.006424903869628906, -0.005218505859375, -0.004012107849121094, -0.0028057098388671875, -0.0015993118286132812, -0.000392913818359375, 0.0008134841918945312, 0.0020198822021484375, 0.0032262802124023438, 0.00443267822265625, 0.005639076232910156, 0.0068454742431640625, 0.008051872253417969, 0.009258270263671875, 0.010464668273925781, 0.011671066284179688, 0.012877464294433594, 0.0140838623046875, 0.015290260314941406, 0.016496658325195312, 0.01770305633544922, 0.018909454345703125, 0.02011585235595703, 0.021322250366210938, 0.022528648376464844, 0.02373504638671875, 0.024941444396972656, 0.026147842407226562, 0.02735424041748047, 0.028560638427734375, 0.02976703643798828, 0.030973434448242188, 0.032179832458496094, 0.03338623046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 8.0, 9.0, 12.0, 18.0, 17.0, 31.0, 58.0, 64.0, 104.0, 168.0, 225.0, 347.0, 616.0, 1127.0, 2159.0, 4523.0, 9774.0, 22238.0, 51813.0, 111601.0, 198133.0, 247702.0, 196721.0, 108892.0, 50893.0, 22010.0, 9782.0, 4464.0, 2254.0, 1096.0, 610.0, 380.0, 254.0, 152.0, 106.0, 64.0, 30.0, 35.0, 25.0, 18.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.113037109375, -0.10944747924804688, -0.10585784912109375, -0.10226821899414062, -0.0986785888671875, -0.09508895874023438, -0.09149932861328125, -0.08790969848632812, -0.084320068359375, -0.08073043823242188, -0.07714080810546875, -0.07355117797851562, -0.0699615478515625, -0.06637191772460938, -0.06278228759765625, -0.059192657470703125, -0.05560302734375, -0.052013397216796875, -0.04842376708984375, -0.044834136962890625, -0.0412445068359375, -0.037654876708984375, -0.03406524658203125, -0.030475616455078125, -0.026885986328125, -0.023296356201171875, -0.01970672607421875, -0.016117095947265625, -0.0125274658203125, -0.008937835693359375, -0.00534820556640625, -0.001758575439453125, 0.0018310546875, 0.005420684814453125, 0.00901031494140625, 0.012599945068359375, 0.0161895751953125, 0.019779205322265625, 0.02336883544921875, 0.026958465576171875, 0.030548095703125, 0.034137725830078125, 0.03772735595703125, 0.041316986083984375, 0.0449066162109375, 0.048496246337890625, 0.05208587646484375, 0.055675506591796875, 0.05926513671875, 0.06285476684570312, 0.06644439697265625, 0.07003402709960938, 0.0736236572265625, 0.07721328735351562, 0.08080291748046875, 0.08439254760742188, 0.087982177734375, 0.09157180786132812, 0.09516143798828125, 0.09875106811523438, 0.1023406982421875, 0.10593032836914062, 0.10951995849609375, 0.11310958862304688, 0.11669921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 9.0, 5.0, 10.0, 14.0, 13.0, 10.0, 27.0, 17.0, 17.0, 33.0, 31.0, 34.0, 31.0, 51.0, 43.0, 41.0, 39.0, 48.0, 54.0, 57.0, 40.0, 38.0, 46.0, 36.0, 31.0, 31.0, 32.0, 29.0, 27.0, 22.0, 11.0, 16.0, 14.0, 9.0, 13.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10076904296875, -0.09743690490722656, -0.09410476684570312, -0.09077262878417969, -0.08744049072265625, -0.08410835266113281, -0.08077621459960938, -0.07744407653808594, -0.0741119384765625, -0.07077980041503906, -0.06744766235351562, -0.06411552429199219, -0.06078338623046875, -0.05745124816894531, -0.054119110107421875, -0.05078697204589844, -0.047454833984375, -0.04412269592285156, -0.040790557861328125, -0.03745841979980469, -0.03412628173828125, -0.030794143676757812, -0.027462005615234375, -0.024129867553710938, -0.0207977294921875, -0.017465591430664062, -0.014133453369140625, -0.010801315307617188, -0.00746917724609375, -0.0041370391845703125, -0.000804901123046875, 0.0025272369384765625, 0.005859375, 0.009191513061523438, 0.012523651123046875, 0.015855789184570312, 0.01918792724609375, 0.022520065307617188, 0.025852203369140625, 0.029184341430664062, 0.0325164794921875, 0.03584861755371094, 0.039180755615234375, 0.04251289367675781, 0.04584503173828125, 0.04917716979980469, 0.052509307861328125, 0.05584144592285156, 0.059173583984375, 0.06250572204589844, 0.06583786010742188, 0.06916999816894531, 0.07250213623046875, 0.07583427429199219, 0.07916641235351562, 0.08249855041503906, 0.0858306884765625, 0.08916282653808594, 0.09249496459960938, 0.09582710266113281, 0.09915924072265625, 0.10249137878417969, 0.10582351684570312, 0.10915565490722656, 0.11248779296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 9.0, 24.0, 10.0, 25.0, 34.0, 56.0, 86.0, 118.0, 170.0, 256.0, 331.0, 507.0, 799.0, 1234.0, 1895.0, 3092.0, 5274.0, 8818.0, 15653.0, 28894.0, 53460.0, 99081.0, 163353.0, 208146.0, 184972.0, 121261.0, 67818.0, 36169.0, 19701.0, 10901.0, 6196.0, 3748.0, 2193.0, 1491.0, 905.0, 575.0, 399.0, 254.0, 175.0, 137.0, 107.0, 56.0, 52.0, 35.0, 21.0, 19.0, 14.0, 9.0, 6.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.029052734375, -0.02813577651977539, -0.02721881866455078, -0.026301860809326172, -0.025384902954101562, -0.024467945098876953, -0.023550987243652344, -0.022634029388427734, -0.021717071533203125, -0.020800113677978516, -0.019883155822753906, -0.018966197967529297, -0.018049240112304688, -0.017132282257080078, -0.01621532440185547, -0.01529836654663086, -0.01438140869140625, -0.01346445083618164, -0.012547492980957031, -0.011630535125732422, -0.010713577270507812, -0.009796619415283203, -0.008879661560058594, -0.007962703704833984, -0.007045745849609375, -0.006128787994384766, -0.005211830139160156, -0.004294872283935547, -0.0033779144287109375, -0.002460956573486328, -0.0015439987182617188, -0.0006270408630371094, 0.0002899169921875, 0.0012068748474121094, 0.0021238327026367188, 0.003040790557861328, 0.0039577484130859375, 0.004874706268310547, 0.005791664123535156, 0.006708621978759766, 0.007625579833984375, 0.008542537689208984, 0.009459495544433594, 0.010376453399658203, 0.011293411254882812, 0.012210369110107422, 0.013127326965332031, 0.01404428482055664, 0.01496124267578125, 0.01587820053100586, 0.01679515838623047, 0.017712116241455078, 0.018629074096679688, 0.019546031951904297, 0.020462989807128906, 0.021379947662353516, 0.022296905517578125, 0.023213863372802734, 0.024130821228027344, 0.025047779083251953, 0.025964736938476562, 0.026881694793701172, 0.02779865264892578, 0.02871561050415039, 0.029632568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 10.0, 4.0, 7.0, 15.0, 14.0, 11.0, 7.0, 16.0, 15.0, 25.0, 27.0, 24.0, 17.0, 31.0, 32.0, 31.0, 32.0, 50.0, 58.0, 38.0, 57.0, 52.0, 48.0, 45.0, 47.0, 42.0, 29.0, 35.0, 31.0, 27.0, 15.0, 21.0, 18.0, 17.0, 10.0, 10.0, 3.0, 4.0, 6.0, 9.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.4483928680419922e-05, -1.4083459973335266e-05, -1.368299126625061e-05, -1.3282522559165955e-05, -1.2882053852081299e-05, -1.2481585144996643e-05, -1.2081116437911987e-05, -1.1680647730827332e-05, -1.1280179023742676e-05, -1.087971031665802e-05, -1.0479241609573364e-05, -1.0078772902488708e-05, -9.678304195404053e-06, -9.277835488319397e-06, -8.877366781234741e-06, -8.476898074150085e-06, -8.07642936706543e-06, -7.675960659980774e-06, -7.275491952896118e-06, -6.875023245811462e-06, -6.474554538726807e-06, -6.074085831642151e-06, -5.673617124557495e-06, -5.273148417472839e-06, -4.872679710388184e-06, -4.472211003303528e-06, -4.071742296218872e-06, -3.6712735891342163e-06, -3.2708048820495605e-06, -2.8703361749649048e-06, -2.469867467880249e-06, -2.0693987607955933e-06, -1.6689300537109375e-06, -1.2684613466262817e-06, -8.67992639541626e-07, -4.675239324569702e-07, -6.705522537231445e-08, 3.334134817123413e-07, 7.338821887969971e-07, 1.1343508958816528e-06, 1.5348196029663086e-06, 1.9352883100509644e-06, 2.33575701713562e-06, 2.736225724220276e-06, 3.1366944313049316e-06, 3.5371631383895874e-06, 3.937631845474243e-06, 4.338100552558899e-06, 4.738569259643555e-06, 5.1390379667282104e-06, 5.539506673812866e-06, 5.939975380897522e-06, 6.340444087982178e-06, 6.7409127950668335e-06, 7.141381502151489e-06, 7.541850209236145e-06, 7.9423189163208e-06, 8.342787623405457e-06, 8.743256330490112e-06, 9.143725037574768e-06, 9.544193744659424e-06, 9.94466245174408e-06, 1.0345131158828735e-05, 1.0745599865913391e-05, 1.1146068572998047e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 9.0, 19.0, 27.0, 29.0, 43.0, 72.0, 91.0, 122.0, 182.0, 325.0, 530.0, 799.0, 1443.0, 2648.0, 4917.0, 9754.0, 21323.0, 53518.0, 145531.0, 313570.0, 287651.0, 123409.0, 45422.0, 18383.0, 8466.0, 4446.0, 2325.0, 1281.0, 828.0, 488.0, 296.0, 205.0, 115.0, 79.0, 48.0, 33.0, 19.0, 31.0, 9.0, 14.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.04595947265625, -0.04460430145263672, -0.04324913024902344, -0.041893959045410156, -0.040538787841796875, -0.039183616638183594, -0.03782844543457031, -0.03647327423095703, -0.03511810302734375, -0.03376293182373047, -0.03240776062011719, -0.031052589416503906, -0.029697418212890625, -0.028342247009277344, -0.026987075805664062, -0.02563190460205078, -0.0242767333984375, -0.02292156219482422, -0.021566390991210938, -0.020211219787597656, -0.018856048583984375, -0.017500877380371094, -0.016145706176757812, -0.014790534973144531, -0.01343536376953125, -0.012080192565917969, -0.010725021362304688, -0.009369850158691406, -0.008014678955078125, -0.006659507751464844, -0.0053043365478515625, -0.003949165344238281, -0.002593994140625, -0.0012388229370117188, 0.0001163482666015625, 0.0014715194702148438, 0.002826690673828125, 0.004181861877441406, 0.0055370330810546875, 0.006892204284667969, 0.00824737548828125, 0.009602546691894531, 0.010957717895507812, 0.012312889099121094, 0.013668060302734375, 0.015023231506347656, 0.016378402709960938, 0.01773357391357422, 0.0190887451171875, 0.02044391632080078, 0.021799087524414062, 0.023154258728027344, 0.024509429931640625, 0.025864601135253906, 0.027219772338867188, 0.02857494354248047, 0.02993011474609375, 0.03128528594970703, 0.03264045715332031, 0.033995628356933594, 0.035350799560546875, 0.036705970764160156, 0.03806114196777344, 0.03941631317138672, 0.040771484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 9.0, 16.0, 15.0, 33.0, 39.0, 35.0, 65.0, 69.0, 83.0, 112.0, 108.0, 81.0, 68.0, 73.0, 39.0, 39.0, 27.0, 18.0, 16.0, 13.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.047008514404296875, -0.04570770263671875, -0.044406890869140625, -0.0431060791015625, -0.041805267333984375, -0.04050445556640625, -0.039203643798828125, -0.03790283203125, -0.036602020263671875, -0.03530120849609375, -0.034000396728515625, -0.0326995849609375, -0.031398773193359375, -0.03009796142578125, -0.028797149658203125, -0.027496337890625, -0.026195526123046875, -0.02489471435546875, -0.023593902587890625, -0.0222930908203125, -0.020992279052734375, -0.01969146728515625, -0.018390655517578125, -0.01708984375, -0.015789031982421875, -0.01448822021484375, -0.013187408447265625, -0.0118865966796875, -0.010585784912109375, -0.00928497314453125, -0.007984161376953125, -0.006683349609375, -0.005382537841796875, -0.00408172607421875, -0.002780914306640625, -0.0014801025390625, -0.000179290771484375, 0.00112152099609375, 0.002422332763671875, 0.00372314453125, 0.005023956298828125, 0.00632476806640625, 0.007625579833984375, 0.0089263916015625, 0.010227203369140625, 0.01152801513671875, 0.012828826904296875, 0.014129638671875, 0.015430450439453125, 0.01673126220703125, 0.018032073974609375, 0.0193328857421875, 0.020633697509765625, 0.02193450927734375, 0.023235321044921875, 0.0245361328125, 0.025836944580078125, 0.02713775634765625, 0.028438568115234375, 0.0297393798828125, 0.031040191650390625, 0.03234100341796875, 0.033641815185546875, 0.034942626953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 9.0, 8.0, 8.0, 11.0, 18.0, 24.0, 31.0, 34.0, 40.0, 57.0, 64.0, 69.0, 69.0, 88.0, 84.0, 69.0, 66.0, 51.0, 41.0, 29.0, 36.0, 24.0, 16.0, 19.0, 14.0, 8.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41167014837265015, -0.3999342918395996, -0.38819846510887146, -0.3764626085758209, -0.3647267818450928, -0.35299092531204224, -0.3412550687789917, -0.32951924204826355, -0.3177834153175354, -0.30604755878448486, -0.2943117320537567, -0.2825758755207062, -0.270840048789978, -0.2591041922569275, -0.24736835062503815, -0.2356325089931488, -0.22389665246009827, -0.21216081082820892, -0.20042496919631958, -0.18868911266326904, -0.1769532859325409, -0.16521742939949036, -0.153481587767601, -0.14174574613571167, -0.13000990450382233, -0.11827406287193298, -0.10653822124004364, -0.0948023721575737, -0.08306653052568436, -0.07133068889379501, -0.05959483981132507, -0.04785899817943573, -0.03612315654754639, -0.024387313053011894, -0.012651469558477402, -0.00091562420129776, 0.010820217430591583, 0.022556059062480927, 0.03429190814495087, 0.04602774977684021, 0.05776359140872955, 0.0694994330406189, 0.08123527467250824, 0.09297112375497818, 0.10470696538686752, 0.11644280701875687, 0.1281786561012268, 0.13991449773311615, 0.1516503393650055, 0.16338618099689484, 0.17512202262878418, 0.18685787916183472, 0.19859370589256287, 0.2103295624256134, 0.22206540405750275, 0.2338012456893921, 0.24553708732128143, 0.2572729289531708, 0.2690087854862213, 0.28074461221694946, 0.29248046875, 0.30421629548072815, 0.3159521520137787, 0.32768797874450684, 0.3394238352775574]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 8.0, 8.0, 6.0, 14.0, 16.0, 19.0, 15.0, 22.0, 18.0, 25.0, 29.0, 31.0, 30.0, 34.0, 32.0, 49.0, 42.0, 43.0, 35.0, 54.0, 35.0, 47.0, 37.0, 38.0, 45.0, 38.0, 30.0, 21.0, 30.0, 30.0, 12.0, 19.0, 15.0, 12.0, 11.0, 11.0, 3.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34467560052871704, -0.334215372800827, -0.323755145072937, -0.3132948875427246, -0.3028346598148346, -0.2923744320869446, -0.2819141745567322, -0.27145394682884216, -0.26099371910095215, -0.25053349137306213, -0.24007324874401093, -0.22961300611495972, -0.2191527783870697, -0.2086925506591797, -0.19823230803012848, -0.18777206540107727, -0.17731183767318726, -0.16685160994529724, -0.15639136731624603, -0.14593112468719482, -0.1354708969593048, -0.1250106692314148, -0.11455042660236359, -0.10409019142389297, -0.09362995624542236, -0.08316972106695175, -0.07270948588848114, -0.06224925071001053, -0.05178901553153992, -0.041328780353069305, -0.030868545174598694, -0.020408309996128082, -0.00994807481765747, 0.0005121603608131409, 0.010972395539283752, 0.021432630717754364, 0.031892865896224976, 0.04235310107469559, 0.0528133362531662, 0.06327357143163681, 0.07373380661010742, 0.08419404178857803, 0.09465427696704865, 0.10511451214551926, 0.11557474732398987, 0.12603497505187988, 0.1364952176809311, 0.1469554603099823, 0.15741568803787231, 0.16787591576576233, 0.17833615839481354, 0.18879640102386475, 0.19925662875175476, 0.20971685647964478, 0.22017709910869598, 0.2306373417377472, 0.2410975694656372, 0.2515577971935272, 0.26201802492141724, 0.27247828245162964, 0.28293851017951965, 0.29339873790740967, 0.30385899543762207, 0.3143192231655121, 0.3247794508934021]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 10.0, 11.0, 9.0, 14.0, 15.0, 40.0, 59.0, 73.0, 118.0, 192.0, 332.0, 528.0, 891.0, 1647.0, 2906.0, 5710.0, 11475.0, 24580.0, 58376.0, 167694.0, 621045.0, 1683361.0, 1133477.0, 313124.0, 97331.0, 37352.0, 16524.0, 7879.0, 4149.0, 2226.0, 1294.0, 766.0, 392.0, 248.0, 161.0, 97.0, 51.0, 40.0, 22.0, 19.0, 17.0, 13.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.05792808532714844, -0.055980682373046875, -0.05403327941894531, -0.05208587646484375, -0.05013847351074219, -0.048191070556640625, -0.04624366760253906, -0.0442962646484375, -0.04234886169433594, -0.040401458740234375, -0.03845405578613281, -0.03650665283203125, -0.03455924987792969, -0.032611846923828125, -0.030664443969726562, -0.028717041015625, -0.026769638061523438, -0.024822235107421875, -0.022874832153320312, -0.02092742919921875, -0.018980026245117188, -0.017032623291015625, -0.015085220336914062, -0.0131378173828125, -0.011190414428710938, -0.009243011474609375, -0.0072956085205078125, -0.00534820556640625, -0.0034008026123046875, -0.001453399658203125, 0.0004940032958984375, 0.00244140625, 0.0043888092041015625, 0.006336212158203125, 0.008283615112304688, 0.01023101806640625, 0.012178421020507812, 0.014125823974609375, 0.016073226928710938, 0.0180206298828125, 0.019968032836914062, 0.021915435791015625, 0.023862838745117188, 0.02581024169921875, 0.027757644653320312, 0.029705047607421875, 0.03165245056152344, 0.033599853515625, 0.03554725646972656, 0.037494659423828125, 0.03944206237792969, 0.04138946533203125, 0.04333686828613281, 0.045284271240234375, 0.04723167419433594, 0.0491790771484375, 0.05112648010253906, 0.053073883056640625, 0.05502128601074219, 0.05696868896484375, 0.05891609191894531, 0.060863494873046875, 0.06281089782714844, 0.06475830078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 3.0, 10.0, 8.0, 13.0, 16.0, 19.0, 26.0, 31.0, 42.0, 28.0, 36.0, 35.0, 33.0, 53.0, 57.0, 38.0, 44.0, 41.0, 45.0, 48.0, 44.0, 36.0, 44.0, 36.0, 30.0, 29.0, 27.0, 24.0, 13.0, 18.0, 11.0, 11.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.04991292953491211, -0.04843425750732422, -0.04695558547973633, -0.04547691345214844, -0.04399824142456055, -0.042519569396972656, -0.041040897369384766, -0.039562225341796875, -0.038083553314208984, -0.036604881286621094, -0.0351262092590332, -0.03364753723144531, -0.03216886520385742, -0.03069019317626953, -0.02921152114868164, -0.02773284912109375, -0.02625417709350586, -0.02477550506591797, -0.023296833038330078, -0.021818161010742188, -0.020339488983154297, -0.018860816955566406, -0.017382144927978516, -0.015903472900390625, -0.014424800872802734, -0.012946128845214844, -0.011467456817626953, -0.009988784790039062, -0.008510112762451172, -0.007031440734863281, -0.005552768707275391, -0.0040740966796875, -0.0025954246520996094, -0.0011167526245117188, 0.0003619194030761719, 0.0018405914306640625, 0.003319263458251953, 0.004797935485839844, 0.006276607513427734, 0.007755279541015625, 0.009233951568603516, 0.010712623596191406, 0.012191295623779297, 0.013669967651367188, 0.015148639678955078, 0.01662731170654297, 0.01810598373413086, 0.01958465576171875, 0.02106332778930664, 0.02254199981689453, 0.024020671844482422, 0.025499343872070312, 0.026978015899658203, 0.028456687927246094, 0.029935359954833984, 0.031414031982421875, 0.032892704010009766, 0.034371376037597656, 0.03585004806518555, 0.03732872009277344, 0.03880739212036133, 0.04028606414794922, 0.04176473617553711, 0.043243408203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 19.0, 15.0, 31.0, 62.0, 75.0, 122.0, 188.0, 344.0, 691.0, 1335.0, 2809.0, 6705.0, 17524.0, 52284.0, 172968.0, 648075.0, 1999847.0, 942762.0, 239090.0, 70867.0, 23022.0, 8512.0, 3456.0, 1646.0, 775.0, 438.0, 239.0, 142.0, 85.0, 54.0, 35.0, 19.0, 17.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07196044921875, -0.06935596466064453, -0.06675148010253906, -0.0641469955444336, -0.061542510986328125, -0.058938026428222656, -0.05633354187011719, -0.05372905731201172, -0.05112457275390625, -0.04852008819580078, -0.04591560363769531, -0.043311119079589844, -0.040706634521484375, -0.038102149963378906, -0.03549766540527344, -0.03289318084716797, -0.0302886962890625, -0.02768421173095703, -0.025079727172851562, -0.022475242614746094, -0.019870758056640625, -0.017266273498535156, -0.014661788940429688, -0.012057304382324219, -0.00945281982421875, -0.006848335266113281, -0.0042438507080078125, -0.0016393661499023438, 0.000965118408203125, 0.0035696029663085938, 0.0061740875244140625, 0.008778572082519531, 0.011383056640625, 0.013987541198730469, 0.016592025756835938, 0.019196510314941406, 0.021800994873046875, 0.024405479431152344, 0.027009963989257812, 0.02961444854736328, 0.03221893310546875, 0.03482341766357422, 0.03742790222167969, 0.040032386779785156, 0.042636871337890625, 0.045241355895996094, 0.04784584045410156, 0.05045032501220703, 0.0530548095703125, 0.05565929412841797, 0.05826377868652344, 0.060868263244628906, 0.06347274780273438, 0.06607723236083984, 0.06868171691894531, 0.07128620147705078, 0.07389068603515625, 0.07649517059326172, 0.07909965515136719, 0.08170413970947266, 0.08430862426757812, 0.0869131088256836, 0.08951759338378906, 0.09212207794189453, 0.0947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 9.0, 14.0, 17.0, 31.0, 48.0, 54.0, 96.0, 118.0, 189.0, 281.0, 423.0, 582.0, 676.0, 512.0, 350.0, 194.0, 135.0, 109.0, 77.0, 58.0, 27.0, 16.0, 10.0, 11.0, 6.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072021484375, -0.06878471374511719, -0.06554794311523438, -0.06231117248535156, -0.05907440185546875, -0.05583763122558594, -0.052600860595703125, -0.04936408996582031, -0.0461273193359375, -0.04289054870605469, -0.039653778076171875, -0.03641700744628906, -0.03318023681640625, -0.029943466186523438, -0.026706695556640625, -0.023469924926757812, -0.020233154296875, -0.016996383666992188, -0.013759613037109375, -0.010522842407226562, -0.00728607177734375, -0.0040493011474609375, -0.000812530517578125, 0.0024242401123046875, 0.0056610107421875, 0.008897781372070312, 0.012134552001953125, 0.015371322631835938, 0.01860809326171875, 0.021844863891601562, 0.025081634521484375, 0.028318405151367188, 0.03155517578125, 0.03479194641113281, 0.038028717041015625, 0.04126548767089844, 0.04450225830078125, 0.04773902893066406, 0.050975799560546875, 0.05421257019042969, 0.0574493408203125, 0.06068611145019531, 0.06392288208007812, 0.06715965270996094, 0.07039642333984375, 0.07363319396972656, 0.07686996459960938, 0.08010673522949219, 0.083343505859375, 0.08658027648925781, 0.08981704711914062, 0.09305381774902344, 0.09629058837890625, 0.09952735900878906, 0.10276412963867188, 0.10600090026855469, 0.1092376708984375, 0.11247444152832031, 0.11571121215820312, 0.11894798278808594, 0.12218475341796875, 0.12542152404785156, 0.12865829467773438, 0.1318950653076172, 0.1351318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 24.0, 38.0, 56.0, 64.0, 87.0, 140.0, 126.0, 140.0, 114.0, 65.0, 45.0, 30.0, 19.0, 11.0, 12.0, 5.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4022735357284546, -0.38456782698631287, -0.36686211824417114, -0.3491564095020294, -0.3314507007598877, -0.31374502182006836, -0.29603931307792664, -0.2783336043357849, -0.2606278955936432, -0.24292218685150146, -0.22521647810935974, -0.2075107842683792, -0.1898050755262375, -0.17209936678409576, -0.15439367294311523, -0.1366879642009735, -0.11898225545883179, -0.10127654671669006, -0.08357084542512894, -0.06586514413356781, -0.048159435391426086, -0.030453726649284363, -0.012748025357723236, 0.004957675933837891, 0.022663384675979614, 0.04036908969283104, 0.058074794709682465, 0.07578049600124359, 0.09348620474338531, 0.11119191348552704, 0.12889760732650757, 0.1466033160686493, 0.16430902481079102, 0.18201473355293274, 0.19972044229507446, 0.217426136136055, 0.23513184487819672, 0.25283753871917725, 0.27054324746131897, 0.2882489562034607, 0.3059546649456024, 0.32366037368774414, 0.34136608242988586, 0.3590717911720276, 0.3767774701118469, 0.39448320865631104, 0.41218888759613037, 0.4298945963382721, 0.4476003050804138, 0.46530601382255554, 0.48301172256469727, 0.5007174015045166, 0.5184231400489807, 0.5361288189888, 0.5538345575332642, 0.5715402364730835, 0.5892459154129028, 0.6069515943527222, 0.6246573328971863, 0.6423630118370056, 0.6600687503814697, 0.6777744293212891, 0.6954801678657532, 0.7131858468055725, 0.7308915853500366]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 7.0, 8.0, 23.0, 12.0, 13.0, 20.0, 21.0, 22.0, 32.0, 28.0, 37.0, 34.0, 29.0, 46.0, 38.0, 44.0, 41.0, 39.0, 40.0, 38.0, 42.0, 40.0, 44.0, 37.0, 35.0, 22.0, 34.0, 12.0, 26.0, 21.0, 21.0, 11.0, 11.0, 18.0, 6.0, 8.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28799694776535034, -0.27979883551597595, -0.27160075306892395, -0.26340264081954956, -0.25520452857017517, -0.24700643122196198, -0.23880833387374878, -0.2306102216243744, -0.222412109375, -0.2142140120267868, -0.20601589977741241, -0.19781780242919922, -0.18961969017982483, -0.18142159283161163, -0.17322349548339844, -0.16502538323402405, -0.15682728588581085, -0.14862918853759766, -0.14043107628822327, -0.13223297894001007, -0.12403486669063568, -0.11583676934242249, -0.10763866454362869, -0.0994405597448349, -0.09124245494604111, -0.08304435014724731, -0.07484624534845352, -0.06664814054965973, -0.058450039476156235, -0.05025193467736244, -0.04205383360385895, -0.033855728805065155, -0.025657624006271362, -0.01745951920747757, -0.009261416271328926, -0.0010633133351802826, 0.00713479146361351, 0.015332896262407303, 0.023530997335910797, 0.03172910213470459, 0.03992720693349838, 0.048125311732292175, 0.05632341653108597, 0.06452152132987976, 0.07271961867809296, 0.08091773092746735, 0.08911582827568054, 0.09731393307447433, 0.10551203787326813, 0.11371014267206192, 0.12190824747085571, 0.1301063448190689, 0.1383044570684433, 0.1465025544166565, 0.15470066666603088, 0.16289876401424408, 0.17109686136245728, 0.17929495871067047, 0.18749307096004486, 0.19569116830825806, 0.20388928055763245, 0.21208737790584564, 0.22028547525405884, 0.22848358750343323, 0.23668169975280762]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 29.0, 36.0, 45.0, 102.0, 139.0, 217.0, 360.0, 688.0, 1176.0, 2040.0, 3972.0, 7334.0, 13932.0, 26706.0, 50431.0, 95767.0, 173658.0, 243074.0, 194441.0, 110266.0, 58678.0, 30927.0, 16049.0, 8476.0, 4464.0, 2421.0, 1256.0, 749.0, 420.0, 262.0, 142.0, 101.0, 55.0, 39.0, 22.0, 20.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09381675720214844, -0.09064865112304688, -0.08748054504394531, -0.08431243896484375, -0.08114433288574219, -0.07797622680664062, -0.07480812072753906, -0.0716400146484375, -0.06847190856933594, -0.06530380249023438, -0.06213569641113281, -0.05896759033203125, -0.05579948425292969, -0.052631378173828125, -0.04946327209472656, -0.046295166015625, -0.04312705993652344, -0.039958953857421875, -0.03679084777832031, -0.03362274169921875, -0.030454635620117188, -0.027286529541015625, -0.024118423461914062, -0.0209503173828125, -0.017782211303710938, -0.014614105224609375, -0.011445999145507812, -0.00827789306640625, -0.0051097869873046875, -0.001941680908203125, 0.0012264251708984375, 0.00439453125, 0.0075626373291015625, 0.010730743408203125, 0.013898849487304688, 0.01706695556640625, 0.020235061645507812, 0.023403167724609375, 0.026571273803710938, 0.0297393798828125, 0.03290748596191406, 0.036075592041015625, 0.03924369812011719, 0.04241180419921875, 0.04557991027832031, 0.048748016357421875, 0.05191612243652344, 0.055084228515625, 0.05825233459472656, 0.061420440673828125, 0.06458854675292969, 0.06775665283203125, 0.07092475891113281, 0.07409286499023438, 0.07726097106933594, 0.0804290771484375, 0.08359718322753906, 0.08676528930664062, 0.08993339538574219, 0.09310150146484375, 0.09626960754394531, 0.09943771362304688, 0.10260581970214844, 0.10577392578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 9.0, 13.0, 17.0, 19.0, 24.0, 21.0, 23.0, 26.0, 38.0, 39.0, 48.0, 44.0, 33.0, 30.0, 43.0, 45.0, 33.0, 46.0, 39.0, 36.0, 38.0, 36.0, 35.0, 35.0, 33.0, 25.0, 23.0, 17.0, 17.0, 16.0, 8.0, 9.0, 9.0, 15.0, 5.0, 8.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.04510498046875, -0.043860435485839844, -0.04261589050292969, -0.04137134552001953, -0.040126800537109375, -0.03888225555419922, -0.03763771057128906, -0.036393165588378906, -0.03514862060546875, -0.033904075622558594, -0.03265953063964844, -0.03141498565673828, -0.030170440673828125, -0.02892589569091797, -0.027681350708007812, -0.026436805725097656, -0.0251922607421875, -0.023947715759277344, -0.022703170776367188, -0.02145862579345703, -0.020214080810546875, -0.01896953582763672, -0.017724990844726562, -0.016480445861816406, -0.01523590087890625, -0.013991355895996094, -0.012746810913085938, -0.011502265930175781, -0.010257720947265625, -0.009013175964355469, -0.0077686309814453125, -0.006524085998535156, -0.005279541015625, -0.004034996032714844, -0.0027904510498046875, -0.0015459060668945312, -0.000301361083984375, 0.0009431838989257812, 0.0021877288818359375, 0.0034322738647460938, 0.00467681884765625, 0.005921363830566406, 0.0071659088134765625, 0.008410453796386719, 0.009654998779296875, 0.010899543762207031, 0.012144088745117188, 0.013388633728027344, 0.0146331787109375, 0.015877723693847656, 0.017122268676757812, 0.01836681365966797, 0.019611358642578125, 0.02085590362548828, 0.022100448608398438, 0.023344993591308594, 0.02458953857421875, 0.025834083557128906, 0.027078628540039062, 0.02832317352294922, 0.029567718505859375, 0.03081226348876953, 0.03205680847167969, 0.033301353454589844, 0.0345458984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 10.0, 11.0, 13.0, 20.0, 21.0, 34.0, 46.0, 56.0, 92.0, 128.0, 195.0, 294.0, 591.0, 1243.0, 3085.0, 8199.0, 24323.0, 69404.0, 177560.0, 328375.0, 258385.0, 112382.0, 41053.0, 14185.0, 5007.0, 1928.0, 790.0, 378.0, 222.0, 180.0, 99.0, 71.0, 43.0, 43.0, 24.0, 13.0, 18.0, 10.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.146728515625, -0.1426239013671875, -0.138519287109375, -0.1344146728515625, -0.13031005859375, -0.1262054443359375, -0.122100830078125, -0.1179962158203125, -0.1138916015625, -0.1097869873046875, -0.105682373046875, -0.1015777587890625, -0.09747314453125, -0.0933685302734375, -0.089263916015625, -0.0851593017578125, -0.0810546875, -0.0769500732421875, -0.072845458984375, -0.0687408447265625, -0.06463623046875, -0.0605316162109375, -0.056427001953125, -0.0523223876953125, -0.0482177734375, -0.0441131591796875, -0.040008544921875, -0.0359039306640625, -0.03179931640625, -0.0276947021484375, -0.023590087890625, -0.0194854736328125, -0.015380859375, -0.0112762451171875, -0.007171630859375, -0.0030670166015625, 0.00103759765625, 0.0051422119140625, 0.009246826171875, 0.0133514404296875, 0.0174560546875, 0.0215606689453125, 0.025665283203125, 0.0297698974609375, 0.03387451171875, 0.0379791259765625, 0.042083740234375, 0.0461883544921875, 0.05029296875, 0.0543975830078125, 0.058502197265625, 0.0626068115234375, 0.06671142578125, 0.0708160400390625, 0.074920654296875, 0.0790252685546875, 0.0831298828125, 0.0872344970703125, 0.091339111328125, 0.0954437255859375, 0.09954833984375, 0.1036529541015625, 0.107757568359375, 0.1118621826171875, 0.115966796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 5.0, 5.0, 9.0, 13.0, 13.0, 17.0, 15.0, 18.0, 21.0, 24.0, 31.0, 31.0, 33.0, 32.0, 31.0, 47.0, 40.0, 54.0, 47.0, 30.0, 43.0, 30.0, 49.0, 28.0, 35.0, 31.0, 28.0, 39.0, 23.0, 24.0, 14.0, 23.0, 20.0, 19.0, 14.0, 11.0, 13.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.10986328125, -0.1063222885131836, -0.10278129577636719, -0.09924030303955078, -0.09569931030273438, -0.09215831756591797, -0.08861732482910156, -0.08507633209228516, -0.08153533935546875, -0.07799434661865234, -0.07445335388183594, -0.07091236114501953, -0.06737136840820312, -0.06383037567138672, -0.06028938293457031, -0.056748390197753906, -0.0532073974609375, -0.049666404724121094, -0.04612541198730469, -0.04258441925048828, -0.039043426513671875, -0.03550243377685547, -0.03196144104003906, -0.028420448303222656, -0.02487945556640625, -0.021338462829589844, -0.017797470092773438, -0.014256477355957031, -0.010715484619140625, -0.007174491882324219, -0.0036334991455078125, -9.250640869140625e-05, 0.003448486328125, 0.006989479064941406, 0.010530471801757812, 0.014071464538574219, 0.017612457275390625, 0.02115345001220703, 0.024694442749023438, 0.028235435485839844, 0.03177642822265625, 0.035317420959472656, 0.03885841369628906, 0.04239940643310547, 0.045940399169921875, 0.04948139190673828, 0.05302238464355469, 0.056563377380371094, 0.0601043701171875, 0.0636453628540039, 0.06718635559082031, 0.07072734832763672, 0.07426834106445312, 0.07780933380126953, 0.08135032653808594, 0.08489131927490234, 0.08843231201171875, 0.09197330474853516, 0.09551429748535156, 0.09905529022216797, 0.10259628295898438, 0.10613727569580078, 0.10967826843261719, 0.1132192611694336, 0.11676025390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 11.0, 16.0, 38.0, 39.0, 65.0, 102.0, 151.0, 276.0, 425.0, 707.0, 1307.0, 2226.0, 4165.0, 7480.0, 13232.0, 23322.0, 41841.0, 79864.0, 160318.0, 250398.0, 215385.0, 115722.0, 58322.0, 31782.0, 18035.0, 10192.0, 5897.0, 3039.0, 1742.0, 1006.0, 536.0, 325.0, 195.0, 135.0, 63.0, 51.0, 40.0, 26.0, 17.0, 10.0, 11.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03326416015625, -0.03224897384643555, -0.031233787536621094, -0.03021860122680664, -0.029203414916992188, -0.028188228607177734, -0.02717304229736328, -0.026157855987548828, -0.025142669677734375, -0.024127483367919922, -0.02311229705810547, -0.022097110748291016, -0.021081924438476562, -0.02006673812866211, -0.019051551818847656, -0.018036365509033203, -0.01702117919921875, -0.016005992889404297, -0.014990806579589844, -0.01397562026977539, -0.012960433959960938, -0.011945247650146484, -0.010930061340332031, -0.009914875030517578, -0.008899688720703125, -0.007884502410888672, -0.006869316101074219, -0.005854129791259766, -0.0048389434814453125, -0.0038237571716308594, -0.0028085708618164062, -0.0017933845520019531, -0.0007781982421875, 0.00023698806762695312, 0.0012521743774414062, 0.0022673606872558594, 0.0032825469970703125, 0.004297733306884766, 0.005312919616699219, 0.006328105926513672, 0.007343292236328125, 0.008358478546142578, 0.009373664855957031, 0.010388851165771484, 0.011404037475585938, 0.01241922378540039, 0.013434410095214844, 0.014449596405029297, 0.01546478271484375, 0.016479969024658203, 0.017495155334472656, 0.01851034164428711, 0.019525527954101562, 0.020540714263916016, 0.02155590057373047, 0.022571086883544922, 0.023586273193359375, 0.024601459503173828, 0.02561664581298828, 0.026631832122802734, 0.027647018432617188, 0.02866220474243164, 0.029677391052246094, 0.030692577362060547, 0.031707763671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 8.0, 15.0, 14.0, 9.0, 15.0, 10.0, 21.0, 28.0, 24.0, 28.0, 37.0, 31.0, 57.0, 46.0, 59.0, 60.0, 70.0, 47.0, 50.0, 46.0, 49.0, 48.0, 33.0, 34.0, 23.0, 21.0, 21.0, 14.0, 14.0, 7.0, 8.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4483928680419922e-05, -1.4085322618484497e-05, -1.3686716556549072e-05, -1.3288110494613647e-05, -1.2889504432678223e-05, -1.2490898370742798e-05, -1.2092292308807373e-05, -1.1693686246871948e-05, -1.1295080184936523e-05, -1.0896474123001099e-05, -1.0497868061065674e-05, -1.0099261999130249e-05, -9.700655937194824e-06, -9.3020498752594e-06, -8.903443813323975e-06, -8.50483775138855e-06, -8.106231689453125e-06, -7.7076256275177e-06, -7.309019565582275e-06, -6.910413503646851e-06, -6.511807441711426e-06, -6.113201379776001e-06, -5.714595317840576e-06, -5.315989255905151e-06, -4.9173831939697266e-06, -4.518777132034302e-06, -4.120171070098877e-06, -3.721565008163452e-06, -3.3229589462280273e-06, -2.9243528842926025e-06, -2.5257468223571777e-06, -2.127140760421753e-06, -1.7285346984863281e-06, -1.3299286365509033e-06, -9.313225746154785e-07, -5.327165126800537e-07, -1.341104507446289e-07, 2.644956111907959e-07, 6.631016731262207e-07, 1.0617077350616455e-06, 1.4603137969970703e-06, 1.8589198589324951e-06, 2.25752592086792e-06, 2.6561319828033447e-06, 3.0547380447387695e-06, 3.4533441066741943e-06, 3.851950168609619e-06, 4.250556230545044e-06, 4.649162292480469e-06, 5.0477683544158936e-06, 5.446374416351318e-06, 5.844980478286743e-06, 6.243586540222168e-06, 6.642192602157593e-06, 7.040798664093018e-06, 7.439404726028442e-06, 7.838010787963867e-06, 8.236616849899292e-06, 8.635222911834717e-06, 9.033828973770142e-06, 9.432435035705566e-06, 9.831041097640991e-06, 1.0229647159576416e-05, 1.062825322151184e-05, 1.1026859283447266e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 5.0, 12.0, 13.0, 26.0, 31.0, 59.0, 76.0, 121.0, 203.0, 434.0, 787.0, 1627.0, 3577.0, 7978.0, 16426.0, 34010.0, 72999.0, 192305.0, 358457.0, 210199.0, 79408.0, 36289.0, 17507.0, 8337.0, 3947.0, 1818.0, 850.0, 441.0, 215.0, 128.0, 90.0, 48.0, 37.0, 20.0, 13.0, 16.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040130615234375, -0.03885841369628906, -0.037586212158203125, -0.03631401062011719, -0.03504180908203125, -0.03376960754394531, -0.032497406005859375, -0.031225204467773438, -0.0299530029296875, -0.028680801391601562, -0.027408599853515625, -0.026136398315429688, -0.02486419677734375, -0.023591995239257812, -0.022319793701171875, -0.021047592163085938, -0.019775390625, -0.018503189086914062, -0.017230987548828125, -0.015958786010742188, -0.01468658447265625, -0.013414382934570312, -0.012142181396484375, -0.010869979858398438, -0.0095977783203125, -0.008325576782226562, -0.007053375244140625, -0.0057811737060546875, -0.00450897216796875, -0.0032367706298828125, -0.001964569091796875, -0.0006923675537109375, 0.000579833984375, 0.0018520355224609375, 0.003124237060546875, 0.0043964385986328125, 0.00566864013671875, 0.0069408416748046875, 0.008213043212890625, 0.009485244750976562, 0.0107574462890625, 0.012029647827148438, 0.013301849365234375, 0.014574050903320312, 0.01584625244140625, 0.017118453979492188, 0.018390655517578125, 0.019662857055664062, 0.02093505859375, 0.022207260131835938, 0.023479461669921875, 0.024751663208007812, 0.02602386474609375, 0.027296066284179688, 0.028568267822265625, 0.029840469360351562, 0.0311126708984375, 0.03238487243652344, 0.033657073974609375, 0.03492927551269531, 0.03620147705078125, 0.03747367858886719, 0.038745880126953125, 0.04001808166503906, 0.041290283203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 0.0, 3.0, 7.0, 5.0, 8.0, 10.0, 16.0, 18.0, 15.0, 21.0, 29.0, 33.0, 27.0, 51.0, 41.0, 50.0, 82.0, 76.0, 62.0, 59.0, 55.0, 49.0, 55.0, 41.0, 34.0, 28.0, 27.0, 23.0, 14.0, 17.0, 10.0, 3.0, 4.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03125, -0.03022623062133789, -0.02920246124267578, -0.028178691864013672, -0.027154922485351562, -0.026131153106689453, -0.025107383728027344, -0.024083614349365234, -0.023059844970703125, -0.022036075592041016, -0.021012306213378906, -0.019988536834716797, -0.018964767456054688, -0.017940998077392578, -0.01691722869873047, -0.01589345932006836, -0.01486968994140625, -0.01384592056274414, -0.012822151184082031, -0.011798381805419922, -0.010774612426757812, -0.009750843048095703, -0.008727073669433594, -0.007703304290771484, -0.006679534912109375, -0.005655765533447266, -0.004631996154785156, -0.003608226776123047, -0.0025844573974609375, -0.0015606880187988281, -0.0005369186401367188, 0.0004868507385253906, 0.0015106201171875, 0.0025343894958496094, 0.0035581588745117188, 0.004581928253173828, 0.0056056976318359375, 0.006629467010498047, 0.007653236389160156, 0.008677005767822266, 0.009700775146484375, 0.010724544525146484, 0.011748313903808594, 0.012772083282470703, 0.013795852661132812, 0.014819622039794922, 0.01584339141845703, 0.01686716079711914, 0.01789093017578125, 0.01891469955444336, 0.01993846893310547, 0.020962238311767578, 0.021986007690429688, 0.023009777069091797, 0.024033546447753906, 0.025057315826416016, 0.026081085205078125, 0.027104854583740234, 0.028128623962402344, 0.029152393341064453, 0.030176162719726562, 0.031199932098388672, 0.03222370147705078, 0.03324747085571289, 0.034271240234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 4.0, 17.0, 17.0, 34.0, 30.0, 60.0, 78.0, 78.0, 87.0, 103.0, 108.0, 90.0, 79.0, 61.0, 42.0, 29.0, 25.0, 15.0, 15.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46429601311683655, -0.4510050415992737, -0.4377140998840332, -0.42442312836647034, -0.41113215684890747, -0.3978411853313446, -0.38455021381378174, -0.37125927209854126, -0.3579683005809784, -0.3446773290634155, -0.33138638734817505, -0.3180954158306122, -0.3048044443130493, -0.29151347279548645, -0.2782225012779236, -0.2649315595626831, -0.25164058804512024, -0.23834961652755737, -0.2250586599111557, -0.21176770329475403, -0.19847673177719116, -0.1851857602596283, -0.17189480364322662, -0.15860384702682495, -0.14531287550926208, -0.13202190399169922, -0.11873094737529755, -0.10543998330831528, -0.09214901924133301, -0.07885805517435074, -0.06556709110736847, -0.0522761270403862, -0.03898513317108154, -0.025694169104099274, -0.012403205037117004, 0.0008877590298652649, 0.014178723096847534, 0.027469687163829803, 0.04076065123081207, 0.05405161529779434, 0.06734257936477661, 0.08063354343175888, 0.09392450749874115, 0.10721547156572342, 0.12050643563270569, 0.13379740715026855, 0.14708836376667023, 0.1603793203830719, 0.17367029190063477, 0.18696126341819763, 0.2002522200345993, 0.21354317665100098, 0.22683414816856384, 0.2401251196861267, 0.2534160614013672, 0.26670703291893005, 0.2799980044364929, 0.2932889759540558, 0.30657994747161865, 0.31987088918685913, 0.333161860704422, 0.34645283222198486, 0.35974377393722534, 0.3730347454547882, 0.3863257169723511]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 5.0, 9.0, 10.0, 7.0, 23.0, 15.0, 20.0, 18.0, 16.0, 21.0, 22.0, 45.0, 36.0, 41.0, 45.0, 37.0, 34.0, 45.0, 43.0, 33.0, 47.0, 51.0, 56.0, 31.0, 32.0, 26.0, 25.0, 21.0, 25.0, 23.0, 14.0, 21.0, 20.0, 10.0, 15.0, 7.0, 7.0, 3.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31429964303970337, -0.30414900183677673, -0.2939983904361725, -0.28384774923324585, -0.2736971378326416, -0.26354649662971497, -0.2533958852291107, -0.24324524402618408, -0.23309463262557983, -0.2229440063238144, -0.21279338002204895, -0.2026427537202835, -0.19249212741851807, -0.18234150111675262, -0.17219087481498718, -0.16204023361206055, -0.1518896073102951, -0.14173898100852966, -0.13158835470676422, -0.12143772840499878, -0.11128710210323334, -0.1011364758014679, -0.09098584204912186, -0.08083521574735641, -0.07068458944559097, -0.06053396314382553, -0.05038333684206009, -0.04023270681500435, -0.030082080513238907, -0.019931454211473465, -0.009780824184417725, 0.0003698021173477173, 0.01052042841911316, 0.0206710547208786, 0.030821682885289192, 0.04097231104969978, 0.051122937351465225, 0.06127356365323067, 0.07142419368028641, 0.08157481998205185, 0.09172544628381729, 0.10187607258558273, 0.11202669888734818, 0.12217733263969421, 0.13232795894145966, 0.1424785852432251, 0.15262921154499054, 0.16277983784675598, 0.17293046414852142, 0.18308109045028687, 0.1932317167520523, 0.20338234305381775, 0.2135329693555832, 0.22368359565734863, 0.23383423686027527, 0.24398484826087952, 0.25413548946380615, 0.2642861306667328, 0.27443674206733704, 0.28458738327026367, 0.2947379946708679, 0.30488863587379456, 0.3150392472743988, 0.32518988847732544, 0.3353404998779297]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 10.0, 8.0, 23.0, 26.0, 45.0, 65.0, 120.0, 212.0, 371.0, 590.0, 1057.0, 2203.0, 4762.0, 10672.0, 26765.0, 74117.0, 254300.0, 1088637.0, 1922876.0, 580901.0, 145769.0, 47399.0, 18269.0, 7757.0, 3585.0, 1671.0, 865.0, 490.0, 280.0, 135.0, 96.0, 45.0, 45.0, 21.0, 22.0, 13.0, 10.0, 5.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0701904296875, -0.0677938461303711, -0.06539726257324219, -0.06300067901611328, -0.060604095458984375, -0.05820751190185547, -0.05581092834472656, -0.053414344787597656, -0.05101776123046875, -0.048621177673339844, -0.04622459411621094, -0.04382801055908203, -0.041431427001953125, -0.03903484344482422, -0.03663825988769531, -0.034241676330566406, -0.0318450927734375, -0.029448509216308594, -0.027051925659179688, -0.02465534210205078, -0.022258758544921875, -0.01986217498779297, -0.017465591430664062, -0.015069007873535156, -0.01267242431640625, -0.010275840759277344, -0.007879257202148438, -0.005482673645019531, -0.003086090087890625, -0.0006895065307617188, 0.0017070770263671875, 0.004103660583496094, 0.006500244140625, 0.008896827697753906, 0.011293411254882812, 0.013689994812011719, 0.016086578369140625, 0.01848316192626953, 0.020879745483398438, 0.023276329040527344, 0.02567291259765625, 0.028069496154785156, 0.030466079711914062, 0.03286266326904297, 0.035259246826171875, 0.03765583038330078, 0.04005241394042969, 0.042448997497558594, 0.0448455810546875, 0.047242164611816406, 0.04963874816894531, 0.05203533172607422, 0.054431915283203125, 0.05682849884033203, 0.05922508239746094, 0.061621665954589844, 0.06401824951171875, 0.06641483306884766, 0.06881141662597656, 0.07120800018310547, 0.07360458374023438, 0.07600116729736328, 0.07839775085449219, 0.0807943344116211, 0.08319091796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 11.0, 11.0, 12.0, 12.0, 10.0, 19.0, 20.0, 22.0, 22.0, 23.0, 26.0, 29.0, 40.0, 37.0, 34.0, 37.0, 43.0, 39.0, 47.0, 31.0, 46.0, 39.0, 37.0, 40.0, 30.0, 32.0, 27.0, 30.0, 23.0, 25.0, 20.0, 14.0, 12.0, 13.0, 14.0, 11.0, 14.0, 5.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.040435791015625, -0.03916358947753906, -0.037891387939453125, -0.03661918640136719, -0.03534698486328125, -0.03407478332519531, -0.032802581787109375, -0.03153038024902344, -0.0302581787109375, -0.028985977172851562, -0.027713775634765625, -0.026441574096679688, -0.02516937255859375, -0.023897171020507812, -0.022624969482421875, -0.021352767944335938, -0.02008056640625, -0.018808364868164062, -0.017536163330078125, -0.016263961791992188, -0.01499176025390625, -0.013719558715820312, -0.012447357177734375, -0.011175155639648438, -0.0099029541015625, -0.008630752563476562, -0.007358551025390625, -0.0060863494873046875, -0.00481414794921875, -0.0035419464111328125, -0.002269744873046875, -0.0009975433349609375, 0.000274658203125, 0.0015468597412109375, 0.002819061279296875, 0.0040912628173828125, 0.00536346435546875, 0.0066356658935546875, 0.007907867431640625, 0.009180068969726562, 0.0104522705078125, 0.011724472045898438, 0.012996673583984375, 0.014268875122070312, 0.01554107666015625, 0.016813278198242188, 0.018085479736328125, 0.019357681274414062, 0.0206298828125, 0.021902084350585938, 0.023174285888671875, 0.024446487426757812, 0.02571868896484375, 0.026990890502929688, 0.028263092041015625, 0.029535293579101562, 0.0308074951171875, 0.03207969665527344, 0.033351898193359375, 0.03462409973144531, 0.03589630126953125, 0.03716850280761719, 0.038440704345703125, 0.03971290588378906, 0.040985107421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 3.0, 12.0, 14.0, 21.0, 17.0, 39.0, 75.0, 121.0, 174.0, 342.0, 684.0, 1443.0, 3458.0, 9306.0, 28766.0, 100911.0, 402466.0, 1731385.0, 1463225.0, 329133.0, 84492.0, 24454.0, 7921.0, 3066.0, 1350.0, 621.0, 308.0, 175.0, 90.0, 65.0, 35.0, 29.0, 17.0, 15.0, 9.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.09820556640625, -0.09512996673583984, -0.09205436706542969, -0.08897876739501953, -0.08590316772460938, -0.08282756805419922, -0.07975196838378906, -0.0766763687133789, -0.07360076904296875, -0.0705251693725586, -0.06744956970214844, -0.06437397003173828, -0.061298370361328125, -0.05822277069091797, -0.05514717102050781, -0.052071571350097656, -0.0489959716796875, -0.045920372009277344, -0.04284477233886719, -0.03976917266845703, -0.036693572998046875, -0.03361797332763672, -0.030542373657226562, -0.027466773986816406, -0.02439117431640625, -0.021315574645996094, -0.018239974975585938, -0.015164375305175781, -0.012088775634765625, -0.009013175964355469, -0.0059375762939453125, -0.0028619766235351562, 0.000213623046875, 0.0032892227172851562, 0.0063648223876953125, 0.009440422058105469, 0.012516021728515625, 0.015591621398925781, 0.018667221069335938, 0.021742820739746094, 0.02481842041015625, 0.027894020080566406, 0.030969619750976562, 0.03404521942138672, 0.037120819091796875, 0.04019641876220703, 0.04327201843261719, 0.046347618103027344, 0.0494232177734375, 0.052498817443847656, 0.05557441711425781, 0.05865001678466797, 0.061725616455078125, 0.06480121612548828, 0.06787681579589844, 0.0709524154663086, 0.07402801513671875, 0.0771036148071289, 0.08017921447753906, 0.08325481414794922, 0.08633041381835938, 0.08940601348876953, 0.09248161315917969, 0.09555721282958984, 0.0986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 4.0, 19.0, 22.0, 20.0, 47.0, 57.0, 82.0, 136.0, 197.0, 328.0, 565.0, 686.0, 620.0, 430.0, 281.0, 192.0, 117.0, 88.0, 55.0, 42.0, 25.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.16162109375, -0.1579303741455078, -0.15423965454101562, -0.15054893493652344, -0.14685821533203125, -0.14316749572753906, -0.13947677612304688, -0.1357860565185547, -0.1320953369140625, -0.1284046173095703, -0.12471389770507812, -0.12102317810058594, -0.11733245849609375, -0.11364173889160156, -0.10995101928710938, -0.10626029968261719, -0.102569580078125, -0.09887886047363281, -0.09518814086914062, -0.09149742126464844, -0.08780670166015625, -0.08411598205566406, -0.08042526245117188, -0.07673454284667969, -0.0730438232421875, -0.06935310363769531, -0.06566238403320312, -0.06197166442871094, -0.05828094482421875, -0.05459022521972656, -0.050899505615234375, -0.04720878601074219, -0.04351806640625, -0.03982734680175781, -0.036136627197265625, -0.03244590759277344, -0.02875518798828125, -0.025064468383789062, -0.021373748779296875, -0.017683029174804688, -0.0139923095703125, -0.010301589965820312, -0.006610870361328125, -0.0029201507568359375, 0.00077056884765625, 0.0044612884521484375, 0.008152008056640625, 0.011842727661132812, 0.015533447265625, 0.019224166870117188, 0.022914886474609375, 0.026605606079101562, 0.03029632568359375, 0.03398704528808594, 0.037677764892578125, 0.04136848449707031, 0.0450592041015625, 0.04874992370605469, 0.052440643310546875, 0.05613136291503906, 0.05982208251953125, 0.06351280212402344, 0.06720352172851562, 0.07089424133300781, 0.0745849609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 21.0, 45.0, 76.0, 110.0, 145.0, 150.0, 158.0, 123.0, 71.0, 51.0, 27.0, 15.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953783631324768, -0.17190924286842346, -0.1484401375055313, -0.12497102469205856, -0.10150191187858582, -0.07803279906511307, -0.05456368625164032, -0.03109458088874817, -0.007625460624694824, 0.015843652188777924, 0.03931276500225067, 0.06278187781572342, 0.08625099062919617, 0.10972010344266891, 0.13318921625614166, 0.1566583216190338, 0.18012744188308716, 0.2035965621471405, 0.22706566751003265, 0.2505347728729248, 0.27400389313697815, 0.2974730134010315, 0.32094210386276245, 0.3444112241268158, 0.36788034439086914, 0.3913494646549225, 0.41481858491897583, 0.4382876753807068, 0.46175679564476013, 0.4852259159088135, 0.5086950063705444, 0.5321640968322754, 0.5556333065032959, 0.5791023969650269, 0.6025715470314026, 0.6260406374931335, 0.6495097875595093, 0.6729788780212402, 0.6964479684829712, 0.7199170589447021, 0.7433862090110779, 0.7668552994728088, 0.7903244495391846, 0.8137935400009155, 0.8372626304626465, 0.8607317805290222, 0.8842008709907532, 0.9076700210571289, 0.9311391115188599, 0.9546082019805908, 0.9780773520469666, 1.0015465021133423, 1.0250155925750732, 1.0484846830368042, 1.0719537734985352, 1.0954228639602661, 1.118891954421997, 1.142361044883728, 1.165830135345459, 1.1892993450164795, 1.2127684354782104, 1.2362375259399414, 1.2597066164016724, 1.2831757068634033, 1.3066449165344238]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 14.0, 10.0, 10.0, 18.0, 10.0, 17.0, 27.0, 26.0, 30.0, 32.0, 42.0, 39.0, 24.0, 25.0, 45.0, 37.0, 47.0, 37.0, 50.0, 45.0, 40.0, 44.0, 32.0, 38.0, 37.0, 24.0, 26.0, 28.0, 22.0, 21.0, 16.0, 15.0, 12.0, 12.0, 9.0, 12.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3129574656486511, -0.3040841519832611, -0.2952108383178711, -0.2863375246524811, -0.27746421098709106, -0.26859086751937866, -0.25971755385398865, -0.25084424018859863, -0.24197092652320862, -0.2330976128578186, -0.2242242991924286, -0.21535097062587738, -0.20647765696048737, -0.19760434329509735, -0.18873101472854614, -0.17985770106315613, -0.1709843873977661, -0.1621110737323761, -0.15323776006698608, -0.14436443150043488, -0.13549111783504486, -0.12661780416965485, -0.11774448305368423, -0.10887116193771362, -0.09999784827232361, -0.0911245346069336, -0.08225121349096298, -0.07337789237499237, -0.06450457870960236, -0.05563126131892204, -0.04675794392824173, -0.03788462653756142, -0.029011309146881104, -0.02013799175620079, -0.011264674365520477, -0.002391356974840164, 0.006481960415840149, 0.015355277806520462, 0.024228595197200775, 0.03310191258788109, 0.0419752299785614, 0.050848547369241714, 0.05972186475992203, 0.06859518587589264, 0.07746849954128265, 0.08634181320667267, 0.09521513432264328, 0.10408845543861389, 0.1129617691040039, 0.12183508276939392, 0.13070839643478394, 0.13958172500133514, 0.14845503866672516, 0.15732835233211517, 0.16620168089866638, 0.1750749945640564, 0.1839483082294464, 0.19282162189483643, 0.20169493556022644, 0.21056826412677765, 0.21944157779216766, 0.22831489145755768, 0.2371882200241089, 0.2460615336894989, 0.2549348473548889]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 22.0, 49.0, 76.0, 114.0, 209.0, 378.0, 701.0, 1379.0, 2698.0, 5333.0, 10707.0, 21220.0, 40409.0, 74818.0, 128446.0, 202851.0, 219333.0, 150020.0, 88712.0, 48797.0, 25523.0, 13239.0, 6505.0, 3349.0, 1727.0, 838.0, 459.0, 265.0, 132.0, 79.0, 62.0, 28.0, 28.0, 10.0, 10.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1212158203125, -0.117767333984375, -0.11431884765625, -0.110870361328125, -0.107421875, -0.103973388671875, -0.10052490234375, -0.097076416015625, -0.0936279296875, -0.090179443359375, -0.08673095703125, -0.083282470703125, -0.079833984375, -0.076385498046875, -0.07293701171875, -0.069488525390625, -0.0660400390625, -0.062591552734375, -0.05914306640625, -0.055694580078125, -0.05224609375, -0.048797607421875, -0.04534912109375, -0.041900634765625, -0.0384521484375, -0.035003662109375, -0.03155517578125, -0.028106689453125, -0.024658203125, -0.021209716796875, -0.01776123046875, -0.014312744140625, -0.0108642578125, -0.007415771484375, -0.00396728515625, -0.000518798828125, 0.0029296875, 0.006378173828125, 0.00982666015625, 0.013275146484375, 0.0167236328125, 0.020172119140625, 0.02362060546875, 0.027069091796875, 0.030517578125, 0.033966064453125, 0.03741455078125, 0.040863037109375, 0.0443115234375, 0.047760009765625, 0.05120849609375, 0.054656982421875, 0.05810546875, 0.061553955078125, 0.06500244140625, 0.068450927734375, 0.0718994140625, 0.075347900390625, 0.07879638671875, 0.082244873046875, 0.085693359375, 0.089141845703125, 0.09259033203125, 0.096038818359375, 0.0994873046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 7.0, 9.0, 9.0, 6.0, 6.0, 16.0, 16.0, 13.0, 28.0, 25.0, 22.0, 29.0, 32.0, 30.0, 34.0, 32.0, 36.0, 44.0, 42.0, 49.0, 35.0, 39.0, 38.0, 43.0, 35.0, 26.0, 26.0, 31.0, 31.0, 25.0, 27.0, 16.0, 20.0, 16.0, 19.0, 15.0, 9.0, 12.0, 9.0, 4.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0396728515625, -0.038448333740234375, -0.03722381591796875, -0.035999298095703125, -0.0347747802734375, -0.033550262451171875, -0.03232574462890625, -0.031101226806640625, -0.029876708984375, -0.028652191162109375, -0.02742767333984375, -0.026203155517578125, -0.0249786376953125, -0.023754119873046875, -0.02252960205078125, -0.021305084228515625, -0.02008056640625, -0.018856048583984375, -0.01763153076171875, -0.016407012939453125, -0.0151824951171875, -0.013957977294921875, -0.01273345947265625, -0.011508941650390625, -0.010284423828125, -0.009059906005859375, -0.00783538818359375, -0.006610870361328125, -0.0053863525390625, -0.004161834716796875, -0.00293731689453125, -0.001712799072265625, -0.00048828125, 0.000736236572265625, 0.00196075439453125, 0.003185272216796875, 0.0044097900390625, 0.005634307861328125, 0.00685882568359375, 0.008083343505859375, 0.009307861328125, 0.010532379150390625, 0.01175689697265625, 0.012981414794921875, 0.0142059326171875, 0.015430450439453125, 0.01665496826171875, 0.017879486083984375, 0.01910400390625, 0.020328521728515625, 0.02155303955078125, 0.022777557373046875, 0.0240020751953125, 0.025226593017578125, 0.02645111083984375, 0.027675628662109375, 0.028900146484375, 0.030124664306640625, 0.03134918212890625, 0.032573699951171875, 0.0337982177734375, 0.035022735595703125, 0.03624725341796875, 0.037471771240234375, 0.0386962890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 15.0, 13.0, 32.0, 34.0, 69.0, 62.0, 109.0, 247.0, 414.0, 992.0, 2137.0, 5097.0, 13209.0, 33592.0, 83273.0, 181134.0, 290227.0, 235657.0, 119073.0, 50106.0, 19632.0, 7631.0, 3083.0, 1278.0, 612.0, 336.0, 173.0, 87.0, 75.0, 44.0, 25.0, 17.0, 19.0, 12.0, 7.0, 8.0, 6.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11360645294189453, -0.10935401916503906, -0.1051015853881836, -0.10084915161132812, -0.09659671783447266, -0.09234428405761719, -0.08809185028076172, -0.08383941650390625, -0.07958698272705078, -0.07533454895019531, -0.07108211517333984, -0.06682968139648438, -0.0625772476196289, -0.05832481384277344, -0.05407238006591797, -0.0498199462890625, -0.04556751251220703, -0.04131507873535156, -0.037062644958496094, -0.032810211181640625, -0.028557777404785156, -0.024305343627929688, -0.02005290985107422, -0.01580047607421875, -0.011548042297363281, -0.0072956085205078125, -0.0030431747436523438, 0.001209259033203125, 0.005461692810058594, 0.009714126586914062, 0.013966560363769531, 0.018218994140625, 0.02247142791748047, 0.026723861694335938, 0.030976295471191406, 0.035228729248046875, 0.039481163024902344, 0.04373359680175781, 0.04798603057861328, 0.05223846435546875, 0.05649089813232422, 0.06074333190917969, 0.06499576568603516, 0.06924819946289062, 0.0735006332397461, 0.07775306701660156, 0.08200550079345703, 0.0862579345703125, 0.09051036834716797, 0.09476280212402344, 0.0990152359008789, 0.10326766967773438, 0.10752010345458984, 0.11177253723144531, 0.11602497100830078, 0.12027740478515625, 0.12452983856201172, 0.1287822723388672, 0.13303470611572266, 0.13728713989257812, 0.1415395736694336, 0.14579200744628906, 0.15004444122314453, 0.154296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 3.0, 3.0, 5.0, 12.0, 7.0, 9.0, 8.0, 8.0, 17.0, 7.0, 22.0, 21.0, 28.0, 31.0, 15.0, 35.0, 28.0, 30.0, 34.0, 35.0, 33.0, 40.0, 40.0, 41.0, 45.0, 29.0, 40.0, 30.0, 39.0, 32.0, 29.0, 20.0, 28.0, 23.0, 23.0, 25.0, 10.0, 15.0, 19.0, 13.0, 15.0, 13.0, 8.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.11669921875, -0.11330318450927734, -0.10990715026855469, -0.10651111602783203, -0.10311508178710938, -0.09971904754638672, -0.09632301330566406, -0.0929269790649414, -0.08953094482421875, -0.0861349105834961, -0.08273887634277344, -0.07934284210205078, -0.07594680786132812, -0.07255077362060547, -0.06915473937988281, -0.06575870513916016, -0.0623626708984375, -0.058966636657714844, -0.05557060241699219, -0.05217456817626953, -0.048778533935546875, -0.04538249969482422, -0.04198646545410156, -0.038590431213378906, -0.03519439697265625, -0.031798362731933594, -0.028402328491210938, -0.02500629425048828, -0.021610260009765625, -0.01821422576904297, -0.014818191528320312, -0.011422157287597656, -0.008026123046875, -0.004630088806152344, -0.0012340545654296875, 0.0021619796752929688, 0.005558013916015625, 0.008954048156738281, 0.012350082397460938, 0.015746116638183594, 0.01914215087890625, 0.022538185119628906, 0.025934219360351562, 0.02933025360107422, 0.032726287841796875, 0.03612232208251953, 0.03951835632324219, 0.042914390563964844, 0.0463104248046875, 0.049706459045410156, 0.05310249328613281, 0.05649852752685547, 0.059894561767578125, 0.06329059600830078, 0.06668663024902344, 0.0700826644897461, 0.07347869873046875, 0.0768747329711914, 0.08027076721191406, 0.08366680145263672, 0.08706283569335938, 0.09045886993408203, 0.09385490417480469, 0.09725093841552734, 0.10064697265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 3.0, 7.0, 14.0, 25.0, 27.0, 56.0, 81.0, 113.0, 211.0, 288.0, 519.0, 833.0, 1431.0, 2309.0, 3974.0, 6850.0, 11683.0, 19936.0, 33424.0, 55713.0, 89419.0, 133188.0, 172014.0, 170141.0, 129450.0, 85641.0, 53309.0, 31797.0, 19184.0, 10995.0, 6457.0, 3801.0, 2250.0, 1344.0, 812.0, 467.0, 274.0, 192.0, 109.0, 73.0, 45.0, 30.0, 20.0, 12.0, 8.0, 5.0, 10.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0302581787109375, -0.029340028762817383, -0.028421878814697266, -0.02750372886657715, -0.02658557891845703, -0.025667428970336914, -0.024749279022216797, -0.02383112907409668, -0.022912979125976562, -0.021994829177856445, -0.021076679229736328, -0.02015852928161621, -0.019240379333496094, -0.018322229385375977, -0.01740407943725586, -0.016485929489135742, -0.015567779541015625, -0.014649629592895508, -0.01373147964477539, -0.012813329696655273, -0.011895179748535156, -0.010977029800415039, -0.010058879852294922, -0.009140729904174805, -0.008222579956054688, -0.00730443000793457, -0.006386280059814453, -0.005468130111694336, -0.004549980163574219, -0.0036318302154541016, -0.0027136802673339844, -0.0017955303192138672, -0.00087738037109375, 4.076957702636719e-05, 0.0009589195251464844, 0.0018770694732666016, 0.0027952194213867188, 0.003713369369506836, 0.004631519317626953, 0.00554966926574707, 0.0064678192138671875, 0.007385969161987305, 0.008304119110107422, 0.009222269058227539, 0.010140419006347656, 0.011058568954467773, 0.01197671890258789, 0.012894868850708008, 0.013813018798828125, 0.014731168746948242, 0.01564931869506836, 0.016567468643188477, 0.017485618591308594, 0.01840376853942871, 0.019321918487548828, 0.020240068435668945, 0.021158218383789062, 0.02207636833190918, 0.022994518280029297, 0.023912668228149414, 0.02483081817626953, 0.02574896812438965, 0.026667118072509766, 0.027585268020629883, 0.02850341796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 8.0, 8.0, 12.0, 10.0, 12.0, 13.0, 21.0, 22.0, 16.0, 30.0, 24.0, 28.0, 44.0, 42.0, 42.0, 50.0, 54.0, 68.0, 41.0, 57.0, 41.0, 49.0, 46.0, 23.0, 29.0, 33.0, 20.0, 25.0, 15.0, 9.0, 11.0, 11.0, 9.0, 8.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4781951904296875e-05, -1.4328397810459137e-05, -1.3874843716621399e-05, -1.3421289622783661e-05, -1.2967735528945923e-05, -1.2514181435108185e-05, -1.2060627341270447e-05, -1.1607073247432709e-05, -1.115351915359497e-05, -1.0699965059757233e-05, -1.0246410965919495e-05, -9.792856872081757e-06, -9.339302778244019e-06, -8.88574868440628e-06, -8.432194590568542e-06, -7.978640496730804e-06, -7.525086402893066e-06, -7.071532309055328e-06, -6.61797821521759e-06, -6.164424121379852e-06, -5.710870027542114e-06, -5.257315933704376e-06, -4.803761839866638e-06, -4.3502077460289e-06, -3.896653652191162e-06, -3.443099558353424e-06, -2.989545464515686e-06, -2.535991370677948e-06, -2.08243727684021e-06, -1.628883183002472e-06, -1.1753290891647339e-06, -7.217749953269958e-07, -2.682209014892578e-07, 1.8533319234848022e-07, 6.388872861862183e-07, 1.0924413800239563e-06, 1.5459954738616943e-06, 1.9995495676994324e-06, 2.4531036615371704e-06, 2.9066577553749084e-06, 3.3602118492126465e-06, 3.8137659430503845e-06, 4.2673200368881226e-06, 4.720874130725861e-06, 5.174428224563599e-06, 5.627982318401337e-06, 6.081536412239075e-06, 6.535090506076813e-06, 6.988644599914551e-06, 7.442198693752289e-06, 7.895752787590027e-06, 8.349306881427765e-06, 8.802860975265503e-06, 9.256415069103241e-06, 9.709969162940979e-06, 1.0163523256778717e-05, 1.0617077350616455e-05, 1.1070631444454193e-05, 1.1524185538291931e-05, 1.197773963212967e-05, 1.2431293725967407e-05, 1.2884847819805145e-05, 1.3338401913642883e-05, 1.3791956007480621e-05, 1.424551010131836e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 15.0, 20.0, 24.0, 43.0, 68.0, 113.0, 157.0, 300.0, 591.0, 1050.0, 2027.0, 3671.0, 7146.0, 13434.0, 26263.0, 50495.0, 94677.0, 167477.0, 232281.0, 196697.0, 118840.0, 63885.0, 33176.0, 17080.0, 8990.0, 4624.0, 2407.0, 1279.0, 713.0, 377.0, 219.0, 125.0, 62.0, 45.0, 34.0, 28.0, 16.0, 20.0, 11.0, 16.0, 10.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.037689208984375, -0.03660249710083008, -0.035515785217285156, -0.034429073333740234, -0.03334236145019531, -0.03225564956665039, -0.03116893768310547, -0.030082225799560547, -0.028995513916015625, -0.027908802032470703, -0.02682209014892578, -0.02573537826538086, -0.024648666381835938, -0.023561954498291016, -0.022475242614746094, -0.021388530731201172, -0.02030181884765625, -0.019215106964111328, -0.018128395080566406, -0.017041683197021484, -0.015954971313476562, -0.01486825942993164, -0.013781547546386719, -0.012694835662841797, -0.011608123779296875, -0.010521411895751953, -0.009434700012207031, -0.00834798812866211, -0.0072612762451171875, -0.006174564361572266, -0.005087852478027344, -0.004001140594482422, -0.0029144287109375, -0.0018277168273925781, -0.0007410049438476562, 0.0003457069396972656, 0.0014324188232421875, 0.0025191307067871094, 0.0036058425903320312, 0.004692554473876953, 0.005779266357421875, 0.006865978240966797, 0.007952690124511719, 0.00903940200805664, 0.010126113891601562, 0.011212825775146484, 0.012299537658691406, 0.013386249542236328, 0.01447296142578125, 0.015559673309326172, 0.016646385192871094, 0.017733097076416016, 0.018819808959960938, 0.01990652084350586, 0.02099323272705078, 0.022079944610595703, 0.023166656494140625, 0.024253368377685547, 0.02534008026123047, 0.02642679214477539, 0.027513504028320312, 0.028600215911865234, 0.029686927795410156, 0.030773639678955078, 0.0318603515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 10.0, 6.0, 7.0, 13.0, 13.0, 14.0, 17.0, 28.0, 22.0, 28.0, 30.0, 23.0, 39.0, 51.0, 51.0, 41.0, 52.0, 71.0, 57.0, 54.0, 36.0, 52.0, 38.0, 27.0, 27.0, 24.0, 22.0, 12.0, 15.0, 15.0, 11.0, 11.0, 4.0, 7.0, 11.0, 5.0, 12.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03192138671875, -0.03090047836303711, -0.02987957000732422, -0.028858661651611328, -0.027837753295898438, -0.026816844940185547, -0.025795936584472656, -0.024775028228759766, -0.023754119873046875, -0.022733211517333984, -0.021712303161621094, -0.020691394805908203, -0.019670486450195312, -0.018649578094482422, -0.01762866973876953, -0.01660776138305664, -0.01558685302734375, -0.01456594467163086, -0.013545036315917969, -0.012524127960205078, -0.011503219604492188, -0.010482311248779297, -0.009461402893066406, -0.008440494537353516, -0.007419586181640625, -0.006398677825927734, -0.005377769470214844, -0.004356861114501953, -0.0033359527587890625, -0.002315044403076172, -0.0012941360473632812, -0.0002732276916503906, 0.0007476806640625, 0.0017685890197753906, 0.0027894973754882812, 0.003810405731201172, 0.0048313140869140625, 0.005852222442626953, 0.006873130798339844, 0.007894039154052734, 0.008914947509765625, 0.009935855865478516, 0.010956764221191406, 0.011977672576904297, 0.012998580932617188, 0.014019489288330078, 0.015040397644042969, 0.01606130599975586, 0.01708221435546875, 0.01810312271118164, 0.01912403106689453, 0.020144939422607422, 0.021165847778320312, 0.022186756134033203, 0.023207664489746094, 0.024228572845458984, 0.025249481201171875, 0.026270389556884766, 0.027291297912597656, 0.028312206268310547, 0.029333114624023438, 0.030354022979736328, 0.03137493133544922, 0.03239583969116211, 0.033416748046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 14.0, 24.0, 20.0, 45.0, 58.0, 55.0, 75.0, 80.0, 108.0, 79.0, 91.0, 71.0, 50.0, 58.0, 45.0, 21.0, 21.0, 18.0, 13.0, 8.0, 9.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280575692653656, -0.26758620142936707, -0.2545967102050781, -0.241607204079628, -0.22861771285533905, -0.21562820672988892, -0.20263871550559998, -0.18964922428131104, -0.1766597330570221, -0.16367024183273315, -0.15068073570728302, -0.13769124448299408, -0.12470175325870514, -0.1117122545838356, -0.09872275590896606, -0.08573326468467712, -0.07274375855922699, -0.05975426360964775, -0.04676476866006851, -0.033775269985198975, -0.020785775035619736, -0.007796280086040497, 0.0051932185888290405, 0.01818270981311798, 0.03117220848798752, 0.04416170343756676, 0.057151198387145996, 0.07014069706201553, 0.08313019573688507, 0.09611968696117401, 0.10910918563604355, 0.12209867686033249, 0.13508817553520203, 0.14807766675949097, 0.1610671728849411, 0.17405666410923004, 0.18704615533351898, 0.20003566145896912, 0.21302515268325806, 0.226014643907547, 0.23900413513183594, 0.2519936263561249, 0.2649831175804138, 0.27797263860702515, 0.2909621298313141, 0.303951621055603, 0.31694111227989197, 0.3299306035041809, 0.34292012453079224, 0.3559096157550812, 0.3688991069793701, 0.38188862800598145, 0.3948781192302704, 0.4078676104545593, 0.42085710167884827, 0.4338465929031372, 0.44683608412742615, 0.4598255753517151, 0.47281506657600403, 0.48580455780029297, 0.4987940788269043, 0.5117835402488708, 0.5247730612754822, 0.5377625226974487, 0.5507520437240601]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 5.0, 7.0, 1.0, 5.0, 10.0, 10.0, 13.0, 12.0, 14.0, 10.0, 15.0, 20.0, 26.0, 22.0, 21.0, 24.0, 39.0, 41.0, 37.0, 33.0, 42.0, 38.0, 30.0, 50.0, 28.0, 48.0, 43.0, 42.0, 27.0, 30.0, 20.0, 26.0, 29.0, 27.0, 15.0, 24.0, 19.0, 16.0, 13.0, 10.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2848557233810425, -0.2759571969509125, -0.26705870032310486, -0.25816017389297485, -0.24926164746284485, -0.24036313593387604, -0.23146462440490723, -0.22256609797477722, -0.21366757154464722, -0.2047690600156784, -0.1958705335855484, -0.1869720220565796, -0.17807349562644958, -0.16917498409748077, -0.16027647256851196, -0.15137794613838196, -0.14247943460941315, -0.13358092308044434, -0.12468239665031433, -0.11578388512134552, -0.10688535869121552, -0.0979868471622467, -0.0890883281826973, -0.08018980920314789, -0.07129129022359848, -0.06239277124404907, -0.053494252264499664, -0.044595737010240555, -0.03569721803069115, -0.02679869905114174, -0.01790018379688263, -0.009001664817333221, -0.00010314583778381348, 0.00879537221044302, 0.017693890258669853, 0.026592407375574112, 0.03549092635512352, 0.04438944533467293, 0.05328796058893204, 0.062186479568481445, 0.07108499854803085, 0.07998351752758026, 0.08888203650712967, 0.09778055548667908, 0.10667906701564789, 0.1155775934457779, 0.1244761049747467, 0.1333746314048767, 0.14227314293384552, 0.15117165446281433, 0.16007018089294434, 0.16896869242191315, 0.17786721885204315, 0.18676573038101196, 0.19566425681114197, 0.20456276834011078, 0.2134612798690796, 0.2223597913980484, 0.2312583178281784, 0.24015682935714722, 0.24905535578727722, 0.2579538822174072, 0.26685237884521484, 0.27575090527534485, 0.28464943170547485]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 18.0, 15.0, 20.0, 26.0, 34.0, 64.0, 79.0, 111.0, 160.0, 202.0, 292.0, 355.0, 613.0, 958.0, 1575.0, 2526.0, 4360.0, 8081.0, 15272.0, 31293.0, 69678.0, 177315.0, 556419.0, 1685366.0, 1096133.0, 329558.0, 116336.0, 48209.0, 22714.0, 11396.0, 6026.0, 3404.0, 2035.0, 1204.0, 789.0, 502.0, 329.0, 233.0, 163.0, 111.0, 78.0, 56.0, 41.0, 33.0, 25.0, 21.0, 14.0, 3.0, 9.0, 0.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.058837890625, -0.056986331939697266, -0.05513477325439453, -0.0532832145690918, -0.05143165588378906, -0.04958009719848633, -0.047728538513183594, -0.04587697982788086, -0.044025421142578125, -0.04217386245727539, -0.040322303771972656, -0.03847074508666992, -0.03661918640136719, -0.03476762771606445, -0.03291606903076172, -0.031064510345458984, -0.02921295166015625, -0.027361392974853516, -0.02550983428955078, -0.023658275604248047, -0.021806716918945312, -0.019955158233642578, -0.018103599548339844, -0.01625204086303711, -0.014400482177734375, -0.01254892349243164, -0.010697364807128906, -0.008845806121826172, -0.0069942474365234375, -0.005142688751220703, -0.0032911300659179688, -0.0014395713806152344, 0.0004119873046875, 0.0022635459899902344, 0.004115104675292969, 0.005966663360595703, 0.007818222045898438, 0.009669780731201172, 0.011521339416503906, 0.01337289810180664, 0.015224456787109375, 0.01707601547241211, 0.018927574157714844, 0.020779132843017578, 0.022630691528320312, 0.024482250213623047, 0.02633380889892578, 0.028185367584228516, 0.03003692626953125, 0.031888484954833984, 0.03374004364013672, 0.03559160232543945, 0.03744316101074219, 0.03929471969604492, 0.041146278381347656, 0.04299783706665039, 0.044849395751953125, 0.04670095443725586, 0.048552513122558594, 0.05040407180786133, 0.05225563049316406, 0.0541071891784668, 0.05595874786376953, 0.057810306549072266, 0.059661865234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 6.0, 10.0, 10.0, 12.0, 16.0, 11.0, 28.0, 18.0, 22.0, 25.0, 19.0, 33.0, 19.0, 37.0, 28.0, 34.0, 41.0, 39.0, 43.0, 43.0, 36.0, 39.0, 39.0, 27.0, 29.0, 27.0, 35.0, 33.0, 23.0, 22.0, 23.0, 15.0, 18.0, 21.0, 16.0, 14.0, 14.0, 16.0, 7.0, 6.0, 9.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0390625, -0.03779411315917969, -0.036525726318359375, -0.03525733947753906, -0.03398895263671875, -0.03272056579589844, -0.031452178955078125, -0.030183792114257812, -0.0289154052734375, -0.027647018432617188, -0.026378631591796875, -0.025110244750976562, -0.02384185791015625, -0.022573471069335938, -0.021305084228515625, -0.020036697387695312, -0.018768310546875, -0.017499923706054688, -0.016231536865234375, -0.014963150024414062, -0.01369476318359375, -0.012426376342773438, -0.011157989501953125, -0.009889602661132812, -0.0086212158203125, -0.0073528289794921875, -0.006084442138671875, -0.0048160552978515625, -0.00354766845703125, -0.0022792816162109375, -0.001010894775390625, 0.0002574920654296875, 0.00152587890625, 0.0027942657470703125, 0.004062652587890625, 0.0053310394287109375, 0.00659942626953125, 0.007867813110351562, 0.009136199951171875, 0.010404586791992188, 0.0116729736328125, 0.012941360473632812, 0.014209747314453125, 0.015478134155273438, 0.01674652099609375, 0.018014907836914062, 0.019283294677734375, 0.020551681518554688, 0.021820068359375, 0.023088455200195312, 0.024356842041015625, 0.025625228881835938, 0.02689361572265625, 0.028162002563476562, 0.029430389404296875, 0.030698776245117188, 0.0319671630859375, 0.03323554992675781, 0.034503936767578125, 0.03577232360839844, 0.03704071044921875, 0.03830909729003906, 0.039577484130859375, 0.04084587097167969, 0.0421142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 16.0, 25.0, 26.0, 39.0, 44.0, 92.0, 95.0, 160.0, 247.0, 370.0, 586.0, 873.0, 1663.0, 2973.0, 5890.0, 12129.0, 26958.0, 64570.0, 168004.0, 493936.0, 1528070.0, 1258020.0, 393253.0, 137575.0, 53546.0, 22912.0, 10465.0, 5171.0, 2662.0, 1478.0, 855.0, 481.0, 341.0, 235.0, 148.0, 85.0, 67.0, 62.0, 43.0, 22.0, 21.0, 17.0, 12.0, 7.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.07366943359375, -0.07128524780273438, -0.06890106201171875, -0.06651687622070312, -0.0641326904296875, -0.061748504638671875, -0.05936431884765625, -0.056980133056640625, -0.054595947265625, -0.052211761474609375, -0.04982757568359375, -0.047443389892578125, -0.0450592041015625, -0.042675018310546875, -0.04029083251953125, -0.037906646728515625, -0.0355224609375, -0.033138275146484375, -0.03075408935546875, -0.028369903564453125, -0.0259857177734375, -0.023601531982421875, -0.02121734619140625, -0.018833160400390625, -0.016448974609375, -0.014064788818359375, -0.01168060302734375, -0.009296417236328125, -0.0069122314453125, -0.004528045654296875, -0.00214385986328125, 0.000240325927734375, 0.00262451171875, 0.005008697509765625, 0.00739288330078125, 0.009777069091796875, 0.0121612548828125, 0.014545440673828125, 0.01692962646484375, 0.019313812255859375, 0.021697998046875, 0.024082183837890625, 0.02646636962890625, 0.028850555419921875, 0.0312347412109375, 0.033618927001953125, 0.03600311279296875, 0.038387298583984375, 0.040771484375, 0.043155670166015625, 0.04553985595703125, 0.047924041748046875, 0.0503082275390625, 0.052692413330078125, 0.05507659912109375, 0.057460784912109375, 0.059844970703125, 0.062229156494140625, 0.06461334228515625, 0.06699752807617188, 0.0693817138671875, 0.07176589965820312, 0.07415008544921875, 0.07653427124023438, 0.07891845703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 15.0, 18.0, 19.0, 33.0, 37.0, 46.0, 74.0, 107.0, 163.0, 196.0, 290.0, 435.0, 587.0, 626.0, 442.0, 281.0, 214.0, 151.0, 88.0, 67.0, 49.0, 24.0, 21.0, 14.0, 18.0, 8.0, 11.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08856201171875, -0.0857076644897461, -0.08285331726074219, -0.07999897003173828, -0.07714462280273438, -0.07429027557373047, -0.07143592834472656, -0.06858158111572266, -0.06572723388671875, -0.06287288665771484, -0.06001853942871094, -0.05716419219970703, -0.054309844970703125, -0.05145549774169922, -0.04860115051269531, -0.045746803283691406, -0.0428924560546875, -0.040038108825683594, -0.03718376159667969, -0.03432941436767578, -0.031475067138671875, -0.02862071990966797, -0.025766372680664062, -0.022912025451660156, -0.02005767822265625, -0.017203330993652344, -0.014348983764648438, -0.011494636535644531, -0.008640289306640625, -0.005785942077636719, -0.0029315948486328125, -7.724761962890625e-05, 0.002777099609375, 0.005631446838378906, 0.008485794067382812, 0.011340141296386719, 0.014194488525390625, 0.01704883575439453, 0.019903182983398438, 0.022757530212402344, 0.02561187744140625, 0.028466224670410156, 0.03132057189941406, 0.03417491912841797, 0.037029266357421875, 0.03988361358642578, 0.04273796081542969, 0.045592308044433594, 0.0484466552734375, 0.051301002502441406, 0.05415534973144531, 0.05700969696044922, 0.059864044189453125, 0.06271839141845703, 0.06557273864746094, 0.06842708587646484, 0.07128143310546875, 0.07413578033447266, 0.07699012756347656, 0.07984447479248047, 0.08269882202148438, 0.08555316925048828, 0.08840751647949219, 0.0912618637084961, 0.0941162109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 4.0, 11.0, 9.0, 6.0, 13.0, 16.0, 33.0, 36.0, 41.0, 49.0, 51.0, 62.0, 81.0, 77.0, 77.0, 87.0, 69.0, 55.0, 54.0, 43.0, 32.0, 25.0, 19.0, 10.0, 7.0, 4.0, 8.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31754857301712036, -0.30716583132743835, -0.29678308963775635, -0.28640034794807434, -0.27601760625839233, -0.2656348943710327, -0.2552521526813507, -0.2448694109916687, -0.2344866693019867, -0.2241039276123047, -0.21372118592262268, -0.20333845913410187, -0.19295571744441986, -0.18257297575473785, -0.17219024896621704, -0.16180750727653503, -0.15142476558685303, -0.14104202389717102, -0.130659282207489, -0.1202765554189682, -0.1098938137292862, -0.09951107203960419, -0.08912833780050278, -0.07874560356140137, -0.06836286187171936, -0.05798012390732765, -0.047597385942935944, -0.037214647978544235, -0.026831910014152527, -0.01644917204976082, -0.00606643408536911, 0.0043163001537323, 0.014699041843414307, 0.025081779807806015, 0.03546451777219772, 0.04584725573658943, 0.05622999370098114, 0.06661273539066315, 0.07699546962976456, 0.08737820386886597, 0.09776094555854797, 0.10814368724822998, 0.11852642148733139, 0.1289091557264328, 0.1392918974161148, 0.14967463910579681, 0.16005736589431763, 0.17044010758399963, 0.18082284927368164, 0.19120559096336365, 0.20158833265304565, 0.21197105944156647, 0.22235380113124847, 0.23273654282093048, 0.2431192696094513, 0.2535020112991333, 0.2638847529888153, 0.2742674946784973, 0.2846502363681793, 0.29503297805786133, 0.30541568994522095, 0.31579843163490295, 0.32618117332458496, 0.33656391501426697, 0.346946656703949]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 14.0, 7.0, 9.0, 10.0, 13.0, 13.0, 20.0, 26.0, 18.0, 23.0, 30.0, 24.0, 28.0, 31.0, 31.0, 27.0, 38.0, 29.0, 33.0, 26.0, 29.0, 44.0, 39.0, 43.0, 38.0, 35.0, 26.0, 28.0, 39.0, 25.0, 32.0, 27.0, 12.0, 22.0, 19.0, 14.0, 11.0, 6.0, 19.0, 6.0, 5.0, 3.0, 6.0, 6.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.21680021286010742, -0.21019044518470764, -0.20358067750930786, -0.19697090983390808, -0.1903611421585083, -0.18375137448310852, -0.17714160680770874, -0.17053183913230896, -0.16392207145690918, -0.1573123037815094, -0.15070253610610962, -0.14409276843070984, -0.13748300075531006, -0.13087323307991028, -0.1242634579539299, -0.11765369027853012, -0.11104391515254974, -0.10443414747714996, -0.09782437980175018, -0.0912146121263504, -0.08460484445095062, -0.07799507677555084, -0.07138530164957047, -0.06477553397417068, -0.058165766298770905, -0.051555998623371124, -0.044946230947971344, -0.038336459547281265, -0.031726691871881485, -0.025116924196481705, -0.018507152795791626, -0.011897385120391846, -0.005287617444992065, 0.0013221511617302895, 0.007931919768452644, 0.014541689306497574, 0.021151456981897354, 0.027761224657297134, 0.03437099605798721, 0.04098076373338699, 0.047590531408786774, 0.054200299084186554, 0.060810066759586334, 0.06741984188556671, 0.07402960956096649, 0.08063937723636627, 0.08724914491176605, 0.09385891258716583, 0.10046868026256561, 0.1070784479379654, 0.11368821561336517, 0.12029798328876495, 0.12690775096416473, 0.13351751863956451, 0.1401273012161255, 0.14673706889152527, 0.15334683656692505, 0.15995660424232483, 0.1665663719177246, 0.1731761395931244, 0.17978590726852417, 0.18639567494392395, 0.19300544261932373, 0.1996152102947235, 0.2062249779701233]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 17.0, 11.0, 19.0, 35.0, 62.0, 65.0, 94.0, 148.0, 278.0, 409.0, 666.0, 1102.0, 1815.0, 3038.0, 5036.0, 8701.0, 14374.0, 24643.0, 42832.0, 72425.0, 121642.0, 180194.0, 197349.0, 149066.0, 92623.0, 54410.0, 31460.0, 18526.0, 10962.0, 6588.0, 3921.0, 2243.0, 1483.0, 855.0, 519.0, 334.0, 220.0, 140.0, 86.0, 54.0, 40.0, 18.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07720947265625, -0.07465553283691406, -0.07210159301757812, -0.06954765319824219, -0.06699371337890625, -0.06443977355957031, -0.061885833740234375, -0.05933189392089844, -0.0567779541015625, -0.05422401428222656, -0.051670074462890625, -0.04911613464355469, -0.04656219482421875, -0.04400825500488281, -0.041454315185546875, -0.03890037536621094, -0.036346435546875, -0.03379249572753906, -0.031238555908203125, -0.028684616088867188, -0.02613067626953125, -0.023576736450195312, -0.021022796630859375, -0.018468856811523438, -0.0159149169921875, -0.013360977172851562, -0.010807037353515625, -0.008253097534179688, -0.00569915771484375, -0.0031452178955078125, -0.000591278076171875, 0.0019626617431640625, 0.0045166015625, 0.0070705413818359375, 0.009624481201171875, 0.012178421020507812, 0.01473236083984375, 0.017286300659179688, 0.019840240478515625, 0.022394180297851562, 0.0249481201171875, 0.027502059936523438, 0.030055999755859375, 0.03260993957519531, 0.03516387939453125, 0.03771781921386719, 0.040271759033203125, 0.04282569885253906, 0.045379638671875, 0.04793357849121094, 0.050487518310546875, 0.05304145812988281, 0.05559539794921875, 0.05814933776855469, 0.060703277587890625, 0.06325721740722656, 0.0658111572265625, 0.06836509704589844, 0.07091903686523438, 0.07347297668457031, 0.07602691650390625, 0.07858085632324219, 0.08113479614257812, 0.08368873596191406, 0.08624267578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 3.0, 8.0, 14.0, 16.0, 14.0, 15.0, 15.0, 18.0, 20.0, 19.0, 27.0, 26.0, 28.0, 38.0, 31.0, 40.0, 27.0, 38.0, 33.0, 37.0, 38.0, 46.0, 37.0, 46.0, 37.0, 30.0, 32.0, 26.0, 28.0, 23.0, 16.0, 25.0, 16.0, 26.0, 11.0, 9.0, 14.0, 12.0, 7.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.03788423538208008, -0.036644935607910156, -0.035405635833740234, -0.03416633605957031, -0.03292703628540039, -0.03168773651123047, -0.030448436737060547, -0.029209136962890625, -0.027969837188720703, -0.02673053741455078, -0.02549123764038086, -0.024251937866210938, -0.023012638092041016, -0.021773338317871094, -0.020534038543701172, -0.01929473876953125, -0.018055438995361328, -0.016816139221191406, -0.015576839447021484, -0.014337539672851562, -0.01309823989868164, -0.011858940124511719, -0.010619640350341797, -0.009380340576171875, -0.008141040802001953, -0.006901741027832031, -0.005662441253662109, -0.0044231414794921875, -0.0031838417053222656, -0.0019445419311523438, -0.0007052421569824219, 0.0005340576171875, 0.0017733573913574219, 0.0030126571655273438, 0.004251956939697266, 0.0054912567138671875, 0.006730556488037109, 0.007969856262207031, 0.009209156036376953, 0.010448455810546875, 0.011687755584716797, 0.012927055358886719, 0.01416635513305664, 0.015405654907226562, 0.016644954681396484, 0.017884254455566406, 0.019123554229736328, 0.02036285400390625, 0.021602153778076172, 0.022841453552246094, 0.024080753326416016, 0.025320053100585938, 0.02655935287475586, 0.02779865264892578, 0.029037952423095703, 0.030277252197265625, 0.03151655197143555, 0.03275585174560547, 0.03399515151977539, 0.03523445129394531, 0.036473751068115234, 0.037713050842285156, 0.03895235061645508, 0.040191650390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 13.0, 12.0, 18.0, 27.0, 36.0, 49.0, 91.0, 112.0, 175.0, 283.0, 561.0, 1109.0, 2601.0, 5873.0, 14383.0, 35658.0, 89588.0, 219777.0, 337805.0, 202548.0, 82084.0, 32517.0, 13185.0, 5423.0, 2234.0, 1055.0, 508.0, 279.0, 180.0, 108.0, 74.0, 51.0, 36.0, 18.0, 25.0, 16.0, 11.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12197113037109375, -0.1179656982421875, -0.11396026611328125, -0.109954833984375, -0.10594940185546875, -0.1019439697265625, -0.09793853759765625, -0.09393310546875, -0.08992767333984375, -0.0859222412109375, -0.08191680908203125, -0.077911376953125, -0.07390594482421875, -0.0699005126953125, -0.06589508056640625, -0.0618896484375, -0.05788421630859375, -0.0538787841796875, -0.04987335205078125, -0.045867919921875, -0.04186248779296875, -0.0378570556640625, -0.03385162353515625, -0.02984619140625, -0.02584075927734375, -0.0218353271484375, -0.01782989501953125, -0.013824462890625, -0.00981903076171875, -0.0058135986328125, -0.00180816650390625, 0.002197265625, 0.00620269775390625, 0.0102081298828125, 0.01421356201171875, 0.018218994140625, 0.02222442626953125, 0.0262298583984375, 0.03023529052734375, 0.03424072265625, 0.03824615478515625, 0.0422515869140625, 0.04625701904296875, 0.050262451171875, 0.05426788330078125, 0.0582733154296875, 0.06227874755859375, 0.0662841796875, 0.07028961181640625, 0.0742950439453125, 0.07830047607421875, 0.082305908203125, 0.08631134033203125, 0.0903167724609375, 0.09432220458984375, 0.09832763671875, 0.10233306884765625, 0.1063385009765625, 0.11034393310546875, 0.114349365234375, 0.11835479736328125, 0.1223602294921875, 0.12636566162109375, 0.13037109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 8.0, 9.0, 8.0, 10.0, 13.0, 6.0, 16.0, 34.0, 19.0, 27.0, 36.0, 28.0, 28.0, 35.0, 30.0, 37.0, 49.0, 36.0, 48.0, 51.0, 49.0, 50.0, 46.0, 32.0, 39.0, 34.0, 26.0, 25.0, 29.0, 15.0, 21.0, 20.0, 18.0, 18.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.102294921875, -0.0985260009765625, -0.094757080078125, -0.0909881591796875, -0.08721923828125, -0.0834503173828125, -0.079681396484375, -0.0759124755859375, -0.0721435546875, -0.0683746337890625, -0.064605712890625, -0.0608367919921875, -0.05706787109375, -0.0532989501953125, -0.049530029296875, -0.0457611083984375, -0.0419921875, -0.0382232666015625, -0.034454345703125, -0.0306854248046875, -0.02691650390625, -0.0231475830078125, -0.019378662109375, -0.0156097412109375, -0.0118408203125, -0.0080718994140625, -0.004302978515625, -0.0005340576171875, 0.00323486328125, 0.0070037841796875, 0.010772705078125, 0.0145416259765625, 0.018310546875, 0.0220794677734375, 0.025848388671875, 0.0296173095703125, 0.03338623046875, 0.0371551513671875, 0.040924072265625, 0.0446929931640625, 0.0484619140625, 0.0522308349609375, 0.055999755859375, 0.0597686767578125, 0.06353759765625, 0.0673065185546875, 0.071075439453125, 0.0748443603515625, 0.07861328125, 0.0823822021484375, 0.086151123046875, 0.0899200439453125, 0.09368896484375, 0.0974578857421875, 0.101226806640625, 0.1049957275390625, 0.1087646484375, 0.1125335693359375, 0.116302490234375, 0.1200714111328125, 0.12384033203125, 0.1276092529296875, 0.131378173828125, 0.1351470947265625, 0.138916015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 4.0, 6.0, 17.0, 18.0, 32.0, 67.0, 86.0, 151.0, 223.0, 394.0, 691.0, 1093.0, 1778.0, 2895.0, 4849.0, 8337.0, 13945.0, 23730.0, 41694.0, 73532.0, 130247.0, 205509.0, 212006.0, 140207.0, 79302.0, 44777.0, 25491.0, 15204.0, 8944.0, 5335.0, 3183.0, 1863.0, 1174.0, 667.0, 415.0, 247.0, 162.0, 98.0, 69.0, 40.0, 24.0, 20.0, 8.0, 12.0, 6.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297088623046875, -0.028752565383911133, -0.027796268463134766, -0.0268399715423584, -0.02588367462158203, -0.024927377700805664, -0.023971080780029297, -0.02301478385925293, -0.022058486938476562, -0.021102190017700195, -0.020145893096923828, -0.01918959617614746, -0.018233299255371094, -0.017277002334594727, -0.01632070541381836, -0.015364408493041992, -0.014408111572265625, -0.013451814651489258, -0.01249551773071289, -0.011539220809936523, -0.010582923889160156, -0.009626626968383789, -0.008670330047607422, -0.007714033126831055, -0.0067577362060546875, -0.00580143928527832, -0.004845142364501953, -0.003888845443725586, -0.0029325485229492188, -0.0019762516021728516, -0.0010199546813964844, -6.365776062011719e-05, 0.00089263916015625, 0.0018489360809326172, 0.0028052330017089844, 0.0037615299224853516, 0.004717826843261719, 0.005674123764038086, 0.006630420684814453, 0.00758671760559082, 0.008543014526367188, 0.009499311447143555, 0.010455608367919922, 0.011411905288696289, 0.012368202209472656, 0.013324499130249023, 0.01428079605102539, 0.015237092971801758, 0.016193389892578125, 0.017149686813354492, 0.01810598373413086, 0.019062280654907227, 0.020018577575683594, 0.02097487449645996, 0.021931171417236328, 0.022887468338012695, 0.023843765258789062, 0.02480006217956543, 0.025756359100341797, 0.026712656021118164, 0.02766895294189453, 0.0286252498626709, 0.029581546783447266, 0.030537843704223633, 0.031494140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 2.0, 5.0, 5.0, 9.0, 13.0, 12.0, 19.0, 29.0, 26.0, 20.0, 40.0, 46.0, 58.0, 59.0, 50.0, 56.0, 62.0, 70.0, 49.0, 53.0, 57.0, 56.0, 42.0, 23.0, 26.0, 20.0, 20.0, 16.0, 12.0, 6.0, 6.0, 4.0, 10.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3178214430809021e-05, -1.2706965208053589e-05, -1.2235715985298157e-05, -1.1764466762542725e-05, -1.1293217539787292e-05, -1.082196831703186e-05, -1.0350719094276428e-05, -9.879469871520996e-06, -9.408220648765564e-06, -8.936971426010132e-06, -8.4657222032547e-06, -7.994472980499268e-06, -7.5232237577438354e-06, -7.051974534988403e-06, -6.580725312232971e-06, -6.109476089477539e-06, -5.638226866722107e-06, -5.166977643966675e-06, -4.695728421211243e-06, -4.2244791984558105e-06, -3.7532299757003784e-06, -3.2819807529449463e-06, -2.810731530189514e-06, -2.339482307434082e-06, -1.86823308467865e-06, -1.3969838619232178e-06, -9.257346391677856e-07, -4.544854164123535e-07, 1.6763806343078613e-08, 4.880130290985107e-07, 9.592622518539429e-07, 1.430511474609375e-06, 1.9017606973648071e-06, 2.3730099201202393e-06, 2.8442591428756714e-06, 3.3155083656311035e-06, 3.7867575883865356e-06, 4.258006811141968e-06, 4.7292560338974e-06, 5.200505256652832e-06, 5.671754479408264e-06, 6.143003702163696e-06, 6.614252924919128e-06, 7.0855021476745605e-06, 7.556751370429993e-06, 8.028000593185425e-06, 8.499249815940857e-06, 8.970499038696289e-06, 9.441748261451721e-06, 9.912997484207153e-06, 1.0384246706962585e-05, 1.0855495929718018e-05, 1.132674515247345e-05, 1.1797994375228882e-05, 1.2269243597984314e-05, 1.2740492820739746e-05, 1.3211742043495178e-05, 1.368299126625061e-05, 1.4154240489006042e-05, 1.4625489711761475e-05, 1.5096738934516907e-05, 1.556798815727234e-05, 1.603923738002777e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 9.0, 9.0, 14.0, 18.0, 41.0, 48.0, 77.0, 143.0, 222.0, 450.0, 896.0, 1719.0, 3735.0, 7940.0, 16984.0, 37281.0, 83385.0, 183229.0, 297936.0, 222838.0, 104268.0, 46734.0, 21499.0, 9943.0, 4576.0, 2166.0, 1096.0, 538.0, 311.0, 169.0, 99.0, 55.0, 39.0, 31.0, 11.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0390625, -0.03782796859741211, -0.03659343719482422, -0.03535890579223633, -0.03412437438964844, -0.03288984298706055, -0.031655311584472656, -0.030420780181884766, -0.029186248779296875, -0.027951717376708984, -0.026717185974121094, -0.025482654571533203, -0.024248123168945312, -0.023013591766357422, -0.02177906036376953, -0.02054452896118164, -0.01930999755859375, -0.01807546615600586, -0.01684093475341797, -0.015606403350830078, -0.014371871948242188, -0.013137340545654297, -0.011902809143066406, -0.010668277740478516, -0.009433746337890625, -0.008199214935302734, -0.006964683532714844, -0.005730152130126953, -0.0044956207275390625, -0.003261089324951172, -0.0020265579223632812, -0.0007920265197753906, 0.0004425048828125, 0.0016770362854003906, 0.0029115676879882812, 0.004146099090576172, 0.0053806304931640625, 0.006615161895751953, 0.007849693298339844, 0.009084224700927734, 0.010318756103515625, 0.011553287506103516, 0.012787818908691406, 0.014022350311279297, 0.015256881713867188, 0.016491413116455078, 0.01772594451904297, 0.01896047592163086, 0.02019500732421875, 0.02142953872680664, 0.02266407012939453, 0.023898601531982422, 0.025133132934570312, 0.026367664337158203, 0.027602195739746094, 0.028836727142333984, 0.030071258544921875, 0.031305789947509766, 0.032540321350097656, 0.03377485275268555, 0.03500938415527344, 0.03624391555786133, 0.03747844696044922, 0.03871297836303711, 0.039947509765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 4.0, 5.0, 14.0, 18.0, 23.0, 13.0, 19.0, 28.0, 24.0, 50.0, 52.0, 55.0, 48.0, 61.0, 63.0, 63.0, 54.0, 62.0, 46.0, 49.0, 49.0, 31.0, 26.0, 27.0, 20.0, 17.0, 7.0, 15.0, 4.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.041961669921875, -0.04085278511047363, -0.039743900299072266, -0.0386350154876709, -0.03752613067626953, -0.036417245864868164, -0.0353083610534668, -0.03419947624206543, -0.03309059143066406, -0.031981706619262695, -0.030872821807861328, -0.02976393699645996, -0.028655052185058594, -0.027546167373657227, -0.02643728256225586, -0.025328397750854492, -0.024219512939453125, -0.023110628128051758, -0.02200174331665039, -0.020892858505249023, -0.019783973693847656, -0.01867508888244629, -0.017566204071044922, -0.016457319259643555, -0.015348434448242188, -0.01423954963684082, -0.013130664825439453, -0.012021780014038086, -0.010912895202636719, -0.009804010391235352, -0.008695125579833984, -0.007586240768432617, -0.00647735595703125, -0.005368471145629883, -0.004259586334228516, -0.0031507015228271484, -0.0020418167114257812, -0.0009329319000244141, 0.00017595291137695312, 0.0012848377227783203, 0.0023937225341796875, 0.0035026073455810547, 0.004611492156982422, 0.005720376968383789, 0.006829261779785156, 0.007938146591186523, 0.00904703140258789, 0.010155916213989258, 0.011264801025390625, 0.012373685836791992, 0.01348257064819336, 0.014591455459594727, 0.015700340270996094, 0.01680922508239746, 0.017918109893798828, 0.019026994705200195, 0.020135879516601562, 0.02124476432800293, 0.022353649139404297, 0.023462533950805664, 0.02457141876220703, 0.0256803035736084, 0.026789188385009766, 0.027898073196411133, 0.0290069580078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 11.0, 21.0, 38.0, 45.0, 73.0, 85.0, 103.0, 99.0, 109.0, 87.0, 102.0, 85.0, 41.0, 30.0, 35.0, 15.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6966410875320435, -0.6796780228614807, -0.6627150177955627, -0.645751953125, -0.628788948059082, -0.6118258833885193, -0.5948628783226013, -0.5778998136520386, -0.5609368085861206, -0.5439737439155579, -0.5270107388496399, -0.5100476741790771, -0.4930846691131592, -0.47612160444259644, -0.4591585695743561, -0.4421955347061157, -0.425232470035553, -0.4082694351673126, -0.39130640029907227, -0.3743433654308319, -0.35738033056259155, -0.3404172658920288, -0.32345423102378845, -0.3064911961555481, -0.28952816128730774, -0.2725651264190674, -0.255602091550827, -0.23863904178142548, -0.22167600691318512, -0.20471297204494476, -0.1877499222755432, -0.17078688740730286, -0.1538238525390625, -0.13686081767082214, -0.11989777535200119, -0.10293473303318024, -0.08597169816493988, -0.06900866329669952, -0.05204562097787857, -0.03508257865905762, -0.01811954379081726, -0.0011565051972866058, 0.01580653339624405, 0.032769571989774704, 0.04973261058330536, 0.06669564545154572, 0.08365868777036667, 0.10062173008918762, 0.11758476495742798, 0.13454779982566833, 0.1515108346939087, 0.16847388446331024, 0.1854369193315506, 0.20239995419979095, 0.2193630039691925, 0.23632603883743286, 0.2532890737056732, 0.2702521085739136, 0.28721514344215393, 0.3041781783103943, 0.32114124298095703, 0.338104248046875, 0.35506731271743774, 0.3720303475856781, 0.38899338245391846]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 13.0, 9.0, 8.0, 9.0, 17.0, 10.0, 24.0, 22.0, 16.0, 31.0, 34.0, 24.0, 37.0, 26.0, 34.0, 27.0, 47.0, 43.0, 44.0, 39.0, 44.0, 48.0, 28.0, 45.0, 41.0, 34.0, 41.0, 25.0, 21.0, 21.0, 15.0, 20.0, 26.0, 16.0, 15.0, 11.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31484436988830566, -0.3046812415122986, -0.2945181131362915, -0.2843549847602844, -0.27419185638427734, -0.26402872800827026, -0.2538655996322632, -0.2437024861574173, -0.23353935778141022, -0.22337622940540314, -0.21321310102939606, -0.20304997265338898, -0.1928868591785431, -0.182723730802536, -0.17256060242652893, -0.16239747405052185, -0.15223434567451477, -0.1420712172985077, -0.1319080889225006, -0.12174496799707413, -0.11158183962106705, -0.10141871124505997, -0.09125559031963348, -0.0810924619436264, -0.07092933356761932, -0.060766205191612244, -0.05060308054089546, -0.04043995589017868, -0.0302768275141716, -0.02011369913816452, -0.009950574487447739, 0.00021255016326904297, 0.010375678539276123, 0.020538805052638054, 0.030701931565999985, 0.040865056216716766, 0.051028184592723846, 0.061191312968730927, 0.07135443389415741, 0.08151756227016449, 0.09168069064617157, 0.10184381902217865, 0.11200694739818573, 0.12217006832361221, 0.1323331892490387, 0.14249631762504578, 0.15265944600105286, 0.16282257437705994, 0.17298570275306702, 0.1831488311290741, 0.19331195950508118, 0.20347508788108826, 0.21363821625709534, 0.22380134463310242, 0.2339644581079483, 0.24412758648395538, 0.25429069995880127, 0.26445382833480835, 0.27461695671081543, 0.2847800850868225, 0.2949432134628296, 0.30510634183883667, 0.31526947021484375, 0.32543259859085083, 0.3355957269668579]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 6.0, 9.0, 7.0, 12.0, 14.0, 11.0, 20.0, 22.0, 43.0, 41.0, 44.0, 116.0, 191.0, 343.0, 894.0, 2575.0, 9923.0, 46257.0, 378411.0, 3186339.0, 496524.0, 56469.0, 11035.0, 2952.0, 986.0, 404.0, 218.0, 107.0, 79.0, 61.0, 34.0, 27.0, 21.0, 20.0, 15.0, 11.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13016319274902344, -0.12543869018554688, -0.12071418762207031, -0.11598968505859375, -0.11126518249511719, -0.10654067993164062, -0.10181617736816406, -0.0970916748046875, -0.09236717224121094, -0.08764266967773438, -0.08291816711425781, -0.07819366455078125, -0.07346916198730469, -0.06874465942382812, -0.06402015686035156, -0.059295654296875, -0.05457115173339844, -0.049846649169921875, -0.04512214660644531, -0.04039764404296875, -0.03567314147949219, -0.030948638916015625, -0.026224136352539062, -0.0214996337890625, -0.016775131225585938, -0.012050628662109375, -0.0073261260986328125, -0.00260162353515625, 0.0021228790283203125, 0.006847381591796875, 0.011571884155273438, 0.01629638671875, 0.021020889282226562, 0.025745391845703125, 0.030469894409179688, 0.03519439697265625, 0.03991889953613281, 0.044643402099609375, 0.04936790466308594, 0.0540924072265625, 0.05881690979003906, 0.06354141235351562, 0.06826591491699219, 0.07299041748046875, 0.07771492004394531, 0.08243942260742188, 0.08716392517089844, 0.091888427734375, 0.09661293029785156, 0.10133743286132812, 0.10606193542480469, 0.11078643798828125, 0.11551094055175781, 0.12023544311523438, 0.12495994567871094, 0.1296844482421875, 0.13440895080566406, 0.13913345336914062, 0.1438579559326172, 0.14858245849609375, 0.1533069610595703, 0.15803146362304688, 0.16275596618652344, 0.16748046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 7.0, 4.0, 3.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 14.0, 14.0, 20.0, 21.0, 27.0, 34.0, 30.0, 29.0, 33.0, 30.0, 36.0, 45.0, 37.0, 37.0, 30.0, 39.0, 42.0, 42.0, 36.0, 30.0, 31.0, 31.0, 37.0, 31.0, 20.0, 23.0, 17.0, 20.0, 21.0, 18.0, 7.0, 11.0, 5.0, 8.0, 6.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.04376220703125, -0.0423741340637207, -0.040986061096191406, -0.03959798812866211, -0.03820991516113281, -0.036821842193603516, -0.03543376922607422, -0.03404569625854492, -0.032657623291015625, -0.03126955032348633, -0.02988147735595703, -0.028493404388427734, -0.027105331420898438, -0.02571725845336914, -0.024329185485839844, -0.022941112518310547, -0.02155303955078125, -0.020164966583251953, -0.018776893615722656, -0.01738882064819336, -0.016000747680664062, -0.014612674713134766, -0.013224601745605469, -0.011836528778076172, -0.010448455810546875, -0.009060382843017578, -0.007672309875488281, -0.006284236907958984, -0.0048961639404296875, -0.0035080909729003906, -0.0021200180053710938, -0.0007319450378417969, 0.0006561279296875, 0.002044200897216797, 0.0034322738647460938, 0.004820346832275391, 0.0062084197998046875, 0.007596492767333984, 0.008984565734863281, 0.010372638702392578, 0.011760711669921875, 0.013148784637451172, 0.014536857604980469, 0.015924930572509766, 0.017313003540039062, 0.01870107650756836, 0.020089149475097656, 0.021477222442626953, 0.02286529541015625, 0.024253368377685547, 0.025641441345214844, 0.02702951431274414, 0.028417587280273438, 0.029805660247802734, 0.03119373321533203, 0.03258180618286133, 0.033969879150390625, 0.03535795211791992, 0.03674602508544922, 0.038134098052978516, 0.03952217102050781, 0.04091024398803711, 0.042298316955566406, 0.0436863899230957, 0.045074462890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 6.0, 14.0, 8.0, 26.0, 26.0, 37.0, 57.0, 81.0, 152.0, 206.0, 311.0, 517.0, 841.0, 1537.0, 2648.0, 5325.0, 10503.0, 21946.0, 48422.0, 113888.0, 294059.0, 856464.0, 1701799.0, 708078.0, 247889.0, 97577.0, 42181.0, 19527.0, 9391.0, 4646.0, 2509.0, 1486.0, 801.0, 460.0, 292.0, 178.0, 114.0, 85.0, 54.0, 32.0, 29.0, 21.0, 12.0, 12.0, 11.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07195568084716797, -0.06950950622558594, -0.0670633316040039, -0.06461715698242188, -0.062170982360839844, -0.05972480773925781, -0.05727863311767578, -0.05483245849609375, -0.05238628387451172, -0.04994010925292969, -0.047493934631347656, -0.045047760009765625, -0.042601585388183594, -0.04015541076660156, -0.03770923614501953, -0.0352630615234375, -0.03281688690185547, -0.030370712280273438, -0.027924537658691406, -0.025478363037109375, -0.023032188415527344, -0.020586013793945312, -0.01813983917236328, -0.01569366455078125, -0.013247489929199219, -0.010801315307617188, -0.008355140686035156, -0.005908966064453125, -0.0034627914428710938, -0.0010166168212890625, 0.0014295578002929688, 0.003875732421875, 0.006321907043457031, 0.008768081665039062, 0.011214256286621094, 0.013660430908203125, 0.016106605529785156, 0.018552780151367188, 0.02099895477294922, 0.02344512939453125, 0.02589130401611328, 0.028337478637695312, 0.030783653259277344, 0.033229827880859375, 0.035676002502441406, 0.03812217712402344, 0.04056835174560547, 0.0430145263671875, 0.04546070098876953, 0.04790687561035156, 0.050353050231933594, 0.052799224853515625, 0.055245399475097656, 0.05769157409667969, 0.06013774871826172, 0.06258392333984375, 0.06503009796142578, 0.06747627258300781, 0.06992244720458984, 0.07236862182617188, 0.0748147964477539, 0.07726097106933594, 0.07970714569091797, 0.0821533203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 6.0, 10.0, 28.0, 27.0, 41.0, 48.0, 76.0, 104.0, 156.0, 236.0, 332.0, 525.0, 707.0, 619.0, 383.0, 288.0, 162.0, 112.0, 68.0, 44.0, 26.0, 22.0, 20.0, 13.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11578369140625, -0.11253643035888672, -0.10928916931152344, -0.10604190826416016, -0.10279464721679688, -0.0995473861694336, -0.09630012512207031, -0.09305286407470703, -0.08980560302734375, -0.08655834197998047, -0.08331108093261719, -0.0800638198852539, -0.07681655883789062, -0.07356929779052734, -0.07032203674316406, -0.06707477569580078, -0.0638275146484375, -0.06058025360107422, -0.05733299255371094, -0.054085731506347656, -0.050838470458984375, -0.047591209411621094, -0.04434394836425781, -0.04109668731689453, -0.03784942626953125, -0.03460216522216797, -0.03135490417480469, -0.028107643127441406, -0.024860382080078125, -0.021613121032714844, -0.018365859985351562, -0.015118598937988281, -0.011871337890625, -0.008624076843261719, -0.0053768157958984375, -0.0021295547485351562, 0.001117706298828125, 0.004364967346191406, 0.0076122283935546875, 0.010859489440917969, 0.01410675048828125, 0.01735401153564453, 0.020601272583007812, 0.023848533630371094, 0.027095794677734375, 0.030343055725097656, 0.03359031677246094, 0.03683757781982422, 0.0400848388671875, 0.04333209991455078, 0.04657936096191406, 0.049826622009277344, 0.053073883056640625, 0.056321144104003906, 0.05956840515136719, 0.06281566619873047, 0.06606292724609375, 0.06931018829345703, 0.07255744934082031, 0.0758047103881836, 0.07905197143554688, 0.08229923248291016, 0.08554649353027344, 0.08879375457763672, 0.092041015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 16.0, 21.0, 28.0, 27.0, 39.0, 46.0, 55.0, 70.0, 46.0, 53.0, 77.0, 75.0, 61.0, 53.0, 50.0, 46.0, 34.0, 35.0, 21.0, 27.0, 18.0, 15.0, 16.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25698065757751465, -0.2487000674009323, -0.24041947722434998, -0.23213888704776764, -0.2238582968711853, -0.21557770669460297, -0.20729711651802063, -0.1990165263414383, -0.19073593616485596, -0.18245534598827362, -0.17417475581169128, -0.16589416563510895, -0.1576135754585266, -0.14933298528194427, -0.14105239510536194, -0.1327718049287796, -0.12449121475219727, -0.11621062457561493, -0.10793003439903259, -0.09964944422245026, -0.09136885404586792, -0.08308826386928558, -0.07480767369270325, -0.06652708351612091, -0.058246493339538574, -0.04996590316295624, -0.0416853129863739, -0.033404722809791565, -0.02512413263320923, -0.016843542456626892, -0.008562952280044556, -0.00028236210346221924, 0.007998228073120117, 0.016278818249702454, 0.02455940842628479, 0.032839998602867126, 0.04112058877944946, 0.0494011789560318, 0.057681769132614136, 0.06596235930919647, 0.07424294948577881, 0.08252353966236115, 0.09080412983894348, 0.09908472001552582, 0.10736531019210815, 0.11564590036869049, 0.12392649054527283, 0.13220708072185516, 0.1404876708984375, 0.14876826107501984, 0.15704885125160217, 0.1653294414281845, 0.17361003160476685, 0.18189062178134918, 0.19017121195793152, 0.19845180213451385, 0.2067323923110962, 0.21501298248767853, 0.22329357266426086, 0.2315741628408432, 0.23985475301742554, 0.24813534319400787, 0.2564159333705902, 0.26469653844833374, 0.2729771137237549]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 16.0, 17.0, 16.0, 27.0, 29.0, 26.0, 32.0, 23.0, 30.0, 45.0, 37.0, 42.0, 49.0, 56.0, 46.0, 36.0, 51.0, 31.0, 39.0, 38.0, 34.0, 30.0, 26.0, 23.0, 18.0, 22.0, 13.0, 19.0, 14.0, 7.0, 15.0, 10.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21432888507843018, -0.20741678774356842, -0.20050470530986786, -0.1935926079750061, -0.18668051064014435, -0.1797684133052826, -0.17285633087158203, -0.16594423353672028, -0.15903213620185852, -0.15212003886699677, -0.1452079564332962, -0.13829585909843445, -0.1313837617635727, -0.12447167187929153, -0.11755958199501038, -0.11064748466014862, -0.10373540222644806, -0.0968233123421669, -0.08991121500730515, -0.08299912512302399, -0.07608702778816223, -0.06917493790388107, -0.062262848019599915, -0.05535075441002846, -0.048438660800457, -0.041526567190885544, -0.03461447358131409, -0.02770238369703293, -0.02079029008746147, -0.013878196477890015, -0.006966106593608856, -5.401298403739929e-05, 0.006858080625534058, 0.01377017330378294, 0.020682265982031822, 0.02759435772895813, 0.03450645133852959, 0.041418544948101044, 0.0483306348323822, 0.05524272844195366, 0.062154822051525116, 0.06906691193580627, 0.07597900927066803, 0.08289109915494919, 0.08980318903923035, 0.0967152863740921, 0.10362737625837326, 0.11053946614265442, 0.11745156347751617, 0.12436365336179733, 0.1312757432460785, 0.13818784058094025, 0.145099937915802, 0.15201202034950256, 0.15892411768436432, 0.16583621501922607, 0.17274829745292664, 0.1796603947877884, 0.18657247722148895, 0.1934845745563507, 0.20039667189121246, 0.20730876922607422, 0.21422085165977478, 0.22113294899463654, 0.2280450463294983]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 3.0, 15.0, 13.0, 31.0, 42.0, 71.0, 113.0, 202.0, 322.0, 480.0, 770.0, 1210.0, 2060.0, 3230.0, 5140.0, 8007.0, 12460.0, 19731.0, 31571.0, 52003.0, 90785.0, 160969.0, 227034.0, 178652.0, 101910.0, 57965.0, 34564.0, 21807.0, 13562.0, 8849.0, 5642.0, 3536.0, 2209.0, 1363.0, 831.0, 493.0, 337.0, 216.0, 137.0, 79.0, 44.0, 33.0, 17.0, 17.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.07293701171875, -0.07069969177246094, -0.06846237182617188, -0.06622505187988281, -0.06398773193359375, -0.06175041198730469, -0.059513092041015625, -0.05727577209472656, -0.0550384521484375, -0.05280113220214844, -0.050563812255859375, -0.04832649230957031, -0.04608917236328125, -0.04385185241699219, -0.041614532470703125, -0.03937721252441406, -0.037139892578125, -0.03490257263183594, -0.032665252685546875, -0.030427932739257812, -0.02819061279296875, -0.025953292846679688, -0.023715972900390625, -0.021478652954101562, -0.0192413330078125, -0.017004013061523438, -0.014766693115234375, -0.012529373168945312, -0.01029205322265625, -0.008054733276367188, -0.005817413330078125, -0.0035800933837890625, -0.0013427734375, 0.0008945465087890625, 0.003131866455078125, 0.0053691864013671875, 0.00760650634765625, 0.009843826293945312, 0.012081146240234375, 0.014318466186523438, 0.0165557861328125, 0.018793106079101562, 0.021030426025390625, 0.023267745971679688, 0.02550506591796875, 0.027742385864257812, 0.029979705810546875, 0.03221702575683594, 0.034454345703125, 0.03669166564941406, 0.038928985595703125, 0.04116630554199219, 0.04340362548828125, 0.04564094543457031, 0.047878265380859375, 0.05011558532714844, 0.0523529052734375, 0.05459022521972656, 0.056827545166015625, 0.05906486511230469, 0.06130218505859375, 0.06353950500488281, 0.06577682495117188, 0.06801414489746094, 0.07025146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 9.0, 14.0, 7.0, 13.0, 14.0, 18.0, 19.0, 20.0, 24.0, 23.0, 33.0, 29.0, 25.0, 28.0, 42.0, 46.0, 31.0, 39.0, 37.0, 41.0, 36.0, 32.0, 49.0, 31.0, 35.0, 30.0, 33.0, 33.0, 18.0, 21.0, 20.0, 25.0, 22.0, 18.0, 8.0, 10.0, 11.0, 7.0, 12.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.044586181640625, -0.04315996170043945, -0.041733741760253906, -0.04030752182006836, -0.03888130187988281, -0.037455081939697266, -0.03602886199951172, -0.03460264205932617, -0.033176422119140625, -0.03175020217895508, -0.03032398223876953, -0.028897762298583984, -0.027471542358398438, -0.02604532241821289, -0.024619102478027344, -0.023192882537841797, -0.02176666259765625, -0.020340442657470703, -0.018914222717285156, -0.01748800277709961, -0.016061782836914062, -0.014635562896728516, -0.013209342956542969, -0.011783123016357422, -0.010356903076171875, -0.008930683135986328, -0.007504463195800781, -0.006078243255615234, -0.0046520233154296875, -0.0032258033752441406, -0.0017995834350585938, -0.0003733634948730469, 0.0010528564453125, 0.002479076385498047, 0.0039052963256835938, 0.005331516265869141, 0.0067577362060546875, 0.008183956146240234, 0.009610176086425781, 0.011036396026611328, 0.012462615966796875, 0.013888835906982422, 0.015315055847167969, 0.016741275787353516, 0.018167495727539062, 0.01959371566772461, 0.021019935607910156, 0.022446155548095703, 0.02387237548828125, 0.025298595428466797, 0.026724815368652344, 0.02815103530883789, 0.029577255249023438, 0.031003475189208984, 0.03242969512939453, 0.03385591506958008, 0.035282135009765625, 0.03670835494995117, 0.03813457489013672, 0.039560794830322266, 0.04098701477050781, 0.04241323471069336, 0.043839454650878906, 0.04526567459106445, 0.04669189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 15.0, 19.0, 24.0, 37.0, 39.0, 61.0, 85.0, 117.0, 205.0, 411.0, 963.0, 3010.0, 10719.0, 36797.0, 144492.0, 541758.0, 232627.0, 54200.0, 15614.0, 4641.0, 1341.0, 575.0, 266.0, 160.0, 81.0, 71.0, 65.0, 31.0, 34.0, 14.0, 20.0, 7.0, 9.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1640625, -0.15790557861328125, -0.1517486572265625, -0.14559173583984375, -0.139434814453125, -0.13327789306640625, -0.1271209716796875, -0.12096405029296875, -0.11480712890625, -0.10865020751953125, -0.1024932861328125, -0.09633636474609375, -0.090179443359375, -0.08402252197265625, -0.0778656005859375, -0.07170867919921875, -0.0655517578125, -0.05939483642578125, -0.0532379150390625, -0.04708099365234375, -0.040924072265625, -0.03476715087890625, -0.0286102294921875, -0.02245330810546875, -0.01629638671875, -0.01013946533203125, -0.0039825439453125, 0.00217437744140625, 0.008331298828125, 0.01448822021484375, 0.0206451416015625, 0.02680206298828125, 0.032958984375, 0.03911590576171875, 0.0452728271484375, 0.05142974853515625, 0.057586669921875, 0.06374359130859375, 0.0699005126953125, 0.07605743408203125, 0.08221435546875, 0.08837127685546875, 0.0945281982421875, 0.10068511962890625, 0.106842041015625, 0.11299896240234375, 0.1191558837890625, 0.12531280517578125, 0.1314697265625, 0.13762664794921875, 0.1437835693359375, 0.14994049072265625, 0.156097412109375, 0.16225433349609375, 0.1684112548828125, 0.17456817626953125, 0.18072509765625, 0.18688201904296875, 0.1930389404296875, 0.19919586181640625, 0.205352783203125, 0.21150970458984375, 0.2176666259765625, 0.22382354736328125, 0.22998046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 8.0, 3.0, 7.0, 4.0, 20.0, 19.0, 25.0, 29.0, 33.0, 40.0, 28.0, 47.0, 51.0, 44.0, 51.0, 55.0, 52.0, 48.0, 44.0, 54.0, 52.0, 58.0, 45.0, 36.0, 37.0, 21.0, 18.0, 22.0, 11.0, 10.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15933990478515625, -0.1536407470703125, -0.14794158935546875, -0.142242431640625, -0.13654327392578125, -0.1308441162109375, -0.12514495849609375, -0.11944580078125, -0.11374664306640625, -0.1080474853515625, -0.10234832763671875, -0.096649169921875, -0.09095001220703125, -0.0852508544921875, -0.07955169677734375, -0.0738525390625, -0.06815338134765625, -0.0624542236328125, -0.05675506591796875, -0.051055908203125, -0.04535675048828125, -0.0396575927734375, -0.03395843505859375, -0.02825927734375, -0.02256011962890625, -0.0168609619140625, -0.01116180419921875, -0.005462646484375, 0.00023651123046875, 0.0059356689453125, 0.01163482666015625, 0.017333984375, 0.02303314208984375, 0.0287322998046875, 0.03443145751953125, 0.040130615234375, 0.04582977294921875, 0.0515289306640625, 0.05722808837890625, 0.06292724609375, 0.06862640380859375, 0.0743255615234375, 0.08002471923828125, 0.085723876953125, 0.09142303466796875, 0.0971221923828125, 0.10282135009765625, 0.1085205078125, 0.11421966552734375, 0.1199188232421875, 0.12561798095703125, 0.131317138671875, 0.13701629638671875, 0.1427154541015625, 0.14841461181640625, 0.15411376953125, 0.15981292724609375, 0.1655120849609375, 0.17121124267578125, 0.176910400390625, 0.18260955810546875, 0.1883087158203125, 0.19400787353515625, 0.19970703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 18.0, 25.0, 30.0, 44.0, 97.0, 153.0, 285.0, 518.0, 1009.0, 2126.0, 4380.0, 9101.0, 18875.0, 41601.0, 123219.0, 461207.0, 264647.0, 67969.0, 27837.0, 13035.0, 6315.0, 2997.0, 1499.0, 693.0, 407.0, 183.0, 115.0, 54.0, 31.0, 23.0, 14.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06437397003173828, -0.06228065490722656, -0.060187339782714844, -0.058094024658203125, -0.056000709533691406, -0.05390739440917969, -0.05181407928466797, -0.04972076416015625, -0.04762744903564453, -0.04553413391113281, -0.043440818786621094, -0.041347503662109375, -0.039254188537597656, -0.03716087341308594, -0.03506755828857422, -0.0329742431640625, -0.03088092803955078, -0.028787612915039062, -0.026694297790527344, -0.024600982666015625, -0.022507667541503906, -0.020414352416992188, -0.01832103729248047, -0.01622772216796875, -0.014134407043457031, -0.012041091918945312, -0.009947776794433594, -0.007854461669921875, -0.005761146545410156, -0.0036678314208984375, -0.0015745162963867188, 0.000518798828125, 0.0026121139526367188, 0.0047054290771484375, 0.006798744201660156, 0.008892059326171875, 0.010985374450683594, 0.013078689575195312, 0.015172004699707031, 0.01726531982421875, 0.01935863494873047, 0.021451950073242188, 0.023545265197753906, 0.025638580322265625, 0.027731895446777344, 0.029825210571289062, 0.03191852569580078, 0.0340118408203125, 0.03610515594482422, 0.03819847106933594, 0.040291786193847656, 0.042385101318359375, 0.044478416442871094, 0.04657173156738281, 0.04866504669189453, 0.05075836181640625, 0.05285167694091797, 0.05494499206542969, 0.057038307189941406, 0.059131622314453125, 0.061224937438964844, 0.06331825256347656, 0.06541156768798828, 0.0675048828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 13.0, 10.0, 11.0, 14.0, 17.0, 28.0, 32.0, 38.0, 34.0, 61.0, 59.0, 79.0, 79.0, 57.0, 59.0, 61.0, 60.0, 52.0, 37.0, 31.0, 27.0, 16.0, 21.0, 21.0, 10.0, 4.0, 6.0, 6.0, 6.0, 5.0, 1.0, 8.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7523765563964844e-05, -1.70096755027771e-05, -1.6495585441589355e-05, -1.598149538040161e-05, -1.5467405319213867e-05, -1.4953315258026123e-05, -1.4439225196838379e-05, -1.3925135135650635e-05, -1.341104507446289e-05, -1.2896955013275146e-05, -1.2382864952087402e-05, -1.1868774890899658e-05, -1.1354684829711914e-05, -1.084059476852417e-05, -1.0326504707336426e-05, -9.812414646148682e-06, -9.298324584960938e-06, -8.784234523773193e-06, -8.27014446258545e-06, -7.756054401397705e-06, -7.241964340209961e-06, -6.727874279022217e-06, -6.213784217834473e-06, -5.6996941566467285e-06, -5.185604095458984e-06, -4.67151403427124e-06, -4.157423973083496e-06, -3.643333911895752e-06, -3.129243850708008e-06, -2.6151537895202637e-06, -2.1010637283325195e-06, -1.5869736671447754e-06, -1.0728836059570312e-06, -5.587935447692871e-07, -4.470348358154297e-08, 4.6938657760620117e-07, 9.834766387939453e-07, 1.4975666999816895e-06, 2.0116567611694336e-06, 2.5257468223571777e-06, 3.039836883544922e-06, 3.553926944732666e-06, 4.06801700592041e-06, 4.582107067108154e-06, 5.0961971282958984e-06, 5.610287189483643e-06, 6.124377250671387e-06, 6.638467311859131e-06, 7.152557373046875e-06, 7.666647434234619e-06, 8.180737495422363e-06, 8.694827556610107e-06, 9.208917617797852e-06, 9.723007678985596e-06, 1.023709774017334e-05, 1.0751187801361084e-05, 1.1265277862548828e-05, 1.1779367923736572e-05, 1.2293457984924316e-05, 1.280754804611206e-05, 1.3321638107299805e-05, 1.3835728168487549e-05, 1.4349818229675293e-05, 1.4863908290863037e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 1.0, 12.0, 15.0, 16.0, 22.0, 30.0, 45.0, 62.0, 126.0, 238.0, 483.0, 1121.0, 3125.0, 8430.0, 23011.0, 70029.0, 305723.0, 471536.0, 111597.0, 33588.0, 12124.0, 4246.0, 1595.0, 691.0, 297.0, 140.0, 90.0, 55.0, 29.0, 31.0, 15.0, 13.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08905029296875, -0.0867772102355957, -0.0845041275024414, -0.08223104476928711, -0.07995796203613281, -0.07768487930297852, -0.07541179656982422, -0.07313871383666992, -0.07086563110351562, -0.06859254837036133, -0.06631946563720703, -0.06404638290405273, -0.06177330017089844, -0.05950021743774414, -0.057227134704589844, -0.05495405197143555, -0.05268096923828125, -0.05040788650512695, -0.048134803771972656, -0.04586172103881836, -0.04358863830566406, -0.041315555572509766, -0.03904247283935547, -0.03676939010620117, -0.034496307373046875, -0.03222322463989258, -0.02995014190673828, -0.027677059173583984, -0.025403976440429688, -0.02313089370727539, -0.020857810974121094, -0.018584728240966797, -0.0163116455078125, -0.014038562774658203, -0.011765480041503906, -0.00949239730834961, -0.0072193145751953125, -0.004946231842041016, -0.0026731491088867188, -0.0004000663757324219, 0.001873016357421875, 0.004146099090576172, 0.006419181823730469, 0.008692264556884766, 0.010965347290039062, 0.01323843002319336, 0.015511512756347656, 0.017784595489501953, 0.02005767822265625, 0.022330760955810547, 0.024603843688964844, 0.02687692642211914, 0.029150009155273438, 0.031423091888427734, 0.03369617462158203, 0.03596925735473633, 0.038242340087890625, 0.04051542282104492, 0.04278850555419922, 0.045061588287353516, 0.04733467102050781, 0.04960775375366211, 0.051880836486816406, 0.0541539192199707, 0.056427001953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 7.0, 13.0, 6.0, 16.0, 21.0, 26.0, 31.0, 58.0, 71.0, 93.0, 101.0, 109.0, 98.0, 85.0, 61.0, 42.0, 33.0, 26.0, 13.0, 18.0, 11.0, 7.0, 7.0, 3.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06085205078125, -0.05918312072753906, -0.057514190673828125, -0.05584526062011719, -0.05417633056640625, -0.05250740051269531, -0.050838470458984375, -0.04916954040527344, -0.0475006103515625, -0.04583168029785156, -0.044162750244140625, -0.04249382019042969, -0.04082489013671875, -0.03915596008300781, -0.037487030029296875, -0.03581809997558594, -0.034149169921875, -0.03248023986816406, -0.030811309814453125, -0.029142379760742188, -0.02747344970703125, -0.025804519653320312, -0.024135589599609375, -0.022466659545898438, -0.0207977294921875, -0.019128799438476562, -0.017459869384765625, -0.015790939331054688, -0.01412200927734375, -0.012453079223632812, -0.010784149169921875, -0.009115219116210938, -0.0074462890625, -0.0057773590087890625, -0.004108428955078125, -0.0024394989013671875, -0.00077056884765625, 0.0008983612060546875, 0.002567291259765625, 0.0042362213134765625, 0.0059051513671875, 0.0075740814208984375, 0.009243011474609375, 0.010911941528320312, 0.01258087158203125, 0.014249801635742188, 0.015918731689453125, 0.017587661743164062, 0.019256591796875, 0.020925521850585938, 0.022594451904296875, 0.024263381958007812, 0.02593231201171875, 0.027601242065429688, 0.029270172119140625, 0.030939102172851562, 0.0326080322265625, 0.03427696228027344, 0.035945892333984375, 0.03761482238769531, 0.03928375244140625, 0.04095268249511719, 0.042621612548828125, 0.04429054260253906, 0.04595947265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 15.0, 35.0, 59.0, 115.0, 179.0, 169.0, 170.0, 114.0, 95.0, 27.0, 15.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389845073223114, -0.3586246967315674, -0.32740435004234314, -0.2961840033531189, -0.26496362686157227, -0.23374326527118683, -0.2025229036808014, -0.17130254209041595, -0.14008218050003052, -0.10886181890964508, -0.07764145731925964, -0.04642109572887421, -0.01520073413848877, 0.016019627451896667, 0.047239989042282104, 0.07846035063266754, 0.10968071222305298, 0.14090107381343842, 0.17212143540382385, 0.2033417969942093, 0.23456215858459473, 0.26578253507614136, 0.2970028817653656, 0.32822322845458984, 0.3594436049461365, 0.3906639814376831, 0.42188432812690735, 0.4531046748161316, 0.4843250513076782, 0.5155454277992249, 0.5467658042907715, 0.5779861211776733, 0.6092064380645752, 0.6404268145561218, 0.6716471910476685, 0.7028675079345703, 0.7340878844261169, 0.7653082609176636, 0.7965285778045654, 0.8277489542961121, 0.8589693307876587, 0.8901897072792053, 0.921410083770752, 0.9526304006576538, 0.9838507771492004, 1.015071153640747, 1.046291470527649, 1.0775119066238403, 1.1087322235107422, 1.139952540397644, 1.1711729764938354, 1.2023932933807373, 1.2336137294769287, 1.2648340463638306, 1.2960543632507324, 1.3272747993469238, 1.3584951162338257, 1.3897154331207275, 1.420935869216919, 1.4521561861038208, 1.4833765029907227, 1.514596939086914, 1.545817255973816, 1.5770376920700073, 1.6082580089569092]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 10.0, 14.0, 9.0, 10.0, 22.0, 23.0, 29.0, 33.0, 36.0, 29.0, 37.0, 30.0, 43.0, 39.0, 44.0, 43.0, 33.0, 43.0, 48.0, 34.0, 41.0, 46.0, 39.0, 31.0, 38.0, 21.0, 24.0, 25.0, 16.0, 14.0, 15.0, 12.0, 12.0, 10.0, 4.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4383001923561096, -0.4258387088775635, -0.4133772552013397, -0.40091580152511597, -0.3884543180465698, -0.3759928345680237, -0.3635313808917999, -0.35106992721557617, -0.33860844373703003, -0.3261469602584839, -0.31368550658226013, -0.3012240529060364, -0.28876256942749023, -0.2763010859489441, -0.26383963227272034, -0.2513781785964966, -0.23891669511795044, -0.2264552265405655, -0.21399375796318054, -0.2015322893857956, -0.18907082080841064, -0.1766093522310257, -0.16414788365364075, -0.1516864150762558, -0.13922494649887085, -0.1267634779214859, -0.11430200934410095, -0.101840540766716, -0.08937907218933105, -0.0769176036119461, -0.06445613503456116, -0.05199466645717621, -0.03953319787979126, -0.02707172930240631, -0.014610260725021362, -0.0021487921476364136, 0.010312676429748535, 0.022774145007133484, 0.03523561358451843, 0.04769708216190338, 0.06015855073928833, 0.07262001931667328, 0.08508148789405823, 0.09754295647144318, 0.11000442504882812, 0.12246589362621307, 0.13492736220359802, 0.14738883078098297, 0.15985029935836792, 0.17231176793575287, 0.18477323651313782, 0.19723470509052277, 0.20969617366790771, 0.22215764224529266, 0.2346191108226776, 0.24708057940006256, 0.2595420479774475, 0.27200353145599365, 0.2844649851322174, 0.29692643880844116, 0.3093879222869873, 0.32184940576553345, 0.3343108594417572, 0.34677231311798096, 0.3592337965965271]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 12.0, 12.0, 13.0, 18.0, 34.0, 46.0, 56.0, 94.0, 126.0, 242.0, 400.0, 680.0, 1153.0, 2205.0, 4067.0, 8372.0, 17294.0, 38702.0, 90198.0, 237473.0, 758514.0, 2019100.0, 652329.0, 212959.0, 82805.0, 34984.0, 16013.0, 7741.0, 3795.0, 2052.0, 1142.0, 638.0, 354.0, 218.0, 121.0, 84.0, 62.0, 36.0, 32.0, 26.0, 20.0, 14.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06310367584228516, -0.06096076965332031, -0.05881786346435547, -0.056674957275390625, -0.05453205108642578, -0.05238914489746094, -0.050246238708496094, -0.04810333251953125, -0.045960426330566406, -0.04381752014160156, -0.04167461395263672, -0.039531707763671875, -0.03738880157470703, -0.03524589538574219, -0.033102989196777344, -0.0309600830078125, -0.028817176818847656, -0.026674270629882812, -0.02453136444091797, -0.022388458251953125, -0.02024555206298828, -0.018102645874023438, -0.015959739685058594, -0.01381683349609375, -0.011673927307128906, -0.009531021118164062, -0.007388114929199219, -0.005245208740234375, -0.0031023025512695312, -0.0009593963623046875, 0.0011835098266601562, 0.003326416015625, 0.005469322204589844, 0.0076122283935546875, 0.009755134582519531, 0.011898040771484375, 0.014040946960449219, 0.016183853149414062, 0.018326759338378906, 0.02046966552734375, 0.022612571716308594, 0.024755477905273438, 0.02689838409423828, 0.029041290283203125, 0.03118419647216797, 0.03332710266113281, 0.035470008850097656, 0.0376129150390625, 0.039755821228027344, 0.04189872741699219, 0.04404163360595703, 0.046184539794921875, 0.04832744598388672, 0.05047035217285156, 0.052613258361816406, 0.05475616455078125, 0.056899070739746094, 0.05904197692871094, 0.06118488311767578, 0.06332778930664062, 0.06547069549560547, 0.06761360168457031, 0.06975650787353516, 0.0718994140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 12.0, 8.0, 14.0, 12.0, 18.0, 19.0, 18.0, 17.0, 27.0, 29.0, 26.0, 27.0, 31.0, 38.0, 45.0, 34.0, 39.0, 43.0, 50.0, 51.0, 46.0, 30.0, 43.0, 42.0, 37.0, 25.0, 32.0, 34.0, 24.0, 15.0, 16.0, 15.0, 17.0, 12.0, 16.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06494140625, -0.06314706802368164, -0.06135272979736328, -0.05955839157104492, -0.05776405334472656, -0.0559697151184082, -0.054175376892089844, -0.052381038665771484, -0.050586700439453125, -0.048792362213134766, -0.046998023986816406, -0.04520368576049805, -0.04340934753417969, -0.04161500930786133, -0.03982067108154297, -0.03802633285522461, -0.03623199462890625, -0.03443765640258789, -0.03264331817626953, -0.030848979949951172, -0.029054641723632812, -0.027260303497314453, -0.025465965270996094, -0.023671627044677734, -0.021877288818359375, -0.020082950592041016, -0.018288612365722656, -0.016494274139404297, -0.014699935913085938, -0.012905597686767578, -0.011111259460449219, -0.00931692123413086, -0.0075225830078125, -0.005728244781494141, -0.003933906555175781, -0.002139568328857422, -0.0003452301025390625, 0.0014491081237792969, 0.0032434463500976562, 0.005037784576416016, 0.006832122802734375, 0.008626461029052734, 0.010420799255371094, 0.012215137481689453, 0.014009475708007812, 0.015803813934326172, 0.01759815216064453, 0.01939249038696289, 0.02118682861328125, 0.02298116683959961, 0.02477550506591797, 0.026569843292236328, 0.028364181518554688, 0.030158519744873047, 0.031952857971191406, 0.033747196197509766, 0.035541534423828125, 0.037335872650146484, 0.039130210876464844, 0.0409245491027832, 0.04271888732910156, 0.04451322555541992, 0.04630756378173828, 0.04810190200805664, 0.049896240234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 14.0, 13.0, 26.0, 34.0, 74.0, 86.0, 102.0, 167.0, 271.0, 384.0, 605.0, 898.0, 1409.0, 2090.0, 3554.0, 5915.0, 10194.0, 18638.0, 35483.0, 69969.0, 145649.0, 319326.0, 786014.0, 1516821.0, 709975.0, 291808.0, 134336.0, 65179.0, 33065.0, 17582.0, 9604.0, 5671.0, 3320.0, 2097.0, 1321.0, 826.0, 606.0, 368.0, 241.0, 158.0, 118.0, 67.0, 67.0, 37.0, 34.0, 25.0, 11.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06890392303466797, -0.06664085388183594, -0.0643777847290039, -0.062114715576171875, -0.059851646423339844, -0.05758857727050781, -0.05532550811767578, -0.05306243896484375, -0.05079936981201172, -0.04853630065917969, -0.046273231506347656, -0.044010162353515625, -0.041747093200683594, -0.03948402404785156, -0.03722095489501953, -0.0349578857421875, -0.03269481658935547, -0.030431747436523438, -0.028168678283691406, -0.025905609130859375, -0.023642539978027344, -0.021379470825195312, -0.01911640167236328, -0.01685333251953125, -0.014590263366699219, -0.012327194213867188, -0.010064125061035156, -0.007801055908203125, -0.005537986755371094, -0.0032749176025390625, -0.0010118484497070312, 0.001251220703125, 0.0035142898559570312, 0.0057773590087890625, 0.008040428161621094, 0.010303497314453125, 0.012566566467285156, 0.014829635620117188, 0.01709270477294922, 0.01935577392578125, 0.02161884307861328, 0.023881912231445312, 0.026144981384277344, 0.028408050537109375, 0.030671119689941406, 0.03293418884277344, 0.03519725799560547, 0.0374603271484375, 0.03972339630126953, 0.04198646545410156, 0.044249534606933594, 0.046512603759765625, 0.048775672912597656, 0.05103874206542969, 0.05330181121826172, 0.05556488037109375, 0.05782794952392578, 0.06009101867675781, 0.062354087829589844, 0.06461715698242188, 0.0668802261352539, 0.06914329528808594, 0.07140636444091797, 0.07366943359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 9.0, 7.0, 11.0, 9.0, 14.0, 23.0, 34.0, 37.0, 51.0, 71.0, 104.0, 132.0, 172.0, 266.0, 358.0, 563.0, 589.0, 506.0, 307.0, 215.0, 151.0, 104.0, 75.0, 72.0, 47.0, 27.0, 20.0, 27.0, 12.0, 20.0, 7.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.099853515625, -0.09702587127685547, -0.09419822692871094, -0.0913705825805664, -0.08854293823242188, -0.08571529388427734, -0.08288764953613281, -0.08006000518798828, -0.07723236083984375, -0.07440471649169922, -0.07157707214355469, -0.06874942779541016, -0.06592178344726562, -0.0630941390991211, -0.06026649475097656, -0.05743885040283203, -0.0546112060546875, -0.05178356170654297, -0.04895591735839844, -0.046128273010253906, -0.043300628662109375, -0.040472984313964844, -0.03764533996582031, -0.03481769561767578, -0.03199005126953125, -0.02916240692138672, -0.026334762573242188, -0.023507118225097656, -0.020679473876953125, -0.017851829528808594, -0.015024185180664062, -0.012196540832519531, -0.009368896484375, -0.006541252136230469, -0.0037136077880859375, -0.0008859634399414062, 0.001941680908203125, 0.004769325256347656, 0.0075969696044921875, 0.010424613952636719, 0.01325225830078125, 0.01607990264892578, 0.018907546997070312, 0.021735191345214844, 0.024562835693359375, 0.027390480041503906, 0.030218124389648438, 0.03304576873779297, 0.0358734130859375, 0.03870105743408203, 0.04152870178222656, 0.044356346130371094, 0.047183990478515625, 0.050011634826660156, 0.05283927917480469, 0.05566692352294922, 0.05849456787109375, 0.06132221221923828, 0.06414985656738281, 0.06697750091552734, 0.06980514526367188, 0.0726327896118164, 0.07546043395996094, 0.07828807830810547, 0.08111572265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 13.0, 15.0, 32.0, 33.0, 45.0, 57.0, 59.0, 75.0, 75.0, 77.0, 91.0, 76.0, 73.0, 52.0, 53.0, 41.0, 36.0, 12.0, 21.0, 13.0, 3.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3206601142883301, -0.3084813356399536, -0.29630255699157715, -0.2841237783432007, -0.2719449996948242, -0.25976622104644775, -0.2475874423980713, -0.23540866374969482, -0.22322988510131836, -0.2110511064529419, -0.19887232780456543, -0.18669354915618896, -0.1745147705078125, -0.16233599185943604, -0.15015721321105957, -0.1379784345626831, -0.12579967081546783, -0.11362089216709137, -0.1014421135187149, -0.08926333487033844, -0.07708455622196198, -0.06490577757358551, -0.05272700637578964, -0.04054822772741318, -0.028369449079036713, -0.016190670430660248, -0.004011893644928932, 0.008166883140802383, 0.02034566178917885, 0.03252444043755531, 0.04470321536064148, 0.056881994009017944, 0.06906077265739441, 0.08123955130577087, 0.09341832995414734, 0.1055971086025238, 0.11777588725090027, 0.12995466589927673, 0.1421334445476532, 0.15431222319602966, 0.16649100184440613, 0.1786697804927826, 0.19084855914115906, 0.20302733778953552, 0.215206116437912, 0.22738489508628845, 0.23956367373466492, 0.2517424523830414, 0.26392120122909546, 0.2760999798774719, 0.2882787585258484, 0.30045753717422485, 0.3126363158226013, 0.3248150944709778, 0.33699387311935425, 0.3491726517677307, 0.3613514304161072, 0.37353020906448364, 0.3857089877128601, 0.3978877663612366, 0.41006654500961304, 0.4222453236579895, 0.43442410230636597, 0.44660288095474243, 0.4587816596031189]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 11.0, 6.0, 6.0, 13.0, 12.0, 13.0, 16.0, 25.0, 14.0, 28.0, 26.0, 24.0, 36.0, 40.0, 44.0, 30.0, 47.0, 38.0, 45.0, 58.0, 40.0, 49.0, 43.0, 33.0, 41.0, 37.0, 41.0, 18.0, 17.0, 17.0, 29.0, 21.0, 20.0, 16.0, 10.0, 9.0, 11.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29413020610809326, -0.2850360572338104, -0.27594193816185, -0.26684778928756714, -0.2577536404132843, -0.24865950644016266, -0.23956537246704102, -0.23047122359275818, -0.22137708961963654, -0.2122829556465149, -0.20318880677223206, -0.1940946727991104, -0.18500053882598877, -0.17590638995170593, -0.1668122559785843, -0.15771812200546265, -0.1486239731311798, -0.13952983915805817, -0.13043569028377533, -0.12134155631065369, -0.11224741488695145, -0.1031532734632492, -0.09405913949012756, -0.08496499806642532, -0.07587085664272308, -0.06677671521902084, -0.0576825775206089, -0.04858843982219696, -0.03949429839849472, -0.03040015697479248, -0.02130601927638054, -0.012211881577968597, -0.0031177401542663574, 0.005976399406790733, 0.015070538967847824, 0.024164678528904915, 0.033258818089962006, 0.042352959513664246, 0.05144709721207619, 0.06054123491048813, 0.06963537633419037, 0.07872951775789261, 0.08782365918159485, 0.09691779315471649, 0.10601193457841873, 0.11510607600212097, 0.12420020997524261, 0.13329434394836426, 0.1423884928226471, 0.15148262679576874, 0.16057677567005157, 0.16967090964317322, 0.17876505851745605, 0.1878591924905777, 0.19695332646369934, 0.20604747533798218, 0.21514160931110382, 0.22423574328422546, 0.2333298921585083, 0.24242402613162994, 0.2515181601047516, 0.2606123089790344, 0.26970645785331726, 0.2788005769252777, 0.28789472579956055]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 7.0, 7.0, 19.0, 11.0, 23.0, 41.0, 61.0, 99.0, 157.0, 283.0, 532.0, 990.0, 1733.0, 3175.0, 6101.0, 11763.0, 22771.0, 43793.0, 87335.0, 176514.0, 284369.0, 203599.0, 100198.0, 50614.0, 25977.0, 13329.0, 7028.0, 3556.0, 1975.0, 1047.0, 622.0, 342.0, 177.0, 109.0, 64.0, 40.0, 31.0, 12.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08294677734375, -0.0800466537475586, -0.07714653015136719, -0.07424640655517578, -0.07134628295898438, -0.06844615936279297, -0.06554603576660156, -0.06264591217041016, -0.05974578857421875, -0.056845664978027344, -0.05394554138183594, -0.05104541778564453, -0.048145294189453125, -0.04524517059326172, -0.04234504699707031, -0.039444923400878906, -0.0365447998046875, -0.033644676208496094, -0.030744552612304688, -0.02784442901611328, -0.024944305419921875, -0.02204418182373047, -0.019144058227539062, -0.016243934631347656, -0.01334381103515625, -0.010443687438964844, -0.0075435638427734375, -0.004643440246582031, -0.001743316650390625, 0.0011568069458007812, 0.0040569305419921875, 0.006957054138183594, 0.009857177734375, 0.012757301330566406, 0.015657424926757812, 0.01855754852294922, 0.021457672119140625, 0.02435779571533203, 0.027257919311523438, 0.030158042907714844, 0.03305816650390625, 0.035958290100097656, 0.03885841369628906, 0.04175853729248047, 0.044658660888671875, 0.04755878448486328, 0.05045890808105469, 0.053359031677246094, 0.0562591552734375, 0.059159278869628906, 0.06205940246582031, 0.06495952606201172, 0.06785964965820312, 0.07075977325439453, 0.07365989685058594, 0.07656002044677734, 0.07946014404296875, 0.08236026763916016, 0.08526039123535156, 0.08816051483154297, 0.09106063842773438, 0.09396076202392578, 0.09686088562011719, 0.0997610092163086, 0.1026611328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 0.0, 5.0, 8.0, 10.0, 7.0, 6.0, 10.0, 6.0, 13.0, 17.0, 24.0, 28.0, 17.0, 24.0, 33.0, 28.0, 37.0, 37.0, 43.0, 41.0, 38.0, 45.0, 44.0, 42.0, 45.0, 26.0, 39.0, 40.0, 39.0, 34.0, 36.0, 26.0, 22.0, 22.0, 22.0, 15.0, 9.0, 15.0, 7.0, 10.0, 6.0, 6.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052215576171875, -0.050501346588134766, -0.04878711700439453, -0.0470728874206543, -0.04535865783691406, -0.04364442825317383, -0.041930198669433594, -0.04021596908569336, -0.038501739501953125, -0.03678750991821289, -0.035073280334472656, -0.03335905075073242, -0.03164482116699219, -0.029930591583251953, -0.02821636199951172, -0.026502132415771484, -0.02478790283203125, -0.023073673248291016, -0.02135944366455078, -0.019645214080810547, -0.017930984497070312, -0.016216754913330078, -0.014502525329589844, -0.01278829574584961, -0.011074066162109375, -0.00935983657836914, -0.007645606994628906, -0.005931377410888672, -0.0042171478271484375, -0.002502918243408203, -0.0007886886596679688, 0.0009255409240722656, 0.0026397705078125, 0.004354000091552734, 0.006068229675292969, 0.007782459259033203, 0.009496688842773438, 0.011210918426513672, 0.012925148010253906, 0.01463937759399414, 0.016353607177734375, 0.01806783676147461, 0.019782066345214844, 0.021496295928955078, 0.023210525512695312, 0.024924755096435547, 0.02663898468017578, 0.028353214263916016, 0.03006744384765625, 0.031781673431396484, 0.03349590301513672, 0.03521013259887695, 0.03692436218261719, 0.03863859176635742, 0.040352821350097656, 0.04206705093383789, 0.043781280517578125, 0.04549551010131836, 0.047209739685058594, 0.04892396926879883, 0.05063819885253906, 0.0523524284362793, 0.05406665802001953, 0.055780887603759766, 0.0574951171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 10.0, 18.0, 27.0, 26.0, 31.0, 50.0, 54.0, 58.0, 116.0, 164.0, 264.0, 571.0, 1415.0, 3806.0, 11909.0, 37257.0, 118694.0, 409357.0, 329859.0, 91801.0, 28547.0, 9086.0, 3014.0, 1105.0, 464.0, 257.0, 140.0, 100.0, 74.0, 65.0, 55.0, 20.0, 27.0, 19.0, 14.0, 11.0, 16.0, 7.0, 9.0, 4.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18761634826660156, -0.18223953247070312, -0.1768627166748047, -0.17148590087890625, -0.1661090850830078, -0.16073226928710938, -0.15535545349121094, -0.1499786376953125, -0.14460182189941406, -0.13922500610351562, -0.1338481903076172, -0.12847137451171875, -0.12309455871582031, -0.11771774291992188, -0.11234092712402344, -0.106964111328125, -0.10158729553222656, -0.09621047973632812, -0.09083366394042969, -0.08545684814453125, -0.08008003234863281, -0.07470321655273438, -0.06932640075683594, -0.0639495849609375, -0.05857276916503906, -0.053195953369140625, -0.04781913757324219, -0.04244232177734375, -0.03706550598144531, -0.031688690185546875, -0.026311874389648438, -0.02093505859375, -0.015558242797851562, -0.010181427001953125, -0.0048046112060546875, 0.00057220458984375, 0.0059490203857421875, 0.011325836181640625, 0.016702651977539062, 0.0220794677734375, 0.027456283569335938, 0.032833099365234375, 0.03820991516113281, 0.04358673095703125, 0.04896354675292969, 0.054340362548828125, 0.05971717834472656, 0.065093994140625, 0.07047080993652344, 0.07584762573242188, 0.08122444152832031, 0.08660125732421875, 0.09197807312011719, 0.09735488891601562, 0.10273170471191406, 0.1081085205078125, 0.11348533630371094, 0.11886215209960938, 0.12423896789550781, 0.12961578369140625, 0.1349925994873047, 0.14036941528320312, 0.14574623107910156, 0.151123046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 12.0, 10.0, 19.0, 19.0, 23.0, 37.0, 25.0, 23.0, 42.0, 40.0, 38.0, 35.0, 39.0, 45.0, 43.0, 51.0, 42.0, 48.0, 49.0, 37.0, 57.0, 31.0, 32.0, 28.0, 23.0, 16.0, 17.0, 16.0, 17.0, 10.0, 10.0, 7.0, 6.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.169189453125, -0.1636810302734375, -0.158172607421875, -0.1526641845703125, -0.14715576171875, -0.1416473388671875, -0.136138916015625, -0.1306304931640625, -0.1251220703125, -0.1196136474609375, -0.114105224609375, -0.1085968017578125, -0.10308837890625, -0.0975799560546875, -0.092071533203125, -0.0865631103515625, -0.0810546875, -0.0755462646484375, -0.070037841796875, -0.0645294189453125, -0.05902099609375, -0.0535125732421875, -0.048004150390625, -0.0424957275390625, -0.0369873046875, -0.0314788818359375, -0.025970458984375, -0.0204620361328125, -0.01495361328125, -0.0094451904296875, -0.003936767578125, 0.0015716552734375, 0.007080078125, 0.0125885009765625, 0.018096923828125, 0.0236053466796875, 0.02911376953125, 0.0346221923828125, 0.040130615234375, 0.0456390380859375, 0.0511474609375, 0.0566558837890625, 0.062164306640625, 0.0676727294921875, 0.07318115234375, 0.0786895751953125, 0.084197998046875, 0.0897064208984375, 0.09521484375, 0.1007232666015625, 0.106231689453125, 0.1117401123046875, 0.11724853515625, 0.1227569580078125, 0.128265380859375, 0.1337738037109375, 0.1392822265625, 0.1447906494140625, 0.150299072265625, 0.1558074951171875, 0.16131591796875, 0.1668243408203125, 0.172332763671875, 0.1778411865234375, 0.183349609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 6.0, 11.0, 29.0, 23.0, 66.0, 86.0, 131.0, 210.0, 386.0, 876.0, 2041.0, 5536.0, 14806.0, 39112.0, 107972.0, 357033.0, 352239.0, 105571.0, 38316.0, 14835.0, 5428.0, 2087.0, 826.0, 368.0, 193.0, 126.0, 78.0, 50.0, 37.0, 20.0, 14.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07843017578125, -0.07625102996826172, -0.07407188415527344, -0.07189273834228516, -0.06971359252929688, -0.0675344467163086, -0.06535530090332031, -0.06317615509033203, -0.06099700927734375, -0.05881786346435547, -0.05663871765136719, -0.054459571838378906, -0.052280426025390625, -0.050101280212402344, -0.04792213439941406, -0.04574298858642578, -0.0435638427734375, -0.04138469696044922, -0.03920555114746094, -0.037026405334472656, -0.034847259521484375, -0.032668113708496094, -0.030488967895507812, -0.02830982208251953, -0.02613067626953125, -0.02395153045654297, -0.021772384643554688, -0.019593238830566406, -0.017414093017578125, -0.015234947204589844, -0.013055801391601562, -0.010876655578613281, -0.008697509765625, -0.006518363952636719, -0.0043392181396484375, -0.0021600723266601562, 1.9073486328125e-05, 0.0021982192993164062, 0.0043773651123046875, 0.006556510925292969, 0.00873565673828125, 0.010914802551269531, 0.013093948364257812, 0.015273094177246094, 0.017452239990234375, 0.019631385803222656, 0.021810531616210938, 0.02398967742919922, 0.0261688232421875, 0.02834796905517578, 0.030527114868164062, 0.032706260681152344, 0.034885406494140625, 0.037064552307128906, 0.03924369812011719, 0.04142284393310547, 0.04360198974609375, 0.04578113555908203, 0.04796028137207031, 0.050139427185058594, 0.052318572998046875, 0.054497718811035156, 0.05667686462402344, 0.05885601043701172, 0.06103515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 3.0, 11.0, 13.0, 15.0, 26.0, 25.0, 26.0, 40.0, 51.0, 79.0, 76.0, 90.0, 94.0, 83.0, 65.0, 48.0, 53.0, 55.0, 30.0, 26.0, 19.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9729137420654297e-05, -1.9137747585773468e-05, -1.854635775089264e-05, -1.795496791601181e-05, -1.736357808113098e-05, -1.6772188246250153e-05, -1.6180798411369324e-05, -1.5589408576488495e-05, -1.4998018741607666e-05, -1.4406628906726837e-05, -1.3815239071846008e-05, -1.322384923696518e-05, -1.263245940208435e-05, -1.2041069567203522e-05, -1.1449679732322693e-05, -1.0858289897441864e-05, -1.0266900062561035e-05, -9.675510227680206e-06, -9.084120392799377e-06, -8.492730557918549e-06, -7.90134072303772e-06, -7.309950888156891e-06, -6.718561053276062e-06, -6.127171218395233e-06, -5.535781383514404e-06, -4.9443915486335754e-06, -4.353001713752747e-06, -3.7616118788719177e-06, -3.170222043991089e-06, -2.57883220911026e-06, -1.987442374229431e-06, -1.3960525393486023e-06, -8.046627044677734e-07, -2.1327286958694458e-07, 3.781169652938843e-07, 9.695068001747131e-07, 1.560896635055542e-06, 2.152286469936371e-06, 2.7436763048171997e-06, 3.3350661396980286e-06, 3.926455974578857e-06, 4.517845809459686e-06, 5.109235644340515e-06, 5.700625479221344e-06, 6.292015314102173e-06, 6.883405148983002e-06, 7.4747949838638306e-06, 8.06618481874466e-06, 8.657574653625488e-06, 9.248964488506317e-06, 9.840354323387146e-06, 1.0431744158267975e-05, 1.1023133993148804e-05, 1.1614523828029633e-05, 1.2205913662910461e-05, 1.279730349779129e-05, 1.3388693332672119e-05, 1.3980083167552948e-05, 1.4571473002433777e-05, 1.5162862837314606e-05, 1.5754252672195435e-05, 1.6345642507076263e-05, 1.6937032341957092e-05, 1.752842217683792e-05, 1.811981201171875e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 14.0, 25.0, 30.0, 56.0, 94.0, 149.0, 319.0, 798.0, 3224.0, 17064.0, 106708.0, 605336.0, 265297.0, 40098.0, 6821.0, 1497.0, 506.0, 216.0, 136.0, 62.0, 42.0, 22.0, 15.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11846923828125, -0.11485004425048828, -0.11123085021972656, -0.10761165618896484, -0.10399246215820312, -0.1003732681274414, -0.09675407409667969, -0.09313488006591797, -0.08951568603515625, -0.08589649200439453, -0.08227729797363281, -0.0786581039428711, -0.07503890991210938, -0.07141971588134766, -0.06780052185058594, -0.06418132781982422, -0.0605621337890625, -0.05694293975830078, -0.05332374572753906, -0.049704551696777344, -0.046085357666015625, -0.042466163635253906, -0.03884696960449219, -0.03522777557373047, -0.03160858154296875, -0.02798938751220703, -0.024370193481445312, -0.020750999450683594, -0.017131805419921875, -0.013512611389160156, -0.009893417358398438, -0.006274223327636719, -0.002655029296875, 0.0009641647338867188, 0.0045833587646484375, 0.008202552795410156, 0.011821746826171875, 0.015440940856933594, 0.019060134887695312, 0.02267932891845703, 0.02629852294921875, 0.02991771697998047, 0.03353691101074219, 0.037156105041503906, 0.040775299072265625, 0.044394493103027344, 0.04801368713378906, 0.05163288116455078, 0.0552520751953125, 0.05887126922607422, 0.06249046325683594, 0.06610965728759766, 0.06972885131835938, 0.0733480453491211, 0.07696723937988281, 0.08058643341064453, 0.08420562744140625, 0.08782482147216797, 0.09144401550292969, 0.0950632095336914, 0.09868240356445312, 0.10230159759521484, 0.10592079162597656, 0.10953998565673828, 0.1131591796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 10.0, 11.0, 12.0, 16.0, 17.0, 22.0, 22.0, 39.0, 40.0, 47.0, 67.0, 76.0, 106.0, 89.0, 95.0, 65.0, 52.0, 41.0, 36.0, 26.0, 25.0, 21.0, 13.0, 5.0, 11.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0523681640625, -0.05062532424926758, -0.048882484436035156, -0.047139644622802734, -0.04539680480957031, -0.04365396499633789, -0.04191112518310547, -0.04016828536987305, -0.038425445556640625, -0.0366826057434082, -0.03493976593017578, -0.03319692611694336, -0.03145408630371094, -0.029711246490478516, -0.027968406677246094, -0.026225566864013672, -0.02448272705078125, -0.022739887237548828, -0.020997047424316406, -0.019254207611083984, -0.017511367797851562, -0.01576852798461914, -0.014025688171386719, -0.012282848358154297, -0.010540008544921875, -0.008797168731689453, -0.007054328918457031, -0.005311489105224609, -0.0035686492919921875, -0.0018258094787597656, -8.296966552734375e-05, 0.0016598701477050781, 0.0034027099609375, 0.005145549774169922, 0.006888389587402344, 0.008631229400634766, 0.010374069213867188, 0.01211690902709961, 0.013859748840332031, 0.015602588653564453, 0.017345428466796875, 0.019088268280029297, 0.02083110809326172, 0.02257394790649414, 0.024316787719726562, 0.026059627532958984, 0.027802467346191406, 0.029545307159423828, 0.03128814697265625, 0.03303098678588867, 0.034773826599121094, 0.036516666412353516, 0.03825950622558594, 0.04000234603881836, 0.04174518585205078, 0.0434880256652832, 0.045230865478515625, 0.04697370529174805, 0.04871654510498047, 0.05045938491821289, 0.05220222473144531, 0.053945064544677734, 0.055687904357910156, 0.05743074417114258, 0.059173583984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 13.0, 28.0, 65.0, 129.0, 215.0, 226.0, 170.0, 106.0, 34.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.140767812728882, -2.101344347000122, -2.0619211196899414, -2.0224976539611816, -1.983074426651001, -1.9436509609222412, -1.904227614402771, -1.8648042678833008, -1.8253809213638306, -1.7859575748443604, -1.7465342283248901, -1.70711088180542, -1.6676874160766602, -1.62826406955719, -1.5888407230377197, -1.5494173765182495, -1.5099940299987793, -1.470570683479309, -1.4311473369598389, -1.3917239904403687, -1.3523006439208984, -1.3128771781921387, -1.2734538316726685, -1.2340304851531982, -1.194607138633728, -1.1551837921142578, -1.1157604455947876, -1.0763370990753174, -1.0369136333465576, -0.9974903464317322, -0.9580669403076172, -0.918643593788147, -0.879220187664032, -0.8397968411445618, -0.8003734350204468, -0.7609500885009766, -0.7215267419815063, -0.6821033954620361, -0.6426800489425659, -0.6032566428184509, -0.5638332962989807, -0.5244099497795105, -0.4849865734577179, -0.4455631971359253, -0.4061398506164551, -0.36671650409698486, -0.32729312777519226, -0.28786975145339966, -0.24844640493392944, -0.20902304351329803, -0.16959968209266663, -0.13017632067203522, -0.09075295925140381, -0.0513295978307724, -0.011906236410140991, 0.02751713991165161, 0.06694048643112183, 0.10636384785175323, 0.14578720927238464, 0.18521057069301605, 0.22463393211364746, 0.2640572786331177, 0.3034806549549103, 0.3429040312767029, 0.3823273777961731]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 10.0, 19.0, 13.0, 21.0, 16.0, 31.0, 27.0, 44.0, 43.0, 28.0, 37.0, 50.0, 44.0, 50.0, 53.0, 40.0, 48.0, 47.0, 36.0, 46.0, 36.0, 35.0, 34.0, 29.0, 27.0, 24.0, 19.0, 18.0, 14.0, 8.0, 7.0, 7.0, 5.0, 6.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4714987874031067, -0.4570818245410919, -0.44266486167907715, -0.42824786901474, -0.4138309061527252, -0.39941394329071045, -0.3849969804286957, -0.3705800175666809, -0.35616302490234375, -0.341746062040329, -0.3273290991783142, -0.31291210651397705, -0.2984951436519623, -0.2840781807899475, -0.26966121792793274, -0.25524425506591797, -0.2408272922039032, -0.22641032934188843, -0.21199335157871246, -0.1975763887166977, -0.18315941095352173, -0.16874244809150696, -0.1543254852294922, -0.13990852236747742, -0.12549154460430145, -0.11107457429170609, -0.09665760397911072, -0.08224064111709595, -0.06782367080450058, -0.05340670049190521, -0.03898973762989044, -0.024572767317295074, -0.010155797004699707, 0.004261171445250511, 0.01867813989520073, 0.0330951064825058, 0.047512076795101166, 0.06192904710769653, 0.0763460099697113, 0.09076298028230667, 0.10517995059490204, 0.1195969209074974, 0.13401389122009277, 0.14843085408210754, 0.16284781694412231, 0.17726479470729828, 0.19168175756931305, 0.206098735332489, 0.22051569819450378, 0.23493266105651855, 0.24934963881969452, 0.2637665867805481, 0.27818357944488525, 0.2926005423069, 0.3070175051689148, 0.32143446803092957, 0.33585143089294434, 0.3502683937549591, 0.3646853566169739, 0.37910234928131104, 0.3935193121433258, 0.4079362750053406, 0.42235323786735535, 0.4367702007293701, 0.4511871933937073]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 9.0, 12.0, 14.0, 20.0, 22.0, 46.0, 57.0, 101.0, 118.0, 220.0, 345.0, 599.0, 1064.0, 1909.0, 3300.0, 6045.0, 11485.0, 22437.0, 45206.0, 96256.0, 222717.0, 591815.0, 1520102.0, 1026428.0, 364044.0, 147088.0, 65978.0, 32139.0, 16041.0, 8167.0, 4511.0, 2495.0, 1381.0, 805.0, 474.0, 274.0, 194.0, 119.0, 91.0, 60.0, 25.0, 24.0, 17.0, 4.0, 4.0, 7.0, 9.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06201171875, -0.059927940368652344, -0.05784416198730469, -0.05576038360595703, -0.053676605224609375, -0.05159282684326172, -0.04950904846191406, -0.047425270080566406, -0.04534149169921875, -0.043257713317871094, -0.04117393493652344, -0.03909015655517578, -0.037006378173828125, -0.03492259979248047, -0.03283882141113281, -0.030755043029785156, -0.0286712646484375, -0.026587486267089844, -0.024503707885742188, -0.02241992950439453, -0.020336151123046875, -0.01825237274169922, -0.016168594360351562, -0.014084815979003906, -0.01200103759765625, -0.009917259216308594, -0.007833480834960938, -0.005749702453613281, -0.003665924072265625, -0.0015821456909179688, 0.0005016326904296875, 0.0025854110717773438, 0.004669189453125, 0.006752967834472656, 0.008836746215820312, 0.010920524597167969, 0.013004302978515625, 0.015088081359863281, 0.017171859741210938, 0.019255638122558594, 0.02133941650390625, 0.023423194885253906, 0.025506973266601562, 0.02759075164794922, 0.029674530029296875, 0.03175830841064453, 0.03384208679199219, 0.035925865173339844, 0.0380096435546875, 0.040093421936035156, 0.04217720031738281, 0.04426097869873047, 0.046344757080078125, 0.04842853546142578, 0.05051231384277344, 0.052596092224121094, 0.05467987060546875, 0.056763648986816406, 0.05884742736816406, 0.06093120574951172, 0.06301498413085938, 0.06509876251220703, 0.06718254089355469, 0.06926631927490234, 0.07135009765625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 7.0, 11.0, 13.0, 11.0, 19.0, 19.0, 24.0, 18.0, 29.0, 29.0, 24.0, 32.0, 32.0, 45.0, 35.0, 35.0, 57.0, 46.0, 48.0, 56.0, 44.0, 45.0, 41.0, 33.0, 28.0, 33.0, 30.0, 26.0, 23.0, 19.0, 10.0, 16.0, 7.0, 6.0, 7.0, 5.0, 9.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05718994140625, -0.05518913269042969, -0.053188323974609375, -0.05118751525878906, -0.04918670654296875, -0.04718589782714844, -0.045185089111328125, -0.04318428039550781, -0.0411834716796875, -0.03918266296386719, -0.037181854248046875, -0.03518104553222656, -0.03318023681640625, -0.031179428100585938, -0.029178619384765625, -0.027177810668945312, -0.025177001953125, -0.023176193237304688, -0.021175384521484375, -0.019174575805664062, -0.01717376708984375, -0.015172958374023438, -0.013172149658203125, -0.011171340942382812, -0.0091705322265625, -0.0071697235107421875, -0.005168914794921875, -0.0031681060791015625, -0.00116729736328125, 0.0008335113525390625, 0.002834320068359375, 0.0048351287841796875, 0.0068359375, 0.008836746215820312, 0.010837554931640625, 0.012838363647460938, 0.01483917236328125, 0.016839981079101562, 0.018840789794921875, 0.020841598510742188, 0.0228424072265625, 0.024843215942382812, 0.026844024658203125, 0.028844833374023438, 0.03084564208984375, 0.03284645080566406, 0.034847259521484375, 0.03684806823730469, 0.038848876953125, 0.04084968566894531, 0.042850494384765625, 0.04485130310058594, 0.04685211181640625, 0.04885292053222656, 0.050853729248046875, 0.05285453796386719, 0.0548553466796875, 0.05685615539550781, 0.058856964111328125, 0.06085777282714844, 0.06285858154296875, 0.06485939025878906, 0.06686019897460938, 0.06886100769042969, 0.07086181640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 25.0, 27.0, 44.0, 71.0, 93.0, 145.0, 199.0, 336.0, 473.0, 834.0, 1326.0, 2282.0, 3996.0, 7221.0, 14640.0, 30310.0, 66291.0, 156797.0, 410652.0, 1275361.0, 1436501.0, 470418.0, 175821.0, 73126.0, 33209.0, 15765.0, 7949.0, 4087.0, 2450.0, 1400.0, 837.0, 534.0, 329.0, 232.0, 142.0, 107.0, 60.0, 64.0, 41.0, 24.0, 8.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0931396484375, -0.09023475646972656, -0.08732986450195312, -0.08442497253417969, -0.08152008056640625, -0.07861518859863281, -0.07571029663085938, -0.07280540466308594, -0.0699005126953125, -0.06699562072753906, -0.06409072875976562, -0.06118583679199219, -0.05828094482421875, -0.05537605285644531, -0.052471160888671875, -0.04956626892089844, -0.046661376953125, -0.04375648498535156, -0.040851593017578125, -0.03794670104980469, -0.03504180908203125, -0.03213691711425781, -0.029232025146484375, -0.026327133178710938, -0.0234222412109375, -0.020517349243164062, -0.017612457275390625, -0.014707565307617188, -0.01180267333984375, -0.008897781372070312, -0.005992889404296875, -0.0030879974365234375, -0.00018310546875, 0.0027217864990234375, 0.005626678466796875, 0.008531570434570312, 0.01143646240234375, 0.014341354370117188, 0.017246246337890625, 0.020151138305664062, 0.0230560302734375, 0.025960922241210938, 0.028865814208984375, 0.03177070617675781, 0.03467559814453125, 0.03758049011230469, 0.040485382080078125, 0.04339027404785156, 0.046295166015625, 0.04920005798339844, 0.052104949951171875, 0.05500984191894531, 0.05791473388671875, 0.06081962585449219, 0.06372451782226562, 0.06662940979003906, 0.0695343017578125, 0.07243919372558594, 0.07534408569335938, 0.07824897766113281, 0.08115386962890625, 0.08405876159667969, 0.08696365356445312, 0.08986854553222656, 0.0927734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 19.0, 27.0, 25.0, 50.0, 79.0, 103.0, 166.0, 248.0, 417.0, 627.0, 749.0, 557.0, 336.0, 232.0, 131.0, 86.0, 58.0, 46.0, 37.0, 14.0, 16.0, 7.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12064552307128906, -0.11568069458007812, -0.11071586608886719, -0.10575103759765625, -0.10078620910644531, -0.09582138061523438, -0.09085655212402344, -0.0858917236328125, -0.08092689514160156, -0.07596206665039062, -0.07099723815917969, -0.06603240966796875, -0.06106758117675781, -0.056102752685546875, -0.05113792419433594, -0.046173095703125, -0.04120826721191406, -0.036243438720703125, -0.03127861022949219, -0.02631378173828125, -0.021348953247070312, -0.016384124755859375, -0.011419296264648438, -0.0064544677734375, -0.0014896392822265625, 0.003475189208984375, 0.008440017700195312, 0.01340484619140625, 0.018369674682617188, 0.023334503173828125, 0.028299331665039062, 0.03326416015625, 0.03822898864746094, 0.043193817138671875, 0.04815864562988281, 0.05312347412109375, 0.05808830261230469, 0.06305313110351562, 0.06801795959472656, 0.0729827880859375, 0.07794761657714844, 0.08291244506835938, 0.08787727355957031, 0.09284210205078125, 0.09780693054199219, 0.10277175903320312, 0.10773658752441406, 0.112701416015625, 0.11766624450683594, 0.12263107299804688, 0.1275959014892578, 0.13256072998046875, 0.1375255584716797, 0.14249038696289062, 0.14745521545410156, 0.1524200439453125, 0.15738487243652344, 0.16234970092773438, 0.1673145294189453, 0.17227935791015625, 0.1772441864013672, 0.18220901489257812, 0.18717384338378906, 0.192138671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 15.0, 26.0, 50.0, 42.0, 84.0, 99.0, 120.0, 124.0, 115.0, 94.0, 72.0, 59.0, 45.0, 24.0, 10.0, 10.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0500328540802002, -1.024706482887268, -0.9993801712989807, -0.9740538597106934, -0.9487274885177612, -0.9234011769294739, -0.8980748653411865, -0.8727484941482544, -0.847422182559967, -0.8220958709716797, -0.7967694997787476, -0.7714431881904602, -0.7461168169975281, -0.7207905054092407, -0.6954641342163086, -0.6701378226280212, -0.6448115110397339, -0.6194851994514465, -0.5941588282585144, -0.568832516670227, -0.5435061454772949, -0.5181798338890076, -0.4928534924983978, -0.4675271511077881, -0.44220077991485596, -0.4168744385242462, -0.3915480971336365, -0.3662217855453491, -0.3408954441547394, -0.31556910276412964, -0.2902427613735199, -0.26491641998291016, -0.2395901083946228, -0.21426376700401306, -0.18893744051456451, -0.16361109912395477, -0.13828477263450623, -0.11295843124389648, -0.08763208985328674, -0.062305763363838196, -0.036979421973228455, -0.011653086170554161, 0.013673249632120132, 0.038999587297439575, 0.06432592123746872, 0.08965225517749786, 0.1149785965681076, 0.14030492305755615, 0.1656312644481659, 0.19095760583877563, 0.21628393232822418, 0.24161027371883392, 0.26693660020828247, 0.2922629415988922, 0.31758928298950195, 0.3429155945777893, 0.36824196577072144, 0.3935683071613312, 0.4188946485519409, 0.44422096014022827, 0.469547301530838, 0.49487364292144775, 0.5202000141143799, 0.5455263257026672, 0.5708526372909546]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 8.0, 7.0, 7.0, 10.0, 15.0, 18.0, 19.0, 20.0, 25.0, 36.0, 28.0, 34.0, 37.0, 35.0, 40.0, 39.0, 44.0, 41.0, 39.0, 48.0, 39.0, 37.0, 39.0, 39.0, 36.0, 29.0, 31.0, 28.0, 31.0, 26.0, 16.0, 19.0, 13.0, 8.0, 11.0, 5.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.38728368282318115, -0.3750231862068176, -0.3627626895904541, -0.35050222277641296, -0.33824172616004944, -0.3259812295436859, -0.3137207329273224, -0.30146026611328125, -0.2891997694969177, -0.2769392728805542, -0.2646787762641907, -0.25241830945014954, -0.240157812833786, -0.22789731621742249, -0.21563681960105896, -0.20337633788585663, -0.1911158412694931, -0.17885534465312958, -0.16659486293792725, -0.15433436632156372, -0.1420738846063614, -0.12981338798999786, -0.11755289882421494, -0.105292409658432, -0.09303192049264908, -0.08077143132686615, -0.06851094216108322, -0.056250449270009995, -0.043989960104227066, -0.03172947093844414, -0.01946897804737091, -0.007208488881587982, 0.005052000284194946, 0.017312489449977875, 0.029572980478405952, 0.04183347150683403, 0.05409396067261696, 0.06635445356369019, 0.07861494272947311, 0.09087543189525604, 0.10313592106103897, 0.1153964102268219, 0.12765690684318542, 0.13991738855838776, 0.15217788517475128, 0.1644383668899536, 0.17669886350631714, 0.18895936012268066, 0.201219841837883, 0.21348033845424652, 0.22574082016944885, 0.23800131678581238, 0.2502618134021759, 0.26252228021621704, 0.27478277683258057, 0.2870432734489441, 0.2993037700653076, 0.31156426668167114, 0.32382476329803467, 0.3360852301120758, 0.34834572672843933, 0.36060622334480286, 0.3728667199611664, 0.3851271867752075, 0.39738768339157104]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 13.0, 18.0, 34.0, 39.0, 70.0, 118.0, 142.0, 294.0, 430.0, 687.0, 1015.0, 1618.0, 2513.0, 4057.0, 6210.0, 9620.0, 14848.0, 23489.0, 37911.0, 62632.0, 107178.0, 177346.0, 217001.0, 151513.0, 88854.0, 52507.0, 32270.0, 20066.0, 12936.0, 8233.0, 5400.0, 3444.0, 2155.0, 1356.0, 930.0, 521.0, 405.0, 228.0, 166.0, 91.0, 68.0, 46.0, 28.0, 13.0, 12.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.074462890625, -0.0721597671508789, -0.06985664367675781, -0.06755352020263672, -0.06525039672851562, -0.06294727325439453, -0.06064414978027344, -0.058341026306152344, -0.05603790283203125, -0.053734779357910156, -0.05143165588378906, -0.04912853240966797, -0.046825408935546875, -0.04452228546142578, -0.04221916198730469, -0.039916038513183594, -0.0376129150390625, -0.035309791564941406, -0.03300666809082031, -0.03070354461669922, -0.028400421142578125, -0.02609729766845703, -0.023794174194335938, -0.021491050720214844, -0.01918792724609375, -0.016884803771972656, -0.014581680297851562, -0.012278556823730469, -0.009975433349609375, -0.007672309875488281, -0.0053691864013671875, -0.0030660629272460938, -0.000762939453125, 0.0015401840209960938, 0.0038433074951171875, 0.006146430969238281, 0.008449554443359375, 0.010752677917480469, 0.013055801391601562, 0.015358924865722656, 0.01766204833984375, 0.019965171813964844, 0.022268295288085938, 0.02457141876220703, 0.026874542236328125, 0.02917766571044922, 0.03148078918457031, 0.033783912658691406, 0.0360870361328125, 0.038390159606933594, 0.04069328308105469, 0.04299640655517578, 0.045299530029296875, 0.04760265350341797, 0.04990577697753906, 0.052208900451660156, 0.05451202392578125, 0.056815147399902344, 0.05911827087402344, 0.06142139434814453, 0.06372451782226562, 0.06602764129638672, 0.06833076477050781, 0.0706338882446289, 0.07293701171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 12.0, 5.0, 9.0, 9.0, 10.0, 22.0, 21.0, 26.0, 30.0, 23.0, 28.0, 27.0, 40.0, 38.0, 50.0, 37.0, 41.0, 42.0, 38.0, 47.0, 35.0, 40.0, 37.0, 45.0, 30.0, 40.0, 32.0, 30.0, 28.0, 19.0, 25.0, 9.0, 13.0, 9.0, 5.0, 4.0, 12.0, 3.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05621337890625, -0.054299354553222656, -0.05238533020019531, -0.05047130584716797, -0.048557281494140625, -0.04664325714111328, -0.04472923278808594, -0.042815208435058594, -0.04090118408203125, -0.038987159729003906, -0.03707313537597656, -0.03515911102294922, -0.033245086669921875, -0.03133106231689453, -0.029417037963867188, -0.027503013610839844, -0.0255889892578125, -0.023674964904785156, -0.021760940551757812, -0.01984691619873047, -0.017932891845703125, -0.01601886749267578, -0.014104843139648438, -0.012190818786621094, -0.01027679443359375, -0.008362770080566406, -0.0064487457275390625, -0.004534721374511719, -0.002620697021484375, -0.0007066726684570312, 0.0012073516845703125, 0.0031213760375976562, 0.005035400390625, 0.006949424743652344, 0.008863449096679688, 0.010777473449707031, 0.012691497802734375, 0.014605522155761719, 0.016519546508789062, 0.018433570861816406, 0.02034759521484375, 0.022261619567871094, 0.024175643920898438, 0.02608966827392578, 0.028003692626953125, 0.02991771697998047, 0.03183174133300781, 0.033745765686035156, 0.0356597900390625, 0.037573814392089844, 0.03948783874511719, 0.04140186309814453, 0.043315887451171875, 0.04522991180419922, 0.04714393615722656, 0.049057960510253906, 0.05097198486328125, 0.052886009216308594, 0.05480003356933594, 0.05671405792236328, 0.058628082275390625, 0.06054210662841797, 0.06245613098144531, 0.06437015533447266, 0.0662841796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 10.0, 6.0, 8.0, 9.0, 15.0, 31.0, 24.0, 39.0, 50.0, 62.0, 96.0, 145.0, 234.0, 324.0, 607.0, 1592.0, 4950.0, 17198.0, 61364.0, 225380.0, 485938.0, 180014.0, 49755.0, 13856.0, 4021.0, 1335.0, 538.0, 298.0, 182.0, 139.0, 93.0, 64.0, 39.0, 36.0, 25.0, 20.0, 17.0, 10.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1871337890625, -0.18117713928222656, -0.17522048950195312, -0.1692638397216797, -0.16330718994140625, -0.1573505401611328, -0.15139389038085938, -0.14543724060058594, -0.1394805908203125, -0.13352394104003906, -0.12756729125976562, -0.12161064147949219, -0.11565399169921875, -0.10969734191894531, -0.10374069213867188, -0.09778404235839844, -0.091827392578125, -0.08587074279785156, -0.07991409301757812, -0.07395744323730469, -0.06800079345703125, -0.06204414367675781, -0.056087493896484375, -0.05013084411621094, -0.0441741943359375, -0.03821754455566406, -0.032260894775390625, -0.026304244995117188, -0.02034759521484375, -0.014390945434570312, -0.008434295654296875, -0.0024776458740234375, 0.00347900390625, 0.009435653686523438, 0.015392303466796875, 0.021348953247070312, 0.02730560302734375, 0.03326225280761719, 0.039218902587890625, 0.04517555236816406, 0.0511322021484375, 0.05708885192871094, 0.06304550170898438, 0.06900215148925781, 0.07495880126953125, 0.08091545104980469, 0.08687210083007812, 0.09282875061035156, 0.098785400390625, 0.10474205017089844, 0.11069869995117188, 0.11665534973144531, 0.12261199951171875, 0.1285686492919922, 0.13452529907226562, 0.14048194885253906, 0.1464385986328125, 0.15239524841308594, 0.15835189819335938, 0.1643085479736328, 0.17026519775390625, 0.1762218475341797, 0.18217849731445312, 0.18813514709472656, 0.194091796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 8.0, 12.0, 11.0, 8.0, 13.0, 7.0, 12.0, 14.0, 21.0, 14.0, 33.0, 24.0, 34.0, 31.0, 32.0, 35.0, 40.0, 32.0, 44.0, 35.0, 43.0, 40.0, 38.0, 32.0, 34.0, 38.0, 33.0, 28.0, 35.0, 32.0, 20.0, 23.0, 17.0, 22.0, 7.0, 20.0, 13.0, 17.0, 7.0, 10.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.15104103088378906, -0.14570999145507812, -0.1403789520263672, -0.13504791259765625, -0.1297168731689453, -0.12438583374023438, -0.11905479431152344, -0.1137237548828125, -0.10839271545410156, -0.10306167602539062, -0.09773063659667969, -0.09239959716796875, -0.08706855773925781, -0.08173751831054688, -0.07640647888183594, -0.071075439453125, -0.06574440002441406, -0.060413360595703125, -0.05508232116699219, -0.04975128173828125, -0.04442024230957031, -0.039089202880859375, -0.03375816345214844, -0.0284271240234375, -0.023096084594726562, -0.017765045166015625, -0.012434005737304688, -0.00710296630859375, -0.0017719268798828125, 0.003559112548828125, 0.008890151977539062, 0.01422119140625, 0.019552230834960938, 0.024883270263671875, 0.030214309692382812, 0.03554534912109375, 0.04087638854980469, 0.046207427978515625, 0.05153846740722656, 0.0568695068359375, 0.06220054626464844, 0.06753158569335938, 0.07286262512207031, 0.07819366455078125, 0.08352470397949219, 0.08885574340820312, 0.09418678283691406, 0.099517822265625, 0.10484886169433594, 0.11017990112304688, 0.11551094055175781, 0.12084197998046875, 0.1261730194091797, 0.13150405883789062, 0.13683509826660156, 0.1421661376953125, 0.14749717712402344, 0.15282821655273438, 0.1581592559814453, 0.16349029541015625, 0.1688213348388672, 0.17415237426757812, 0.17948341369628906, 0.184814453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 10.0, 15.0, 24.0, 18.0, 27.0, 35.0, 42.0, 69.0, 110.0, 167.0, 342.0, 642.0, 1359.0, 3348.0, 8279.0, 22345.0, 59686.0, 159243.0, 390613.0, 253169.0, 92293.0, 34831.0, 13092.0, 4858.0, 1981.0, 826.0, 412.0, 247.0, 135.0, 92.0, 72.0, 44.0, 28.0, 21.0, 15.0, 11.0, 8.0, 12.0, 4.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07373046875, -0.07160711288452148, -0.06948375701904297, -0.06736040115356445, -0.06523704528808594, -0.06311368942260742, -0.060990333557128906, -0.05886697769165039, -0.056743621826171875, -0.05462026596069336, -0.052496910095214844, -0.05037355422973633, -0.04825019836425781, -0.0461268424987793, -0.04400348663330078, -0.041880130767822266, -0.03975677490234375, -0.037633419036865234, -0.03551006317138672, -0.0333867073059082, -0.03126335144042969, -0.029139995574951172, -0.027016639709472656, -0.02489328384399414, -0.022769927978515625, -0.02064657211303711, -0.018523216247558594, -0.016399860382080078, -0.014276504516601562, -0.012153148651123047, -0.010029792785644531, -0.007906436920166016, -0.0057830810546875, -0.0036597251892089844, -0.0015363693237304688, 0.0005869865417480469, 0.0027103424072265625, 0.004833698272705078, 0.006957054138183594, 0.00908041000366211, 0.011203765869140625, 0.01332712173461914, 0.015450477600097656, 0.017573833465576172, 0.019697189331054688, 0.021820545196533203, 0.02394390106201172, 0.026067256927490234, 0.02819061279296875, 0.030313968658447266, 0.03243732452392578, 0.0345606803894043, 0.03668403625488281, 0.03880739212036133, 0.040930747985839844, 0.04305410385131836, 0.045177459716796875, 0.04730081558227539, 0.049424171447753906, 0.05154752731323242, 0.05367088317871094, 0.05579423904418945, 0.05791759490966797, 0.060040950775146484, 0.062164306640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 17.0, 11.0, 20.0, 20.0, 37.0, 41.0, 50.0, 84.0, 85.0, 84.0, 107.0, 93.0, 69.0, 73.0, 48.0, 50.0, 24.0, 18.0, 17.0, 13.0, 5.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-05, -2.6103109121322632e-05, -2.5384128093719482e-05, -2.4665147066116333e-05, -2.3946166038513184e-05, -2.3227185010910034e-05, -2.2508203983306885e-05, -2.1789222955703735e-05, -2.1070241928100586e-05, -2.0351260900497437e-05, -1.9632279872894287e-05, -1.8913298845291138e-05, -1.8194317817687988e-05, -1.747533679008484e-05, -1.675635576248169e-05, -1.603737473487854e-05, -1.531839370727539e-05, -1.4599412679672241e-05, -1.3880431652069092e-05, -1.3161450624465942e-05, -1.2442469596862793e-05, -1.1723488569259644e-05, -1.1004507541656494e-05, -1.0285526514053345e-05, -9.566545486450195e-06, -8.847564458847046e-06, -8.128583431243896e-06, -7.409602403640747e-06, -6.690621376037598e-06, -5.971640348434448e-06, -5.252659320831299e-06, -4.533678293228149e-06, -3.814697265625e-06, -3.0957162380218506e-06, -2.376735210418701e-06, -1.6577541828155518e-06, -9.387731552124023e-07, -2.1979212760925293e-07, 4.991888999938965e-07, 1.218169927597046e-06, 1.9371509552001953e-06, 2.6561319828033447e-06, 3.375113010406494e-06, 4.0940940380096436e-06, 4.813075065612793e-06, 5.532056093215942e-06, 6.251037120819092e-06, 6.970018148422241e-06, 7.68899917602539e-06, 8.40798020362854e-06, 9.12696123123169e-06, 9.845942258834839e-06, 1.0564923286437988e-05, 1.1283904314041138e-05, 1.2002885341644287e-05, 1.2721866369247437e-05, 1.3440847396850586e-05, 1.4159828424453735e-05, 1.4878809452056885e-05, 1.5597790479660034e-05, 1.6316771507263184e-05, 1.7035752534866333e-05, 1.7754733562469482e-05, 1.8473714590072632e-05, 1.919269561767578e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 9.0, 10.0, 18.0, 17.0, 26.0, 37.0, 49.0, 81.0, 119.0, 153.0, 231.0, 507.0, 979.0, 2401.0, 6772.0, 19930.0, 57189.0, 156206.0, 363475.0, 276235.0, 105243.0, 37883.0, 13131.0, 4393.0, 1725.0, 742.0, 373.0, 201.0, 113.0, 90.0, 61.0, 43.0, 36.0, 20.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06663036346435547, -0.06453514099121094, -0.062439918518066406, -0.060344696044921875, -0.058249473571777344, -0.05615425109863281, -0.05405902862548828, -0.05196380615234375, -0.04986858367919922, -0.04777336120605469, -0.045678138732910156, -0.043582916259765625, -0.041487693786621094, -0.03939247131347656, -0.03729724884033203, -0.0352020263671875, -0.03310680389404297, -0.031011581420898438, -0.028916358947753906, -0.026821136474609375, -0.024725914001464844, -0.022630691528320312, -0.02053546905517578, -0.01844024658203125, -0.01634502410888672, -0.014249801635742188, -0.012154579162597656, -0.010059356689453125, -0.007964134216308594, -0.0058689117431640625, -0.0037736892700195312, -0.001678466796875, 0.00041675567626953125, 0.0025119781494140625, 0.004607200622558594, 0.006702423095703125, 0.008797645568847656, 0.010892868041992188, 0.012988090515136719, 0.01508331298828125, 0.01717853546142578, 0.019273757934570312, 0.021368980407714844, 0.023464202880859375, 0.025559425354003906, 0.027654647827148438, 0.02974987030029297, 0.0318450927734375, 0.03394031524658203, 0.03603553771972656, 0.038130760192871094, 0.040225982666015625, 0.042321205139160156, 0.04441642761230469, 0.04651165008544922, 0.04860687255859375, 0.05070209503173828, 0.05279731750488281, 0.054892539978027344, 0.056987762451171875, 0.059082984924316406, 0.06117820739746094, 0.06327342987060547, 0.06536865234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 15.0, 10.0, 9.0, 22.0, 20.0, 23.0, 43.0, 39.0, 36.0, 79.0, 95.0, 113.0, 116.0, 77.0, 62.0, 43.0, 39.0, 31.0, 32.0, 15.0, 14.0, 10.0, 14.0, 9.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09942626953125, -0.09714698791503906, -0.09486770629882812, -0.09258842468261719, -0.09030914306640625, -0.08802986145019531, -0.08575057983398438, -0.08347129821777344, -0.0811920166015625, -0.07891273498535156, -0.07663345336914062, -0.07435417175292969, -0.07207489013671875, -0.06979560852050781, -0.06751632690429688, -0.06523704528808594, -0.062957763671875, -0.06067848205566406, -0.058399200439453125, -0.05611991882324219, -0.05384063720703125, -0.05156135559082031, -0.049282073974609375, -0.04700279235839844, -0.0447235107421875, -0.04244422912597656, -0.040164947509765625, -0.03788566589355469, -0.03560638427734375, -0.03332710266113281, -0.031047821044921875, -0.028768539428710938, -0.0264892578125, -0.024209976196289062, -0.021930694580078125, -0.019651412963867188, -0.01737213134765625, -0.015092849731445312, -0.012813568115234375, -0.010534286499023438, -0.0082550048828125, -0.0059757232666015625, -0.003696441650390625, -0.0014171600341796875, 0.00086212158203125, 0.0031414031982421875, 0.005420684814453125, 0.0076999664306640625, 0.009979248046875, 0.012258529663085938, 0.014537811279296875, 0.016817092895507812, 0.01909637451171875, 0.021375656127929688, 0.023654937744140625, 0.025934219360351562, 0.0282135009765625, 0.030492782592773438, 0.032772064208984375, 0.03505134582519531, 0.03733062744140625, 0.03960990905761719, 0.041889190673828125, 0.04416847229003906, 0.04644775390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 11.0, 35.0, 50.0, 80.0, 98.0, 137.0, 149.0, 142.0, 112.0, 76.0, 50.0, 27.0, 10.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6319550275802612, -0.6007624864578247, -0.569570004940033, -0.5383774638175964, -0.5071849822998047, -0.47599244117736816, -0.44479990005493164, -0.4136073887348175, -0.38241487741470337, -0.35122236609458923, -0.3200298547744751, -0.2888373136520386, -0.25764480233192444, -0.2264522910118103, -0.19525976479053497, -0.16406723856925964, -0.1328747272491455, -0.10168220847845078, -0.07048968970775604, -0.03929717093706131, -0.008104652166366577, 0.02308785915374756, 0.05428038537502289, 0.08547291159629822, 0.11666542291641235, 0.1478579342365265, 0.17905046045780182, 0.21024298667907715, 0.24143549799919128, 0.2726280093193054, 0.30382055044174194, 0.3350130617618561, 0.3662055730819702, 0.39739808440208435, 0.4285905957221985, 0.459783136844635, 0.49097564816474915, 0.5221681594848633, 0.5533607006072998, 0.5845532417297363, 0.6157457232475281, 0.6469382643699646, 0.6781307458877563, 0.7093232870101929, 0.7405158281326294, 0.7717083096504211, 0.8029008507728577, 0.8340933322906494, 0.8652858734130859, 0.8964784145355225, 0.9276708960533142, 0.9588634371757507, 0.9900559186935425, 1.021248459815979, 1.0524410009384155, 1.083633542060852, 1.114825963973999, 1.1460185050964355, 1.177211046218872, 1.208403468132019, 1.2395960092544556, 1.270788550376892, 1.3019810914993286, 1.3331736326217651, 1.3643661737442017]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 6.0, 10.0, 11.0, 15.0, 17.0, 18.0, 15.0, 25.0, 26.0, 26.0, 27.0, 33.0, 28.0, 39.0, 36.0, 41.0, 46.0, 48.0, 31.0, 41.0, 42.0, 41.0, 39.0, 34.0, 30.0, 36.0, 29.0, 28.0, 37.0, 18.0, 23.0, 12.0, 16.0, 16.0, 12.0, 10.0, 5.0, 6.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54017174243927, -0.5241564512252808, -0.5081411004066467, -0.49212580919265747, -0.4761105179786682, -0.46009519696235657, -0.4440798759460449, -0.42806458473205566, -0.412049263715744, -0.3960339426994324, -0.3800186514854431, -0.36400333046913147, -0.3479880094528198, -0.33197271823883057, -0.3159573972225189, -0.2999420762062073, -0.283926784992218, -0.26791146397590637, -0.2518961727619171, -0.23588085174560547, -0.21986554563045502, -0.20385023951530457, -0.18783491849899292, -0.17181961238384247, -0.15580430626869202, -0.13978900015354156, -0.12377368658781052, -0.10775837302207947, -0.09174306690692902, -0.07572776079177856, -0.059712447226047516, -0.04369713366031647, -0.027681827545166016, -0.011666517704725266, 0.004348792135715485, 0.020364101976156235, 0.036379411816596985, 0.052394717931747437, 0.06841003149747849, 0.08442534506320953, 0.10044065117835999, 0.11645595729351044, 0.1324712634086609, 0.14848658442497253, 0.16450189054012299, 0.18051719665527344, 0.19653251767158508, 0.21254782378673553, 0.228563129901886, 0.24457843601703644, 0.2605937421321869, 0.27660906314849854, 0.2926243543624878, 0.30863967537879944, 0.3246549963951111, 0.34067028760910034, 0.356685608625412, 0.37270092964172363, 0.3887162208557129, 0.40473154187202454, 0.4207468628883362, 0.43676215410232544, 0.4527774751186371, 0.46879279613494873, 0.484808087348938]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 19.0, 34.0, 42.0, 55.0, 103.0, 169.0, 306.0, 495.0, 810.0, 1550.0, 2781.0, 5417.0, 10370.0, 19787.0, 40330.0, 83473.0, 184631.0, 473966.0, 1387776.0, 1237716.0, 424122.0, 168866.0, 76203.0, 36696.0, 18539.0, 9277.0, 4873.0, 2562.0, 1430.0, 782.0, 424.0, 269.0, 146.0, 84.0, 49.0, 33.0, 23.0, 12.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.08477783203125, -0.08248281478881836, -0.08018779754638672, -0.07789278030395508, -0.07559776306152344, -0.0733027458190918, -0.07100772857666016, -0.06871271133422852, -0.06641769409179688, -0.06412267684936523, -0.061827659606933594, -0.05953264236450195, -0.05723762512207031, -0.05494260787963867, -0.05264759063720703, -0.05035257339477539, -0.04805755615234375, -0.04576253890991211, -0.04346752166748047, -0.04117250442504883, -0.03887748718261719, -0.03658246994018555, -0.034287452697753906, -0.031992435455322266, -0.029697418212890625, -0.027402400970458984, -0.025107383728027344, -0.022812366485595703, -0.020517349243164062, -0.018222332000732422, -0.01592731475830078, -0.01363229751586914, -0.0113372802734375, -0.00904226303100586, -0.006747245788574219, -0.004452228546142578, -0.0021572113037109375, 0.00013780593872070312, 0.0024328231811523438, 0.004727840423583984, 0.007022857666015625, 0.009317874908447266, 0.011612892150878906, 0.013907909393310547, 0.016202926635742188, 0.018497943878173828, 0.02079296112060547, 0.02308797836303711, 0.02538299560546875, 0.02767801284790039, 0.02997303009033203, 0.03226804733276367, 0.03456306457519531, 0.03685808181762695, 0.039153099060058594, 0.041448116302490234, 0.043743133544921875, 0.046038150787353516, 0.048333168029785156, 0.0506281852722168, 0.05292320251464844, 0.05521821975708008, 0.05751323699951172, 0.05980825424194336, 0.062103271484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 10.0, 6.0, 7.0, 6.0, 5.0, 10.0, 13.0, 14.0, 18.0, 27.0, 20.0, 20.0, 29.0, 32.0, 37.0, 33.0, 35.0, 33.0, 38.0, 45.0, 52.0, 49.0, 40.0, 41.0, 38.0, 39.0, 27.0, 35.0, 32.0, 28.0, 24.0, 26.0, 22.0, 12.0, 12.0, 13.0, 9.0, 9.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.06884765625, -0.06691455841064453, -0.06498146057128906, -0.0630483627319336, -0.061115264892578125, -0.059182167053222656, -0.05724906921386719, -0.05531597137451172, -0.05338287353515625, -0.05144977569580078, -0.04951667785644531, -0.047583580017089844, -0.045650482177734375, -0.043717384338378906, -0.04178428649902344, -0.03985118865966797, -0.0379180908203125, -0.03598499298095703, -0.03405189514160156, -0.032118797302246094, -0.030185699462890625, -0.028252601623535156, -0.026319503784179688, -0.02438640594482422, -0.02245330810546875, -0.02052021026611328, -0.018587112426757812, -0.016654014587402344, -0.014720916748046875, -0.012787818908691406, -0.010854721069335938, -0.008921623229980469, -0.006988525390625, -0.005055427551269531, -0.0031223297119140625, -0.0011892318725585938, 0.000743865966796875, 0.0026769638061523438, 0.0046100616455078125, 0.006543159484863281, 0.00847625732421875, 0.010409355163574219, 0.012342453002929688, 0.014275550842285156, 0.016208648681640625, 0.018141746520996094, 0.020074844360351562, 0.02200794219970703, 0.0239410400390625, 0.02587413787841797, 0.027807235717773438, 0.029740333557128906, 0.031673431396484375, 0.033606529235839844, 0.03553962707519531, 0.03747272491455078, 0.03940582275390625, 0.04133892059326172, 0.04327201843261719, 0.045205116271972656, 0.047138214111328125, 0.049071311950683594, 0.05100440979003906, 0.05293750762939453, 0.05487060546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 19.0, 23.0, 29.0, 43.0, 58.0, 81.0, 121.0, 163.0, 232.0, 452.0, 740.0, 1152.0, 2193.0, 3799.0, 7018.0, 12786.0, 23495.0, 44234.0, 84756.0, 169561.0, 371409.0, 925195.0, 1383059.0, 630435.0, 265364.0, 127690.0, 64674.0, 34193.0, 18193.0, 10022.0, 5611.0, 3119.0, 1672.0, 981.0, 575.0, 373.0, 229.0, 162.0, 109.0, 67.0, 60.0, 32.0, 23.0, 25.0, 10.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0], "bins": [-0.0902099609375, -0.08765411376953125, -0.0850982666015625, -0.08254241943359375, -0.079986572265625, -0.07743072509765625, -0.0748748779296875, -0.07231903076171875, -0.06976318359375, -0.06720733642578125, -0.0646514892578125, -0.06209564208984375, -0.059539794921875, -0.05698394775390625, -0.0544281005859375, -0.05187225341796875, -0.04931640625, -0.04676055908203125, -0.0442047119140625, -0.04164886474609375, -0.039093017578125, -0.03653717041015625, -0.0339813232421875, -0.03142547607421875, -0.02886962890625, -0.02631378173828125, -0.0237579345703125, -0.02120208740234375, -0.018646240234375, -0.01609039306640625, -0.0135345458984375, -0.01097869873046875, -0.0084228515625, -0.00586700439453125, -0.0033111572265625, -0.00075531005859375, 0.001800537109375, 0.00435638427734375, 0.0069122314453125, 0.00946807861328125, 0.01202392578125, 0.01457977294921875, 0.0171356201171875, 0.01969146728515625, 0.022247314453125, 0.02480316162109375, 0.0273590087890625, 0.02991485595703125, 0.032470703125, 0.03502655029296875, 0.0375823974609375, 0.04013824462890625, 0.042694091796875, 0.04524993896484375, 0.0478057861328125, 0.05036163330078125, 0.05291748046875, 0.05547332763671875, 0.0580291748046875, 0.06058502197265625, 0.063140869140625, 0.06569671630859375, 0.0682525634765625, 0.07080841064453125, 0.0733642578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 13.0, 9.0, 13.0, 16.0, 23.0, 45.0, 57.0, 72.0, 102.0, 162.0, 187.0, 316.0, 405.0, 596.0, 590.0, 442.0, 312.0, 192.0, 146.0, 95.0, 69.0, 48.0, 43.0, 34.0, 25.0, 14.0, 15.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0926513671875, -0.08822250366210938, -0.08379364013671875, -0.07936477661132812, -0.0749359130859375, -0.07050704956054688, -0.06607818603515625, -0.061649322509765625, -0.057220458984375, -0.052791595458984375, -0.04836273193359375, -0.043933868408203125, -0.0395050048828125, -0.035076141357421875, -0.03064727783203125, -0.026218414306640625, -0.02178955078125, -0.017360687255859375, -0.01293182373046875, -0.008502960205078125, -0.0040740966796875, 0.000354766845703125, 0.00478363037109375, 0.009212493896484375, 0.013641357421875, 0.018070220947265625, 0.02249908447265625, 0.026927947998046875, 0.0313568115234375, 0.035785675048828125, 0.04021453857421875, 0.044643402099609375, 0.049072265625, 0.053501129150390625, 0.05792999267578125, 0.062358856201171875, 0.0667877197265625, 0.07121658325195312, 0.07564544677734375, 0.08007431030273438, 0.084503173828125, 0.08893203735351562, 0.09336090087890625, 0.09778976440429688, 0.1022186279296875, 0.10664749145507812, 0.11107635498046875, 0.11550521850585938, 0.11993408203125, 0.12436294555664062, 0.12879180908203125, 0.13322067260742188, 0.1376495361328125, 0.14207839965820312, 0.14650726318359375, 0.15093612670898438, 0.155364990234375, 0.15979385375976562, 0.16422271728515625, 0.16865158081054688, 0.1730804443359375, 0.17750930786132812, 0.18193817138671875, 0.18636703491210938, 0.1907958984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 10.0, 18.0, 43.0, 70.0, 109.0, 143.0, 167.0, 122.0, 112.0, 103.0, 48.0, 22.0, 18.0, 5.0, 9.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.579384684562683, -1.5455328226089478, -1.5116808414459229, -1.4778289794921875, -1.4439771175384521, -1.4101252555847168, -1.376273274421692, -1.3424214124679565, -1.3085694313049316, -1.2747175693511963, -1.2408655881881714, -1.207013726234436, -1.1731618642807007, -1.1393098831176758, -1.1054580211639404, -1.071606159210205, -1.0377542972564697, -1.0039024353027344, -0.9700505137443542, -0.9361985921859741, -0.9023467302322388, -0.8684948086738586, -0.8346428871154785, -0.8007910251617432, -0.766939103603363, -0.7330871820449829, -0.6992353200912476, -0.6653833985328674, -0.6315314769744873, -0.597679615020752, -0.5638276934623718, -0.5299757719039917, -0.4961237907409668, -0.46227189898490906, -0.4284200072288513, -0.3945680856704712, -0.36071619391441345, -0.3268643021583557, -0.2930123805999756, -0.25916048884391785, -0.2253085970878601, -0.19145670533180237, -0.15760479867458344, -0.1237528994679451, -0.08990100026130676, -0.05604910850524902, -0.02219720184803009, 0.011654704809188843, 0.04550659656524658, 0.07935849577188492, 0.11321039497852325, 0.1470623016357422, 0.18091419339179993, 0.21476608514785767, 0.2486179918050766, 0.28246989846229553, 0.31632179021835327, 0.350173681974411, 0.38402557373046875, 0.4178774952888489, 0.4517293870449066, 0.48558127880096436, 0.5194332003593445, 0.5532851219177246, 0.58713698387146]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 17.0, 23.0, 18.0, 27.0, 17.0, 28.0, 22.0, 34.0, 34.0, 33.0, 35.0, 40.0, 29.0, 39.0, 41.0, 38.0, 42.0, 38.0, 37.0, 30.0, 36.0, 34.0, 34.0, 23.0, 29.0, 34.0, 20.0, 23.0, 12.0, 14.0, 9.0, 11.0, 8.0, 14.0, 9.0, 6.0, 3.0, 5.0, 5.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3596317768096924, -0.34799695014953613, -0.3363621234893799, -0.32472729682922363, -0.3130924701690674, -0.30145764350891113, -0.2898228168487549, -0.27818799018859863, -0.2665531635284424, -0.25491833686828613, -0.24328351020812988, -0.23164868354797363, -0.22001385688781738, -0.20837903022766113, -0.1967441886663437, -0.18510936200618744, -0.17347452044487, -0.16183969378471375, -0.1502048671245575, -0.13857004046440125, -0.126935213804245, -0.11530037969350815, -0.1036655455827713, -0.09203071892261505, -0.0803958922624588, -0.06876106560230255, -0.057126235216856, -0.045491404831409454, -0.033856578171253204, -0.022221751511096954, -0.010586917400360107, 0.0010479092597961426, 0.012682735919952393, 0.024317564442753792, 0.03595239296555519, 0.04758722335100174, 0.05922205001115799, 0.07085687667131424, 0.08249171078205109, 0.09412653744220734, 0.10576136410236359, 0.11739619076251984, 0.1290310174226761, 0.14066585898399353, 0.15230068564414978, 0.16393551230430603, 0.17557033896446228, 0.18720516562461853, 0.19883999228477478, 0.21047481894493103, 0.22210964560508728, 0.23374447226524353, 0.24537929892539978, 0.25701412558555603, 0.26864898204803467, 0.2802838087081909, 0.29191863536834717, 0.3035534620285034, 0.31518828868865967, 0.3268231153488159, 0.33845794200897217, 0.3500927686691284, 0.36172759532928467, 0.3733624219894409, 0.38499724864959717]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 15.0, 33.0, 35.0, 57.0, 101.0, 136.0, 191.0, 276.0, 404.0, 659.0, 1021.0, 1506.0, 2178.0, 3259.0, 4889.0, 7498.0, 11199.0, 17090.0, 26896.0, 45161.0, 85018.0, 187736.0, 288263.0, 170193.0, 78764.0, 42318.0, 25618.0, 16151.0, 10596.0, 7196.0, 4762.0, 3151.0, 2044.0, 1364.0, 943.0, 609.0, 388.0, 285.0, 162.0, 113.0, 96.0, 49.0, 34.0, 27.0, 18.0, 11.0, 12.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.0821533203125, -0.0796966552734375, -0.077239990234375, -0.0747833251953125, -0.07232666015625, -0.0698699951171875, -0.067413330078125, -0.0649566650390625, -0.0625, -0.0600433349609375, -0.057586669921875, -0.0551300048828125, -0.05267333984375, -0.0502166748046875, -0.047760009765625, -0.0453033447265625, -0.0428466796875, -0.0403900146484375, -0.037933349609375, -0.0354766845703125, -0.03302001953125, -0.0305633544921875, -0.028106689453125, -0.0256500244140625, -0.023193359375, -0.0207366943359375, -0.018280029296875, -0.0158233642578125, -0.01336669921875, -0.0109100341796875, -0.008453369140625, -0.0059967041015625, -0.0035400390625, -0.0010833740234375, 0.001373291015625, 0.0038299560546875, 0.00628662109375, 0.0087432861328125, 0.011199951171875, 0.0136566162109375, 0.01611328125, 0.0185699462890625, 0.021026611328125, 0.0234832763671875, 0.02593994140625, 0.0283966064453125, 0.030853271484375, 0.0333099365234375, 0.0357666015625, 0.0382232666015625, 0.040679931640625, 0.0431365966796875, 0.04559326171875, 0.0480499267578125, 0.050506591796875, 0.0529632568359375, 0.055419921875, 0.0578765869140625, 0.060333251953125, 0.0627899169921875, 0.06524658203125, 0.0677032470703125, 0.070159912109375, 0.0726165771484375, 0.0750732421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 12.0, 7.0, 13.0, 21.0, 20.0, 24.0, 28.0, 28.0, 27.0, 41.0, 34.0, 48.0, 40.0, 37.0, 50.0, 43.0, 54.0, 58.0, 55.0, 46.0, 35.0, 32.0, 42.0, 30.0, 21.0, 23.0, 21.0, 24.0, 10.0, 13.0, 11.0, 9.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07032394409179688, -0.06801605224609375, -0.06570816040039062, -0.0634002685546875, -0.061092376708984375, -0.05878448486328125, -0.056476593017578125, -0.054168701171875, -0.051860809326171875, -0.04955291748046875, -0.047245025634765625, -0.0449371337890625, -0.042629241943359375, -0.04032135009765625, -0.038013458251953125, -0.03570556640625, -0.033397674560546875, -0.03108978271484375, -0.028781890869140625, -0.0264739990234375, -0.024166107177734375, -0.02185821533203125, -0.019550323486328125, -0.017242431640625, -0.014934539794921875, -0.01262664794921875, -0.010318756103515625, -0.0080108642578125, -0.005702972412109375, -0.00339508056640625, -0.001087188720703125, 0.001220703125, 0.003528594970703125, 0.00583648681640625, 0.008144378662109375, 0.0104522705078125, 0.012760162353515625, 0.01506805419921875, 0.017375946044921875, 0.019683837890625, 0.021991729736328125, 0.02429962158203125, 0.026607513427734375, 0.0289154052734375, 0.031223297119140625, 0.03353118896484375, 0.035839080810546875, 0.03814697265625, 0.040454864501953125, 0.04276275634765625, 0.045070648193359375, 0.0473785400390625, 0.049686431884765625, 0.05199432373046875, 0.054302215576171875, 0.056610107421875, 0.058917999267578125, 0.06122589111328125, 0.06353378295898438, 0.0658416748046875, 0.06814956665039062, 0.07045745849609375, 0.07276535034179688, 0.0750732421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 12.0, 10.0, 15.0, 28.0, 41.0, 55.0, 105.0, 181.0, 355.0, 859.0, 2310.0, 6863.0, 19861.0, 60269.0, 267566.0, 524987.0, 113685.0, 33579.0, 11295.0, 3935.0, 1403.0, 501.0, 256.0, 135.0, 81.0, 43.0, 37.0, 21.0, 15.0, 11.0, 16.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.17000579833984375, -0.1639862060546875, -0.15796661376953125, -0.151947021484375, -0.14592742919921875, -0.1399078369140625, -0.13388824462890625, -0.12786865234375, -0.12184906005859375, -0.1158294677734375, -0.10980987548828125, -0.103790283203125, -0.09777069091796875, -0.0917510986328125, -0.08573150634765625, -0.0797119140625, -0.07369232177734375, -0.0676727294921875, -0.06165313720703125, -0.055633544921875, -0.04961395263671875, -0.0435943603515625, -0.03757476806640625, -0.03155517578125, -0.02553558349609375, -0.0195159912109375, -0.01349639892578125, -0.007476806640625, -0.00145721435546875, 0.0045623779296875, 0.01058197021484375, 0.0166015625, 0.02262115478515625, 0.0286407470703125, 0.03466033935546875, 0.040679931640625, 0.04669952392578125, 0.0527191162109375, 0.05873870849609375, 0.06475830078125, 0.07077789306640625, 0.0767974853515625, 0.08281707763671875, 0.088836669921875, 0.09485626220703125, 0.1008758544921875, 0.10689544677734375, 0.1129150390625, 0.11893463134765625, 0.1249542236328125, 0.13097381591796875, 0.136993408203125, 0.14301300048828125, 0.1490325927734375, 0.15505218505859375, 0.16107177734375, 0.16709136962890625, 0.1731109619140625, 0.17913055419921875, 0.185150146484375, 0.19116973876953125, 0.1971893310546875, 0.20320892333984375, 0.209228515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 5.0, 6.0, 14.0, 17.0, 18.0, 15.0, 19.0, 12.0, 25.0, 27.0, 31.0, 33.0, 32.0, 32.0, 41.0, 32.0, 33.0, 34.0, 31.0, 44.0, 45.0, 38.0, 44.0, 38.0, 30.0, 38.0, 34.0, 30.0, 29.0, 28.0, 21.0, 23.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.178955078125, -0.1733245849609375, -0.167694091796875, -0.1620635986328125, -0.15643310546875, -0.1508026123046875, -0.145172119140625, -0.1395416259765625, -0.1339111328125, -0.1282806396484375, -0.122650146484375, -0.1170196533203125, -0.11138916015625, -0.1057586669921875, -0.100128173828125, -0.0944976806640625, -0.0888671875, -0.0832366943359375, -0.077606201171875, -0.0719757080078125, -0.06634521484375, -0.0607147216796875, -0.055084228515625, -0.0494537353515625, -0.0438232421875, -0.0381927490234375, -0.032562255859375, -0.0269317626953125, -0.02130126953125, -0.0156707763671875, -0.010040283203125, -0.0044097900390625, 0.001220703125, 0.0068511962890625, 0.012481689453125, 0.0181121826171875, 0.02374267578125, 0.0293731689453125, 0.035003662109375, 0.0406341552734375, 0.0462646484375, 0.0518951416015625, 0.057525634765625, 0.0631561279296875, 0.06878662109375, 0.0744171142578125, 0.080047607421875, 0.0856781005859375, 0.09130859375, 0.0969390869140625, 0.102569580078125, 0.1082000732421875, 0.11383056640625, 0.1194610595703125, 0.125091552734375, 0.1307220458984375, 0.1363525390625, 0.1419830322265625, 0.147613525390625, 0.1532440185546875, 0.15887451171875, 0.1645050048828125, 0.170135498046875, 0.1757659912109375, 0.181396484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 8.0, 9.0, 27.0, 68.0, 107.0, 167.0, 316.0, 687.0, 1454.0, 3334.0, 7706.0, 17647.0, 43870.0, 111834.0, 339274.0, 337110.0, 110167.0, 43351.0, 17796.0, 7561.0, 3253.0, 1386.0, 700.0, 330.0, 189.0, 71.0, 50.0, 25.0, 25.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052764892578125, -0.05100584030151367, -0.049246788024902344, -0.047487735748291016, -0.04572868347167969, -0.04396963119506836, -0.04221057891845703, -0.0404515266418457, -0.038692474365234375, -0.03693342208862305, -0.03517436981201172, -0.03341531753540039, -0.03165626525878906, -0.029897212982177734, -0.028138160705566406, -0.026379108428955078, -0.02462005615234375, -0.022861003875732422, -0.021101951599121094, -0.019342899322509766, -0.017583847045898438, -0.01582479476928711, -0.014065742492675781, -0.012306690216064453, -0.010547637939453125, -0.008788585662841797, -0.007029533386230469, -0.005270481109619141, -0.0035114288330078125, -0.0017523765563964844, 6.67572021484375e-06, 0.0017657279968261719, 0.0035247802734375, 0.005283832550048828, 0.007042884826660156, 0.008801937103271484, 0.010560989379882812, 0.01232004165649414, 0.014079093933105469, 0.015838146209716797, 0.017597198486328125, 0.019356250762939453, 0.02111530303955078, 0.02287435531616211, 0.024633407592773438, 0.026392459869384766, 0.028151512145996094, 0.029910564422607422, 0.03166961669921875, 0.03342866897583008, 0.035187721252441406, 0.036946773529052734, 0.03870582580566406, 0.04046487808227539, 0.04222393035888672, 0.04398298263549805, 0.045742034912109375, 0.0475010871887207, 0.04926013946533203, 0.05101919174194336, 0.05277824401855469, 0.054537296295166016, 0.056296348571777344, 0.05805540084838867, 0.059814453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 11.0, 14.0, 24.0, 19.0, 32.0, 43.0, 63.0, 75.0, 71.0, 98.0, 114.0, 105.0, 81.0, 42.0, 49.0, 34.0, 32.0, 15.0, 10.0, 6.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.7228536307811737e-05, -1.6635283827781677e-05, -1.6042031347751617e-05, -1.5448778867721558e-05, -1.4855526387691498e-05, -1.4262273907661438e-05, -1.3669021427631378e-05, -1.3075768947601318e-05, -1.2482516467571259e-05, -1.1889263987541199e-05, -1.1296011507511139e-05, -1.0702759027481079e-05, -1.010950654745102e-05, -9.51625406742096e-06, -8.9230015873909e-06, -8.32974910736084e-06, -7.73649662733078e-06, -7.14324414730072e-06, -6.54999166727066e-06, -5.956739187240601e-06, -5.363486707210541e-06, -4.770234227180481e-06, -4.176981747150421e-06, -3.5837292671203613e-06, -2.9904767870903015e-06, -2.3972243070602417e-06, -1.8039718270301819e-06, -1.210719347000122e-06, -6.174668669700623e-07, -2.421438694000244e-08, 5.690380930900574e-07, 1.1622905731201172e-06, 1.755543053150177e-06, 2.348795533180237e-06, 2.9420480132102966e-06, 3.5353004932403564e-06, 4.128552973270416e-06, 4.721805453300476e-06, 5.315057933330536e-06, 5.908310413360596e-06, 6.5015628933906555e-06, 7.094815373420715e-06, 7.688067853450775e-06, 8.281320333480835e-06, 8.874572813510895e-06, 9.467825293540955e-06, 1.0061077773571014e-05, 1.0654330253601074e-05, 1.1247582733631134e-05, 1.1840835213661194e-05, 1.2434087693691254e-05, 1.3027340173721313e-05, 1.3620592653751373e-05, 1.4213845133781433e-05, 1.4807097613811493e-05, 1.5400350093841553e-05, 1.5993602573871613e-05, 1.6586855053901672e-05, 1.7180107533931732e-05, 1.7773360013961792e-05, 1.8366612493991852e-05, 1.895986497402191e-05, 1.955311745405197e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 15.0, 26.0, 47.0, 76.0, 184.0, 352.0, 990.0, 3382.0, 15860.0, 93057.0, 572780.0, 305128.0, 45157.0, 8448.0, 1920.0, 603.0, 250.0, 131.0, 72.0, 33.0, 14.0, 12.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10308837890625, -0.09962940216064453, -0.09617042541503906, -0.0927114486694336, -0.08925247192382812, -0.08579349517822266, -0.08233451843261719, -0.07887554168701172, -0.07541656494140625, -0.07195758819580078, -0.06849861145019531, -0.06503963470458984, -0.061580657958984375, -0.058121681213378906, -0.05466270446777344, -0.05120372772216797, -0.0477447509765625, -0.04428577423095703, -0.04082679748535156, -0.037367820739746094, -0.033908843994140625, -0.030449867248535156, -0.026990890502929688, -0.02353191375732422, -0.02007293701171875, -0.01661396026611328, -0.013154983520507812, -0.009696006774902344, -0.006237030029296875, -0.0027780532836914062, 0.0006809234619140625, 0.004139900207519531, 0.007598876953125, 0.011057853698730469, 0.014516830444335938, 0.017975807189941406, 0.021434783935546875, 0.024893760681152344, 0.028352737426757812, 0.03181171417236328, 0.03527069091796875, 0.03872966766357422, 0.04218864440917969, 0.045647621154785156, 0.049106597900390625, 0.052565574645996094, 0.05602455139160156, 0.05948352813720703, 0.0629425048828125, 0.06640148162841797, 0.06986045837402344, 0.0733194351196289, 0.07677841186523438, 0.08023738861083984, 0.08369636535644531, 0.08715534210205078, 0.09061431884765625, 0.09407329559326172, 0.09753227233886719, 0.10099124908447266, 0.10445022583007812, 0.1079092025756836, 0.11136817932128906, 0.11482715606689453, 0.1182861328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 5.0, 6.0, 7.0, 16.0, 14.0, 18.0, 28.0, 29.0, 32.0, 50.0, 73.0, 62.0, 84.0, 91.0, 93.0, 71.0, 58.0, 50.0, 27.0, 31.0, 26.0, 26.0, 18.0, 15.0, 15.0, 8.0, 12.0, 8.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058380126953125, -0.05678367614746094, -0.055187225341796875, -0.05359077453613281, -0.05199432373046875, -0.05039787292480469, -0.048801422119140625, -0.04720497131347656, -0.0456085205078125, -0.04401206970214844, -0.042415618896484375, -0.04081916809082031, -0.03922271728515625, -0.03762626647949219, -0.036029815673828125, -0.03443336486816406, -0.0328369140625, -0.031240463256835938, -0.029644012451171875, -0.028047561645507812, -0.02645111083984375, -0.024854660034179688, -0.023258209228515625, -0.021661758422851562, -0.0200653076171875, -0.018468856811523438, -0.016872406005859375, -0.015275955200195312, -0.01367950439453125, -0.012083053588867188, -0.010486602783203125, -0.008890151977539062, -0.007293701171875, -0.0056972503662109375, -0.004100799560546875, -0.0025043487548828125, -0.00090789794921875, 0.0006885528564453125, 0.002285003662109375, 0.0038814544677734375, 0.0054779052734375, 0.0070743560791015625, 0.008670806884765625, 0.010267257690429688, 0.01186370849609375, 0.013460159301757812, 0.015056610107421875, 0.016653060913085938, 0.01824951171875, 0.019845962524414062, 0.021442413330078125, 0.023038864135742188, 0.02463531494140625, 0.026231765747070312, 0.027828216552734375, 0.029424667358398438, 0.0310211181640625, 0.03261756896972656, 0.034214019775390625, 0.03581047058105469, 0.03740692138671875, 0.03900337219238281, 0.040599822998046875, 0.04219627380371094, 0.043792724609375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 39.0, 202.0, 424.0, 271.0, 48.0, 13.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2217077016830444, -1.1432862281799316, -1.0648647546768188, -0.9864432215690613, -0.9080216884613037, -0.8296002149581909, -0.7511787414550781, -0.6727572083473206, -0.5943357348442078, -0.515914261341095, -0.4374927282333374, -0.3590712547302246, -0.28064975142478943, -0.20222824811935425, -0.12380677461624146, -0.04538524150848389, 0.033036231994628906, 0.11145772784948349, 0.18987922370433807, 0.26830071210861206, 0.34672221541404724, 0.4251437187194824, 0.5035651922225952, 0.5819867253303528, 0.6604081988334656, 0.7388296723365784, 0.8172512054443359, 0.8956726789474487, 0.9740941524505615, 1.0525157451629639, 1.130937099456787, 1.2093586921691895, 1.2877800464630127, 1.3662015199661255, 1.4446229934692383, 1.5230445861816406, 1.6014660596847534, 1.6798875331878662, 1.758309006690979, 1.8367304801940918, 1.9151520729064941, 1.993573546409607, 2.0719950199127197, 2.150416612625122, 2.2288379669189453, 2.3072595596313477, 2.38568115234375, 2.4641025066375732, 2.5425238609313965, 2.620945453643799, 2.699366807937622, 2.7777884006500244, 2.8562097549438477, 2.93463134765625, 3.0130529403686523, 3.0914742946624756, 3.169895887374878, 3.2483174800872803, 3.3267388343811035, 3.405160427093506, 3.483581781387329, 3.5620033740997314, 3.6404247283935547, 3.718846321105957, 3.7972679138183594]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 15.0, 14.0, 8.0, 12.0, 10.0, 17.0, 30.0, 20.0, 26.0, 31.0, 44.0, 29.0, 34.0, 47.0, 47.0, 50.0, 50.0, 48.0, 42.0, 42.0, 46.0, 44.0, 33.0, 47.0, 26.0, 40.0, 23.0, 26.0, 21.0, 11.0, 12.0, 4.0, 9.0, 6.0, 5.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48663830757141113, -0.4705071449279785, -0.4543759524822235, -0.4382447898387909, -0.4221135973930359, -0.40598243474960327, -0.38985127210617065, -0.37372010946273804, -0.35758891701698303, -0.3414577543735504, -0.3253265619277954, -0.3091953992843628, -0.2930642366409302, -0.27693304419517517, -0.26080188155174255, -0.24467070400714874, -0.22853952646255493, -0.21240834891796112, -0.1962771713733673, -0.1801460087299347, -0.16401483118534088, -0.14788365364074707, -0.13175249099731445, -0.11562131345272064, -0.09949013590812683, -0.08335895836353302, -0.0672277882695198, -0.05109661445021629, -0.03496544063091278, -0.01883426308631897, -0.0027030929923057556, 0.013428077101707458, 0.029559195041656494, 0.04569036886096001, 0.06182154268026352, 0.07795271277427673, 0.09408389031887054, 0.11021506786346436, 0.12634623050689697, 0.14247740805149078, 0.1586085855960846, 0.1747397631406784, 0.19087094068527222, 0.20700210332870483, 0.22313328087329865, 0.23926445841789246, 0.2553956210613251, 0.2715268135070801, 0.2876579761505127, 0.3037891387939453, 0.3199203312397003, 0.33605149388313293, 0.35218268632888794, 0.36831384897232056, 0.3844450116157532, 0.4005761742591858, 0.4167073667049408, 0.4328385293483734, 0.4489697217941284, 0.46510088443756104, 0.48123204708099365, 0.49736323952674866, 0.5134944319725037, 0.5296255946159363, 0.5457567572593689]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 17.0, 21.0, 30.0, 31.0, 54.0, 110.0, 167.0, 291.0, 401.0, 694.0, 1183.0, 1990.0, 3392.0, 5904.0, 10205.0, 17766.0, 31877.0, 57207.0, 108609.0, 225366.0, 574937.0, 1476711.0, 996300.0, 352142.0, 152888.0, 78360.0, 42093.0, 23456.0, 13364.0, 7834.0, 4405.0, 2615.0, 1536.0, 839.0, 537.0, 333.0, 185.0, 128.0, 87.0, 53.0, 43.0, 34.0, 23.0, 21.0, 8.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.06052684783935547, -0.05849266052246094, -0.056458473205566406, -0.054424285888671875, -0.052390098571777344, -0.05035591125488281, -0.04832172393798828, -0.04628753662109375, -0.04425334930419922, -0.04221916198730469, -0.040184974670410156, -0.038150787353515625, -0.036116600036621094, -0.03408241271972656, -0.03204822540283203, -0.0300140380859375, -0.02797985076904297, -0.025945663452148438, -0.023911476135253906, -0.021877288818359375, -0.019843101501464844, -0.017808914184570312, -0.01577472686767578, -0.01374053955078125, -0.011706352233886719, -0.009672164916992188, -0.007637977600097656, -0.005603790283203125, -0.0035696029663085938, -0.0015354156494140625, 0.0004987716674804688, 0.002532958984375, 0.004567146301269531, 0.0066013336181640625, 0.008635520935058594, 0.010669708251953125, 0.012703895568847656, 0.014738082885742188, 0.01677227020263672, 0.01880645751953125, 0.02084064483642578, 0.022874832153320312, 0.024909019470214844, 0.026943206787109375, 0.028977394104003906, 0.031011581420898438, 0.03304576873779297, 0.0350799560546875, 0.03711414337158203, 0.03914833068847656, 0.041182518005371094, 0.043216705322265625, 0.045250892639160156, 0.04728507995605469, 0.04931926727294922, 0.05135345458984375, 0.05338764190673828, 0.05542182922363281, 0.057456016540527344, 0.059490203857421875, 0.061524391174316406, 0.06355857849121094, 0.06559276580810547, 0.067626953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 11.0, 3.0, 5.0, 7.0, 11.0, 12.0, 18.0, 12.0, 13.0, 17.0, 24.0, 26.0, 27.0, 25.0, 31.0, 28.0, 47.0, 38.0, 50.0, 36.0, 37.0, 39.0, 47.0, 46.0, 41.0, 31.0, 33.0, 32.0, 31.0, 35.0, 28.0, 27.0, 16.0, 23.0, 19.0, 13.0, 11.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06317138671875, -0.06129026412963867, -0.059409141540527344, -0.057528018951416016, -0.05564689636230469, -0.05376577377319336, -0.05188465118408203, -0.0500035285949707, -0.048122406005859375, -0.04624128341674805, -0.04436016082763672, -0.04247903823852539, -0.04059791564941406, -0.038716793060302734, -0.036835670471191406, -0.03495454788208008, -0.03307342529296875, -0.031192302703857422, -0.029311180114746094, -0.027430057525634766, -0.025548934936523438, -0.02366781234741211, -0.02178668975830078, -0.019905567169189453, -0.018024444580078125, -0.016143321990966797, -0.014262199401855469, -0.01238107681274414, -0.010499954223632812, -0.008618831634521484, -0.006737709045410156, -0.004856586456298828, -0.0029754638671875, -0.0010943412780761719, 0.0007867813110351562, 0.0026679039001464844, 0.0045490264892578125, 0.006430149078369141, 0.008311271667480469, 0.010192394256591797, 0.012073516845703125, 0.013954639434814453, 0.01583576202392578, 0.01771688461303711, 0.019598007202148438, 0.021479129791259766, 0.023360252380371094, 0.025241374969482422, 0.02712249755859375, 0.029003620147705078, 0.030884742736816406, 0.032765865325927734, 0.03464698791503906, 0.03652811050415039, 0.03840923309326172, 0.04029035568237305, 0.042171478271484375, 0.0440526008605957, 0.04593372344970703, 0.04781484603881836, 0.04969596862792969, 0.051577091217041016, 0.053458213806152344, 0.05533933639526367, 0.057220458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 14.0, 17.0, 10.0, 28.0, 59.0, 96.0, 130.0, 239.0, 443.0, 749.0, 1343.0, 2308.0, 4425.0, 8720.0, 17362.0, 36099.0, 74752.0, 168885.0, 437954.0, 1482179.0, 1292682.0, 380746.0, 150799.0, 68466.0, 32522.0, 16182.0, 8077.0, 4119.0, 2130.0, 1180.0, 635.0, 355.0, 216.0, 121.0, 84.0, 51.0, 30.0, 28.0, 10.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10089111328125, -0.09782791137695312, -0.09476470947265625, -0.09170150756835938, -0.0886383056640625, -0.08557510375976562, -0.08251190185546875, -0.07944869995117188, -0.076385498046875, -0.07332229614257812, -0.07025909423828125, -0.06719589233398438, -0.0641326904296875, -0.061069488525390625, -0.05800628662109375, -0.054943084716796875, -0.0518798828125, -0.048816680908203125, -0.04575347900390625, -0.042690277099609375, -0.0396270751953125, -0.036563873291015625, -0.03350067138671875, -0.030437469482421875, -0.027374267578125, -0.024311065673828125, -0.02124786376953125, -0.018184661865234375, -0.0151214599609375, -0.012058258056640625, -0.00899505615234375, -0.005931854248046875, -0.00286865234375, 0.000194549560546875, 0.00325775146484375, 0.006320953369140625, 0.0093841552734375, 0.012447357177734375, 0.01551055908203125, 0.018573760986328125, 0.021636962890625, 0.024700164794921875, 0.02776336669921875, 0.030826568603515625, 0.0338897705078125, 0.036952972412109375, 0.04001617431640625, 0.043079376220703125, 0.046142578125, 0.049205780029296875, 0.05226898193359375, 0.055332183837890625, 0.0583953857421875, 0.061458587646484375, 0.06452178955078125, 0.06758499145507812, 0.070648193359375, 0.07371139526367188, 0.07677459716796875, 0.07983779907226562, 0.0829010009765625, 0.08596420288085938, 0.08902740478515625, 0.09209060668945312, 0.09515380859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 15.0, 8.0, 25.0, 27.0, 38.0, 35.0, 48.0, 72.0, 97.0, 126.0, 170.0, 240.0, 351.0, 553.0, 572.0, 491.0, 306.0, 232.0, 144.0, 121.0, 82.0, 58.0, 57.0, 39.0, 35.0, 24.0, 19.0, 18.0, 10.0, 9.0, 8.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.13439655303955078, -0.13060951232910156, -0.12682247161865234, -0.12303543090820312, -0.1192483901977539, -0.11546134948730469, -0.11167430877685547, -0.10788726806640625, -0.10410022735595703, -0.10031318664550781, -0.0965261459350586, -0.09273910522460938, -0.08895206451416016, -0.08516502380371094, -0.08137798309326172, -0.0775909423828125, -0.07380390167236328, -0.07001686096191406, -0.06622982025146484, -0.062442779541015625, -0.058655738830566406, -0.05486869812011719, -0.05108165740966797, -0.04729461669921875, -0.04350757598876953, -0.03972053527832031, -0.035933494567871094, -0.032146453857421875, -0.028359413146972656, -0.024572372436523438, -0.02078533172607422, -0.016998291015625, -0.013211250305175781, -0.009424209594726562, -0.005637168884277344, -0.001850128173828125, 0.0019369125366210938, 0.0057239532470703125, 0.009510993957519531, 0.01329803466796875, 0.01708507537841797, 0.020872116088867188, 0.024659156799316406, 0.028446197509765625, 0.032233238220214844, 0.03602027893066406, 0.03980731964111328, 0.0435943603515625, 0.04738140106201172, 0.05116844177246094, 0.054955482482910156, 0.058742523193359375, 0.0625295639038086, 0.06631660461425781, 0.07010364532470703, 0.07389068603515625, 0.07767772674560547, 0.08146476745605469, 0.0852518081665039, 0.08903884887695312, 0.09282588958740234, 0.09661293029785156, 0.10039997100830078, 0.10418701171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 26.0, 47.0, 48.0, 68.0, 75.0, 92.0, 95.0, 84.0, 92.0, 101.0, 81.0, 55.0, 36.0, 29.0, 13.0, 19.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8095172643661499, -0.7883503437042236, -0.7671834826469421, -0.7460165619850159, -0.7248496413230896, -0.7036827802658081, -0.6825158596038818, -0.6613489389419556, -0.6401820182800293, -0.619015097618103, -0.5978482365608215, -0.5766813158988953, -0.555514395236969, -0.5343475341796875, -0.5131806135177612, -0.49201369285583496, -0.47084683179855347, -0.4496799409389496, -0.4285130202770233, -0.40734612941741943, -0.38617920875549316, -0.3650123178958893, -0.3438454270362854, -0.32267850637435913, -0.30151161551475525, -0.28034472465515137, -0.2591778039932251, -0.23801091313362122, -0.21684400737285614, -0.19567710161209106, -0.17451021075248718, -0.1533433049917221, -0.13217639923095703, -0.11100949347019196, -0.08984259516000748, -0.068675696849823, -0.04750879108905792, -0.026341885328292847, -0.005174994468688965, 0.01599191129207611, 0.037158817052841187, 0.058325719088315964, 0.07949262112379074, 0.10065951943397522, 0.1218264251947403, 0.14299333095550537, 0.16416022181510925, 0.18532712757587433, 0.2064940333366394, 0.22766093909740448, 0.24882784485816956, 0.26999473571777344, 0.2911616563796997, 0.3123285472393036, 0.33349543809890747, 0.35466235876083374, 0.3758292496204376, 0.3969961404800415, 0.4181630611419678, 0.43932995200157166, 0.46049684286117554, 0.4816637635231018, 0.5028306245803833, 0.5239975452423096, 0.5451644659042358]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 12.0, 9.0, 15.0, 16.0, 18.0, 15.0, 20.0, 26.0, 30.0, 37.0, 39.0, 35.0, 47.0, 39.0, 47.0, 44.0, 37.0, 46.0, 45.0, 35.0, 42.0, 37.0, 32.0, 44.0, 31.0, 29.0, 30.0, 31.0, 14.0, 14.0, 16.0, 16.0, 9.0, 7.0, 7.0, 10.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4762831926345825, -0.463061660528183, -0.44984012842178345, -0.4366185963153839, -0.4233970642089844, -0.41017553210258484, -0.3969539999961853, -0.38373246788978577, -0.37051093578338623, -0.3572894036769867, -0.34406787157058716, -0.3308463394641876, -0.3176248073577881, -0.30440327525138855, -0.291181743144989, -0.2779602110385895, -0.26473867893218994, -0.2515171468257904, -0.23829561471939087, -0.22507408261299133, -0.2118525505065918, -0.19863101840019226, -0.18540948629379272, -0.1721879541873932, -0.15896639227867126, -0.14574486017227173, -0.1325233280658722, -0.11930179595947266, -0.10608026385307312, -0.09285872429609299, -0.07963719218969345, -0.06641566008329391, -0.053194135427474976, -0.03997260332107544, -0.026751069352030754, -0.013529535382986069, -0.0003080032765865326, 0.012913532555103302, 0.026135064661502838, 0.039356596767902374, 0.05257812887430191, 0.06579966098070145, 0.07902119308710098, 0.09224273264408112, 0.10546426475048065, 0.11868579685688019, 0.13190732896327972, 0.14512886106967926, 0.1583503931760788, 0.17157192528247833, 0.18479345738887787, 0.1980149894952774, 0.21123652160167694, 0.22445806860923767, 0.2376796007156372, 0.25090113282203674, 0.2641226649284363, 0.2773441970348358, 0.29056572914123535, 0.3037872612476349, 0.3170087933540344, 0.33023032546043396, 0.3434518575668335, 0.35667338967323303, 0.36989492177963257]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 19.0, 17.0, 29.0, 49.0, 74.0, 104.0, 146.0, 265.0, 434.0, 601.0, 1003.0, 1514.0, 2307.0, 3677.0, 5537.0, 8890.0, 14854.0, 28469.0, 61712.0, 153084.0, 309788.0, 251593.0, 105712.0, 44535.0, 21501.0, 12223.0, 7245.0, 4594.0, 3042.0, 1981.0, 1304.0, 797.0, 506.0, 341.0, 222.0, 132.0, 97.0, 43.0, 36.0, 22.0, 16.0, 9.0, 7.0, 1.0, 6.0, 3.0, 0.0, 3.0], "bins": [-0.0985107421875, -0.09583377838134766, -0.09315681457519531, -0.09047985076904297, -0.08780288696289062, -0.08512592315673828, -0.08244895935058594, -0.0797719955444336, -0.07709503173828125, -0.0744180679321289, -0.07174110412597656, -0.06906414031982422, -0.06638717651367188, -0.06371021270751953, -0.06103324890136719, -0.058356285095214844, -0.0556793212890625, -0.053002357482910156, -0.05032539367675781, -0.04764842987060547, -0.044971466064453125, -0.04229450225830078, -0.03961753845214844, -0.036940574645996094, -0.03426361083984375, -0.031586647033691406, -0.028909683227539062, -0.02623271942138672, -0.023555755615234375, -0.02087879180908203, -0.018201828002929688, -0.015524864196777344, -0.012847900390625, -0.010170936584472656, -0.0074939727783203125, -0.004817008972167969, -0.002140045166015625, 0.0005369186401367188, 0.0032138824462890625, 0.005890846252441406, 0.00856781005859375, 0.011244773864746094, 0.013921737670898438, 0.01659870147705078, 0.019275665283203125, 0.02195262908935547, 0.024629592895507812, 0.027306556701660156, 0.0299835205078125, 0.032660484313964844, 0.03533744812011719, 0.03801441192626953, 0.040691375732421875, 0.04336833953857422, 0.04604530334472656, 0.048722267150878906, 0.05139923095703125, 0.054076194763183594, 0.05675315856933594, 0.05943012237548828, 0.062107086181640625, 0.06478404998779297, 0.06746101379394531, 0.07013797760009766, 0.07281494140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 11.0, 7.0, 9.0, 15.0, 13.0, 14.0, 21.0, 21.0, 30.0, 30.0, 25.0, 27.0, 34.0, 26.0, 38.0, 38.0, 42.0, 45.0, 33.0, 28.0, 35.0, 43.0, 47.0, 38.0, 33.0, 31.0, 30.0, 24.0, 19.0, 27.0, 24.0, 21.0, 16.0, 12.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 11.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.05726814270019531, -0.055423736572265625, -0.05357933044433594, -0.05173492431640625, -0.04989051818847656, -0.048046112060546875, -0.04620170593261719, -0.0443572998046875, -0.04251289367675781, -0.040668487548828125, -0.03882408142089844, -0.03697967529296875, -0.03513526916503906, -0.033290863037109375, -0.03144645690917969, -0.02960205078125, -0.027757644653320312, -0.025913238525390625, -0.024068832397460938, -0.02222442626953125, -0.020380020141601562, -0.018535614013671875, -0.016691207885742188, -0.0148468017578125, -0.013002395629882812, -0.011157989501953125, -0.009313583374023438, -0.00746917724609375, -0.0056247711181640625, -0.003780364990234375, -0.0019359588623046875, -9.1552734375e-05, 0.0017528533935546875, 0.003597259521484375, 0.0054416656494140625, 0.00728607177734375, 0.009130477905273438, 0.010974884033203125, 0.012819290161132812, 0.0146636962890625, 0.016508102416992188, 0.018352508544921875, 0.020196914672851562, 0.02204132080078125, 0.023885726928710938, 0.025730133056640625, 0.027574539184570312, 0.0294189453125, 0.03126335144042969, 0.033107757568359375, 0.03495216369628906, 0.03679656982421875, 0.03864097595214844, 0.040485382080078125, 0.04232978820800781, 0.0441741943359375, 0.04601860046386719, 0.047863006591796875, 0.04970741271972656, 0.05155181884765625, 0.05339622497558594, 0.055240631103515625, 0.05708503723144531, 0.058929443359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 6.0, 9.0, 17.0, 18.0, 21.0, 33.0, 34.0, 52.0, 83.0, 109.0, 216.0, 348.0, 604.0, 1192.0, 2529.0, 5561.0, 12320.0, 30000.0, 84748.0, 275409.0, 403617.0, 148902.0, 48660.0, 18736.0, 7972.0, 3731.0, 1605.0, 817.0, 440.0, 266.0, 146.0, 95.0, 57.0, 47.0, 35.0, 26.0, 24.0, 19.0, 9.0, 13.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.125732421875, -0.12170791625976562, -0.11768341064453125, -0.11365890502929688, -0.1096343994140625, -0.10560989379882812, -0.10158538818359375, -0.09756088256835938, -0.093536376953125, -0.08951187133789062, -0.08548736572265625, -0.08146286010742188, -0.0774383544921875, -0.07341384887695312, -0.06938934326171875, -0.06536483764648438, -0.06134033203125, -0.057315826416015625, -0.05329132080078125, -0.049266815185546875, -0.0452423095703125, -0.041217803955078125, -0.03719329833984375, -0.033168792724609375, -0.029144287109375, -0.025119781494140625, -0.02109527587890625, -0.017070770263671875, -0.0130462646484375, -0.009021759033203125, -0.00499725341796875, -0.000972747802734375, 0.0030517578125, 0.007076263427734375, 0.01110076904296875, 0.015125274658203125, 0.0191497802734375, 0.023174285888671875, 0.02719879150390625, 0.031223297119140625, 0.035247802734375, 0.039272308349609375, 0.04329681396484375, 0.047321319580078125, 0.0513458251953125, 0.055370330810546875, 0.05939483642578125, 0.06341934204101562, 0.06744384765625, 0.07146835327148438, 0.07549285888671875, 0.07951736450195312, 0.0835418701171875, 0.08756637573242188, 0.09159088134765625, 0.09561538696289062, 0.099639892578125, 0.10366439819335938, 0.10768890380859375, 0.11171340942382812, 0.1157379150390625, 0.11976242065429688, 0.12378692626953125, 0.12781143188476562, 0.1318359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 6.0, 8.0, 10.0, 13.0, 15.0, 14.0, 16.0, 17.0, 26.0, 34.0, 33.0, 38.0, 34.0, 33.0, 35.0, 46.0, 32.0, 43.0, 46.0, 53.0, 47.0, 51.0, 36.0, 37.0, 32.0, 34.0, 33.0, 36.0, 21.0, 22.0, 21.0, 3.0, 18.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.2298583984375, -0.22360801696777344, -0.21735763549804688, -0.2111072540283203, -0.20485687255859375, -0.1986064910888672, -0.19235610961914062, -0.18610572814941406, -0.1798553466796875, -0.17360496520996094, -0.16735458374023438, -0.1611042022705078, -0.15485382080078125, -0.1486034393310547, -0.14235305786132812, -0.13610267639160156, -0.129852294921875, -0.12360191345214844, -0.11735153198242188, -0.11110115051269531, -0.10485076904296875, -0.09860038757324219, -0.09235000610351562, -0.08609962463378906, -0.0798492431640625, -0.07359886169433594, -0.06734848022460938, -0.06109809875488281, -0.05484771728515625, -0.04859733581542969, -0.042346954345703125, -0.03609657287597656, -0.02984619140625, -0.023595809936523438, -0.017345428466796875, -0.011095046997070312, -0.00484466552734375, 0.0014057159423828125, 0.007656097412109375, 0.013906478881835938, 0.0201568603515625, 0.026407241821289062, 0.032657623291015625, 0.03890800476074219, 0.04515838623046875, 0.05140876770019531, 0.057659149169921875, 0.06390953063964844, 0.070159912109375, 0.07641029357910156, 0.08266067504882812, 0.08891105651855469, 0.09516143798828125, 0.10141181945800781, 0.10766220092773438, 0.11391258239746094, 0.1201629638671875, 0.12641334533691406, 0.13266372680664062, 0.1389141082763672, 0.14516448974609375, 0.1514148712158203, 0.15766525268554688, 0.16391563415527344, 0.170166015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 9.0, 11.0, 15.0, 33.0, 60.0, 130.0, 425.0, 1312.0, 4810.0, 15647.0, 54053.0, 241431.0, 533636.0, 145200.0, 36487.0, 10754.0, 3091.0, 940.0, 270.0, 125.0, 46.0, 29.0, 17.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0697021484375, -0.0671529769897461, -0.06460380554199219, -0.06205463409423828, -0.059505462646484375, -0.05695629119873047, -0.05440711975097656, -0.051857948303222656, -0.04930877685546875, -0.046759605407714844, -0.04421043395996094, -0.04166126251220703, -0.039112091064453125, -0.03656291961669922, -0.03401374816894531, -0.031464576721191406, -0.0289154052734375, -0.026366233825683594, -0.023817062377929688, -0.02126789093017578, -0.018718719482421875, -0.01616954803466797, -0.013620376586914062, -0.011071205139160156, -0.00852203369140625, -0.005972862243652344, -0.0034236907958984375, -0.0008745193481445312, 0.001674652099609375, 0.004223823547363281, 0.0067729949951171875, 0.009322166442871094, 0.011871337890625, 0.014420509338378906, 0.016969680786132812, 0.01951885223388672, 0.022068023681640625, 0.02461719512939453, 0.027166366577148438, 0.029715538024902344, 0.03226470947265625, 0.034813880920410156, 0.03736305236816406, 0.03991222381591797, 0.042461395263671875, 0.04501056671142578, 0.04755973815917969, 0.050108909606933594, 0.0526580810546875, 0.055207252502441406, 0.05775642395019531, 0.06030559539794922, 0.06285476684570312, 0.06540393829345703, 0.06795310974121094, 0.07050228118896484, 0.07305145263671875, 0.07560062408447266, 0.07814979553222656, 0.08069896697998047, 0.08324813842773438, 0.08579730987548828, 0.08834648132324219, 0.0908956527709961, 0.09344482421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 9.0, 24.0, 32.0, 30.0, 39.0, 72.0, 73.0, 78.0, 100.0, 95.0, 83.0, 73.0, 73.0, 61.0, 24.0, 30.0, 15.0, 11.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, -1.5541911125183105e-05, -1.4990568161010742e-05, -1.4439225196838379e-05, -1.3887882232666016e-05, -1.3336539268493652e-05, -1.2785196304321289e-05, -1.2233853340148926e-05, -1.1682510375976562e-05, -1.11311674118042e-05, -1.0579824447631836e-05, -1.0028481483459473e-05, -9.47713851928711e-06, -8.925795555114746e-06, -8.374452590942383e-06, -7.82310962677002e-06, -7.271766662597656e-06, -6.720423698425293e-06, -6.16908073425293e-06, -5.617737770080566e-06, -5.066394805908203e-06, -4.51505184173584e-06, -3.9637088775634766e-06, -3.4123659133911133e-06, -2.86102294921875e-06, -2.3096799850463867e-06, -1.7583370208740234e-06, -1.2069940567016602e-06, -6.556510925292969e-07, -1.043081283569336e-07, 4.470348358154297e-07, 9.98377799987793e-07, 1.5497207641601562e-06, 2.1010637283325195e-06, 2.652406692504883e-06, 3.203749656677246e-06, 3.7550926208496094e-06, 4.306435585021973e-06, 4.857778549194336e-06, 5.409121513366699e-06, 5.9604644775390625e-06, 6.511807441711426e-06, 7.063150405883789e-06, 7.614493370056152e-06, 8.165836334228516e-06, 8.717179298400879e-06, 9.268522262573242e-06, 9.819865226745605e-06, 1.0371208190917969e-05, 1.0922551155090332e-05, 1.1473894119262695e-05, 1.2025237083435059e-05, 1.2576580047607422e-05, 1.3127923011779785e-05, 1.3679265975952148e-05, 1.4230608940124512e-05, 1.4781951904296875e-05, 1.5333294868469238e-05, 1.58846378326416e-05, 1.6435980796813965e-05, 1.6987323760986328e-05, 1.753866672515869e-05, 1.8090009689331055e-05, 1.8641352653503418e-05, 1.919269561767578e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 13.0, 10.0, 13.0, 14.0, 35.0, 41.0, 60.0, 108.0, 132.0, 222.0, 367.0, 687.0, 1286.0, 2522.0, 5207.0, 11319.0, 24828.0, 58599.0, 142623.0, 304341.0, 280171.0, 123483.0, 50660.0, 22362.0, 9830.0, 4632.0, 2286.0, 1183.0, 584.0, 380.0, 180.0, 108.0, 85.0, 55.0, 30.0, 26.0, 19.0, 17.0, 11.0, 2.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.048248291015625, -0.046736717224121094, -0.04522514343261719, -0.04371356964111328, -0.042201995849609375, -0.04069042205810547, -0.03917884826660156, -0.037667274475097656, -0.03615570068359375, -0.034644126892089844, -0.03313255310058594, -0.03162097930908203, -0.030109405517578125, -0.02859783172607422, -0.027086257934570312, -0.025574684143066406, -0.0240631103515625, -0.022551536560058594, -0.021039962768554688, -0.01952838897705078, -0.018016815185546875, -0.01650524139404297, -0.014993667602539062, -0.013482093811035156, -0.01197052001953125, -0.010458946228027344, -0.008947372436523438, -0.007435798645019531, -0.005924224853515625, -0.004412651062011719, -0.0029010772705078125, -0.0013895034790039062, 0.0001220703125, 0.0016336441040039062, 0.0031452178955078125, 0.004656791687011719, 0.006168365478515625, 0.007679939270019531, 0.009191513061523438, 0.010703086853027344, 0.01221466064453125, 0.013726234436035156, 0.015237808227539062, 0.01674938201904297, 0.018260955810546875, 0.01977252960205078, 0.021284103393554688, 0.022795677185058594, 0.0243072509765625, 0.025818824768066406, 0.027330398559570312, 0.02884197235107422, 0.030353546142578125, 0.03186511993408203, 0.03337669372558594, 0.034888267517089844, 0.03639984130859375, 0.037911415100097656, 0.03942298889160156, 0.04093456268310547, 0.042446136474609375, 0.04395771026611328, 0.04546928405761719, 0.046980857849121094, 0.048492431640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 5.0, 10.0, 7.0, 17.0, 9.0, 13.0, 11.0, 24.0, 23.0, 39.0, 44.0, 49.0, 52.0, 63.0, 64.0, 75.0, 76.0, 70.0, 58.0, 52.0, 38.0, 37.0, 30.0, 21.0, 23.0, 15.0, 15.0, 13.0, 12.0, 6.0, 6.0, 2.0, 7.0, 1.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04058837890625, -0.038956642150878906, -0.03732490539550781, -0.03569316864013672, -0.034061431884765625, -0.03242969512939453, -0.030797958374023438, -0.029166221618652344, -0.02753448486328125, -0.025902748107910156, -0.024271011352539062, -0.02263927459716797, -0.021007537841796875, -0.01937580108642578, -0.017744064331054688, -0.016112327575683594, -0.0144805908203125, -0.012848854064941406, -0.011217117309570312, -0.009585380554199219, -0.007953643798828125, -0.006321907043457031, -0.0046901702880859375, -0.0030584335327148438, -0.00142669677734375, 0.00020503997802734375, 0.0018367767333984375, 0.0034685134887695312, 0.005100250244140625, 0.006731986999511719, 0.008363723754882812, 0.009995460510253906, 0.011627197265625, 0.013258934020996094, 0.014890670776367188, 0.01652240753173828, 0.018154144287109375, 0.01978588104248047, 0.021417617797851562, 0.023049354553222656, 0.02468109130859375, 0.026312828063964844, 0.027944564819335938, 0.02957630157470703, 0.031208038330078125, 0.03283977508544922, 0.03447151184082031, 0.036103248596191406, 0.0377349853515625, 0.039366722106933594, 0.04099845886230469, 0.04263019561767578, 0.044261932373046875, 0.04589366912841797, 0.04752540588378906, 0.049157142639160156, 0.05078887939453125, 0.052420616149902344, 0.05405235290527344, 0.05568408966064453, 0.057315826416015625, 0.05894756317138672, 0.06057929992675781, 0.062211036682128906, 0.0638427734375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 13.0, 37.0, 88.0, 133.0, 166.0, 197.0, 169.0, 89.0, 52.0, 31.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7692256569862366, -0.7388582229614258, -0.708490788936615, -0.6781233549118042, -0.6477559804916382, -0.6173884868621826, -0.5870211124420166, -0.5566536784172058, -0.526286244392395, -0.49591881036758423, -0.46555137634277344, -0.43518397212028503, -0.40481653809547424, -0.37444910407066345, -0.34408169984817505, -0.31371426582336426, -0.28334683179855347, -0.2529793977737427, -0.22261197865009308, -0.19224455952644348, -0.1618771255016327, -0.1315096914768219, -0.1011422723531723, -0.0707748532295227, -0.040407419204711914, -0.01003999263048172, 0.020327433943748474, 0.05069486051797867, 0.08106228709220886, 0.11142972111701965, 0.14179714024066925, 0.17216455936431885, 0.20253205299377441, 0.2328994870185852, 0.263266921043396, 0.2936343252658844, 0.3240017592906952, 0.354369193315506, 0.3847365975379944, 0.4151040315628052, 0.44547146558761597, 0.47583889961242676, 0.5062063336372375, 0.5365737676620483, 0.5669411420822144, 0.5973086357116699, 0.6276760101318359, 0.6580434441566467, 0.6884108781814575, 0.7187783122062683, 0.7491457462310791, 0.7795131802558899, 0.8098806142807007, 0.8402479887008667, 0.8706154227256775, 0.9009828567504883, 0.9313502907752991, 0.9617177248001099, 0.9920851588249207, 1.0224525928497314, 1.0528199672698975, 1.083187460899353, 1.113554835319519, 1.1439223289489746, 1.1742897033691406]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 11.0, 9.0, 19.0, 18.0, 14.0, 19.0, 27.0, 24.0, 34.0, 22.0, 27.0, 29.0, 26.0, 30.0, 25.0, 51.0, 55.0, 36.0, 43.0, 43.0, 43.0, 32.0, 43.0, 39.0, 20.0, 29.0, 31.0, 20.0, 17.0, 28.0, 11.0, 17.0, 13.0, 13.0, 8.0, 10.0, 6.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.4376823902130127, -0.4242086708545685, -0.41073498129844666, -0.39726126194000244, -0.3837875425815582, -0.370313823223114, -0.3568401336669922, -0.343366414308548, -0.32989269495010376, -0.31641897559165955, -0.3029452860355377, -0.2894715666770935, -0.2759978473186493, -0.2625241279602051, -0.24905043840408325, -0.23557671904563904, -0.22210301458835602, -0.208629310131073, -0.19515559077262878, -0.18168188631534576, -0.16820816695690155, -0.15473446249961853, -0.14126074314117432, -0.1277870386838913, -0.11431332677602768, -0.10083961486816406, -0.08736590296030045, -0.07389219105243683, -0.06041848286986351, -0.04694477468729019, -0.033471062779426575, -0.019997350871562958, -0.006523638963699341, 0.0069500720128417015, 0.020423782989382744, 0.03389749303460121, 0.04737120494246483, 0.06084491312503815, 0.07431862503290176, 0.08779233694076538, 0.101266048848629, 0.11473976075649261, 0.12821346521377563, 0.14168718457221985, 0.15516088902950287, 0.1686345934867859, 0.1821083128452301, 0.19558203220367432, 0.20905573666095734, 0.22252944111824036, 0.23600316047668457, 0.2494768649339676, 0.2629505693912506, 0.2764242887496948, 0.28989800810813904, 0.30337172746658325, 0.3168454170227051, 0.3303191363811493, 0.3437928259372711, 0.35726654529571533, 0.37074026465415955, 0.38421398401260376, 0.3976876735687256, 0.4111613929271698, 0.424635112285614]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 11.0, 18.0, 20.0, 29.0, 48.0, 57.0, 90.0, 160.0, 301.0, 498.0, 926.0, 1814.0, 3586.0, 7394.0, 15461.0, 33440.0, 74647.0, 174964.0, 479842.0, 1390819.0, 1296196.0, 427737.0, 158337.0, 67796.0, 31336.0, 14516.0, 6837.0, 3440.0, 1786.0, 908.0, 493.0, 298.0, 160.0, 106.0, 69.0, 34.0, 22.0, 22.0, 16.0, 15.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07769775390625, -0.07501411437988281, -0.07233047485351562, -0.06964683532714844, -0.06696319580078125, -0.06427955627441406, -0.061595916748046875, -0.05891227722167969, -0.0562286376953125, -0.05354499816894531, -0.050861358642578125, -0.04817771911621094, -0.04549407958984375, -0.04281044006347656, -0.040126800537109375, -0.03744316101074219, -0.034759521484375, -0.03207588195800781, -0.029392242431640625, -0.026708602905273438, -0.02402496337890625, -0.021341323852539062, -0.018657684326171875, -0.015974044799804688, -0.0132904052734375, -0.010606765747070312, -0.007923126220703125, -0.0052394866943359375, -0.00255584716796875, 0.0001277923583984375, 0.002811431884765625, 0.0054950714111328125, 0.0081787109375, 0.010862350463867188, 0.013545989990234375, 0.016229629516601562, 0.01891326904296875, 0.021596908569335938, 0.024280548095703125, 0.026964187622070312, 0.0296478271484375, 0.03233146667480469, 0.035015106201171875, 0.03769874572753906, 0.04038238525390625, 0.04306602478027344, 0.045749664306640625, 0.04843330383300781, 0.051116943359375, 0.05380058288574219, 0.056484222412109375, 0.05916786193847656, 0.06185150146484375, 0.06453514099121094, 0.06721878051757812, 0.06990242004394531, 0.0725860595703125, 0.07526969909667969, 0.07795333862304688, 0.08063697814941406, 0.08332061767578125, 0.08600425720214844, 0.08868789672851562, 0.09137153625488281, 0.09405517578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 14.0, 15.0, 11.0, 26.0, 21.0, 32.0, 24.0, 42.0, 28.0, 31.0, 23.0, 46.0, 41.0, 51.0, 49.0, 42.0, 39.0, 43.0, 28.0, 30.0, 34.0, 38.0, 30.0, 29.0, 27.0, 27.0, 21.0, 22.0, 18.0, 18.0, 3.0, 12.0, 12.0, 6.0, 5.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06451416015625, -0.06258296966552734, -0.06065177917480469, -0.05872058868408203, -0.056789398193359375, -0.05485820770263672, -0.05292701721191406, -0.050995826721191406, -0.04906463623046875, -0.047133445739746094, -0.04520225524902344, -0.04327106475830078, -0.041339874267578125, -0.03940868377685547, -0.03747749328613281, -0.035546302795410156, -0.0336151123046875, -0.031683921813964844, -0.029752731323242188, -0.02782154083251953, -0.025890350341796875, -0.02395915985107422, -0.022027969360351562, -0.020096778869628906, -0.01816558837890625, -0.016234397888183594, -0.014303207397460938, -0.012372016906738281, -0.010440826416015625, -0.008509635925292969, -0.0065784454345703125, -0.004647254943847656, -0.002716064453125, -0.0007848739624023438, 0.0011463165283203125, 0.0030775070190429688, 0.005008697509765625, 0.006939888000488281, 0.008871078491210938, 0.010802268981933594, 0.01273345947265625, 0.014664649963378906, 0.016595840454101562, 0.01852703094482422, 0.020458221435546875, 0.02238941192626953, 0.024320602416992188, 0.026251792907714844, 0.0281829833984375, 0.030114173889160156, 0.03204536437988281, 0.03397655487060547, 0.035907745361328125, 0.03783893585205078, 0.03977012634277344, 0.041701316833496094, 0.04363250732421875, 0.045563697814941406, 0.04749488830566406, 0.04942607879638672, 0.051357269287109375, 0.05328845977783203, 0.05521965026855469, 0.057150840759277344, 0.05908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 13.0, 22.0, 43.0, 53.0, 104.0, 140.0, 290.0, 466.0, 867.0, 1680.0, 2998.0, 6077.0, 12265.0, 24470.0, 49708.0, 106767.0, 241818.0, 655306.0, 1652122.0, 884365.0, 305739.0, 130285.0, 60485.0, 28871.0, 14171.0, 7296.0, 3662.0, 1855.0, 980.0, 573.0, 294.0, 194.0, 109.0, 71.0, 40.0, 28.0, 19.0, 12.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0953369140625, -0.09266090393066406, -0.08998489379882812, -0.08730888366699219, -0.08463287353515625, -0.08195686340332031, -0.07928085327148438, -0.07660484313964844, -0.0739288330078125, -0.07125282287597656, -0.06857681274414062, -0.06590080261230469, -0.06322479248046875, -0.06054878234863281, -0.057872772216796875, -0.05519676208496094, -0.052520751953125, -0.04984474182128906, -0.047168731689453125, -0.04449272155761719, -0.04181671142578125, -0.03914070129394531, -0.036464691162109375, -0.03378868103027344, -0.0311126708984375, -0.028436660766601562, -0.025760650634765625, -0.023084640502929688, -0.02040863037109375, -0.017732620239257812, -0.015056610107421875, -0.012380599975585938, -0.00970458984375, -0.0070285797119140625, -0.004352569580078125, -0.0016765594482421875, 0.00099945068359375, 0.0036754608154296875, 0.006351470947265625, 0.009027481079101562, 0.0117034912109375, 0.014379501342773438, 0.017055511474609375, 0.019731521606445312, 0.02240753173828125, 0.025083541870117188, 0.027759552001953125, 0.030435562133789062, 0.033111572265625, 0.03578758239746094, 0.038463592529296875, 0.04113960266113281, 0.04381561279296875, 0.04649162292480469, 0.049167633056640625, 0.05184364318847656, 0.0545196533203125, 0.05719566345214844, 0.059871673583984375, 0.06254768371582031, 0.06522369384765625, 0.06789970397949219, 0.07057571411132812, 0.07325172424316406, 0.075927734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 18.0, 18.0, 17.0, 29.0, 22.0, 48.0, 31.0, 66.0, 70.0, 100.0, 104.0, 185.0, 243.0, 311.0, 416.0, 509.0, 485.0, 355.0, 256.0, 173.0, 139.0, 100.0, 88.0, 60.0, 60.0, 35.0, 28.0, 26.0, 13.0, 18.0, 6.0, 7.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10858154296875, -0.10491275787353516, -0.10124397277832031, -0.09757518768310547, -0.09390640258789062, -0.09023761749267578, -0.08656883239746094, -0.0829000473022461, -0.07923126220703125, -0.0755624771118164, -0.07189369201660156, -0.06822490692138672, -0.06455612182617188, -0.06088733673095703, -0.05721855163574219, -0.053549766540527344, -0.0498809814453125, -0.046212196350097656, -0.04254341125488281, -0.03887462615966797, -0.035205841064453125, -0.03153705596923828, -0.027868270874023438, -0.024199485778808594, -0.02053070068359375, -0.016861915588378906, -0.013193130493164062, -0.009524345397949219, -0.005855560302734375, -0.0021867752075195312, 0.0014820098876953125, 0.005150794982910156, 0.008819580078125, 0.012488365173339844, 0.016157150268554688, 0.01982593536376953, 0.023494720458984375, 0.02716350555419922, 0.030832290649414062, 0.034501075744628906, 0.03816986083984375, 0.041838645935058594, 0.04550743103027344, 0.04917621612548828, 0.052845001220703125, 0.05651378631591797, 0.06018257141113281, 0.06385135650634766, 0.0675201416015625, 0.07118892669677734, 0.07485771179199219, 0.07852649688720703, 0.08219528198242188, 0.08586406707763672, 0.08953285217285156, 0.0932016372680664, 0.09687042236328125, 0.1005392074584961, 0.10420799255371094, 0.10787677764892578, 0.11154556274414062, 0.11521434783935547, 0.11888313293457031, 0.12255191802978516, 0.126220703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 8.0, 23.0, 30.0, 50.0, 50.0, 75.0, 97.0, 84.0, 98.0, 103.0, 90.0, 59.0, 67.0, 63.0, 36.0, 17.0, 7.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6537379026412964, -0.6325673460960388, -0.6113967895507812, -0.5902261734008789, -0.5690556168556213, -0.5478850603103638, -0.5267145037651062, -0.5055439472198486, -0.4843733608722687, -0.4632028043270111, -0.44203221797943115, -0.4208616614341736, -0.399691104888916, -0.37852051854133606, -0.3573499619960785, -0.33617937564849854, -0.31500881910324097, -0.2938382625579834, -0.27266767621040344, -0.2514971196651459, -0.2303265482187271, -0.20915597677230835, -0.18798542022705078, -0.16681484878063202, -0.14564427733421326, -0.1244737058877945, -0.10330314189195633, -0.08213257789611816, -0.0609620064496994, -0.03979143500328064, -0.01862087845802307, 0.002549692988395691, 0.023720204830169678, 0.04489077255129814, 0.0660613402724266, 0.08723190426826477, 0.10840247571468353, 0.1295730471611023, 0.15074360370635986, 0.17191417515277863, 0.1930847465991974, 0.21425531804561615, 0.2354258894920349, 0.2565964460372925, 0.27776700258255005, 0.29893758893013, 0.3201081454753876, 0.34127873182296753, 0.3624492883682251, 0.38361984491348267, 0.4047904312610626, 0.4259609878063202, 0.44713157415390015, 0.4683021306991577, 0.4894726872444153, 0.5106432437896729, 0.5318138599395752, 0.5529844164848328, 0.5741549730300903, 0.5953255891799927, 0.6164961457252502, 0.6376667022705078, 0.6588372588157654, 0.680007815361023, 0.7011783719062805]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 7.0, 5.0, 23.0, 13.0, 13.0, 20.0, 25.0, 24.0, 24.0, 29.0, 35.0, 33.0, 35.0, 33.0, 34.0, 42.0, 43.0, 37.0, 42.0, 42.0, 35.0, 44.0, 40.0, 38.0, 39.0, 20.0, 32.0, 33.0, 17.0, 22.0, 22.0, 15.0, 9.0, 5.0, 13.0, 12.0, 7.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.3592570424079895, -0.34792518615722656, -0.3365933299064636, -0.3252614736557007, -0.31392964720726013, -0.3025977909564972, -0.29126593470573425, -0.2799340784549713, -0.26860225200653076, -0.2572703957557678, -0.24593855440616608, -0.23460669815540314, -0.2232748568058014, -0.21194300055503845, -0.2006111443042755, -0.18927928805351257, -0.17794743180274963, -0.1666155755519867, -0.15528373420238495, -0.143951877951622, -0.13262003660202026, -0.12128818035125732, -0.10995632410049438, -0.09862447530031204, -0.0872926265001297, -0.07596077769994736, -0.06462892889976501, -0.053297072649002075, -0.04196522384881973, -0.03063337504863739, -0.01930151879787445, -0.007969669997692108, 0.0033621788024902344, 0.014694029465317726, 0.026025880128145218, 0.03735773265361786, 0.0486895814538002, 0.060021430253982544, 0.07135328650474548, 0.08268513530492783, 0.09401698410511017, 0.10534883290529251, 0.11668068170547485, 0.1280125379562378, 0.13934439420700073, 0.15067623555660248, 0.16200809180736542, 0.17333993315696716, 0.1846717894077301, 0.19600364565849304, 0.2073354870080948, 0.21866734325885773, 0.22999918460845947, 0.2413310408592224, 0.25266289710998535, 0.2639947533607483, 0.27532660961151123, 0.28665846586227417, 0.2979903221130371, 0.30932217836380005, 0.3206540048122406, 0.33198586106300354, 0.3433177173137665, 0.3546495735645294, 0.36598140001296997]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 9.0, 9.0, 20.0, 34.0, 51.0, 74.0, 98.0, 166.0, 231.0, 302.0, 479.0, 667.0, 906.0, 1369.0, 1749.0, 2516.0, 3359.0, 4955.0, 6664.0, 9492.0, 14605.0, 23792.0, 46993.0, 123014.0, 306828.0, 282633.0, 107380.0, 42559.0, 22110.0, 13700.0, 9201.0, 6315.0, 4596.0, 3327.0, 2399.0, 1843.0, 1181.0, 905.0, 630.0, 444.0, 309.0, 210.0, 147.0, 116.0, 65.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08284950256347656, -0.07988357543945312, -0.07691764831542969, -0.07395172119140625, -0.07098579406738281, -0.06801986694335938, -0.06505393981933594, -0.0620880126953125, -0.05912208557128906, -0.056156158447265625, -0.05319023132324219, -0.05022430419921875, -0.04725837707519531, -0.044292449951171875, -0.04132652282714844, -0.038360595703125, -0.03539466857910156, -0.032428741455078125, -0.029462814331054688, -0.02649688720703125, -0.023530960083007812, -0.020565032958984375, -0.017599105834960938, -0.0146331787109375, -0.011667251586914062, -0.008701324462890625, -0.0057353973388671875, -0.00276947021484375, 0.0001964569091796875, 0.003162384033203125, 0.0061283111572265625, 0.00909423828125, 0.012060165405273438, 0.015026092529296875, 0.017992019653320312, 0.02095794677734375, 0.023923873901367188, 0.026889801025390625, 0.029855728149414062, 0.0328216552734375, 0.03578758239746094, 0.038753509521484375, 0.04171943664550781, 0.04468536376953125, 0.04765129089355469, 0.050617218017578125, 0.05358314514160156, 0.056549072265625, 0.05951499938964844, 0.062480926513671875, 0.06544685363769531, 0.06841278076171875, 0.07137870788574219, 0.07434463500976562, 0.07731056213378906, 0.0802764892578125, 0.08324241638183594, 0.08620834350585938, 0.08917427062988281, 0.09214019775390625, 0.09510612487792969, 0.09807205200195312, 0.10103797912597656, 0.10400390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 20.0, 19.0, 24.0, 37.0, 24.0, 25.0, 32.0, 28.0, 32.0, 38.0, 38.0, 42.0, 37.0, 48.0, 41.0, 38.0, 33.0, 42.0, 34.0, 30.0, 28.0, 31.0, 27.0, 24.0, 24.0, 19.0, 23.0, 19.0, 10.0, 12.0, 9.0, 10.0, 5.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.06451416015625, -0.0626683235168457, -0.060822486877441406, -0.05897665023803711, -0.05713081359863281, -0.055284976959228516, -0.05343914031982422, -0.05159330368041992, -0.049747467041015625, -0.04790163040161133, -0.04605579376220703, -0.044209957122802734, -0.04236412048339844, -0.04051828384399414, -0.038672447204589844, -0.03682661056518555, -0.03498077392578125, -0.03313493728637695, -0.031289100646972656, -0.02944326400756836, -0.027597427368164062, -0.025751590728759766, -0.02390575408935547, -0.022059917449951172, -0.020214080810546875, -0.018368244171142578, -0.01652240753173828, -0.014676570892333984, -0.012830734252929688, -0.01098489761352539, -0.009139060974121094, -0.007293224334716797, -0.0054473876953125, -0.003601551055908203, -0.0017557144165039062, 9.012222290039062e-05, 0.0019359588623046875, 0.0037817955017089844, 0.005627632141113281, 0.007473468780517578, 0.009319305419921875, 0.011165142059326172, 0.013010978698730469, 0.014856815338134766, 0.016702651977539062, 0.01854848861694336, 0.020394325256347656, 0.022240161895751953, 0.02408599853515625, 0.025931835174560547, 0.027777671813964844, 0.02962350845336914, 0.03146934509277344, 0.033315181732177734, 0.03516101837158203, 0.03700685501098633, 0.038852691650390625, 0.04069852828979492, 0.04254436492919922, 0.044390201568603516, 0.04623603820800781, 0.04808187484741211, 0.049927711486816406, 0.0517735481262207, 0.053619384765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 3.0, 7.0, 3.0, 5.0, 15.0, 19.0, 28.0, 37.0, 42.0, 60.0, 94.0, 172.0, 241.0, 432.0, 899.0, 2004.0, 4828.0, 11774.0, 28912.0, 85595.0, 426469.0, 367379.0, 74747.0, 26110.0, 10604.0, 4439.0, 1773.0, 798.0, 413.0, 215.0, 140.0, 85.0, 50.0, 45.0, 40.0, 25.0, 9.0, 14.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16643905639648438, -0.16088104248046875, -0.15532302856445312, -0.1497650146484375, -0.14420700073242188, -0.13864898681640625, -0.13309097290039062, -0.127532958984375, -0.12197494506835938, -0.11641693115234375, -0.11085891723632812, -0.1053009033203125, -0.09974288940429688, -0.09418487548828125, -0.08862686157226562, -0.08306884765625, -0.07751083374023438, -0.07195281982421875, -0.06639480590820312, -0.0608367919921875, -0.055278778076171875, -0.04972076416015625, -0.044162750244140625, -0.038604736328125, -0.033046722412109375, -0.02748870849609375, -0.021930694580078125, -0.0163726806640625, -0.010814666748046875, -0.00525665283203125, 0.000301361083984375, 0.005859375, 0.011417388916015625, 0.01697540283203125, 0.022533416748046875, 0.0280914306640625, 0.033649444580078125, 0.03920745849609375, 0.044765472412109375, 0.050323486328125, 0.055881500244140625, 0.06143951416015625, 0.06699752807617188, 0.0725555419921875, 0.07811355590820312, 0.08367156982421875, 0.08922958374023438, 0.09478759765625, 0.10034561157226562, 0.10590362548828125, 0.11146163940429688, 0.1170196533203125, 0.12257766723632812, 0.12813568115234375, 0.13369369506835938, 0.139251708984375, 0.14480972290039062, 0.15036773681640625, 0.15592575073242188, 0.1614837646484375, 0.16704177856445312, 0.17259979248046875, 0.17815780639648438, 0.1837158203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 9.0, 2.0, 9.0, 11.0, 8.0, 9.0, 16.0, 21.0, 20.0, 33.0, 23.0, 16.0, 34.0, 27.0, 31.0, 35.0, 44.0, 46.0, 36.0, 38.0, 39.0, 35.0, 41.0, 55.0, 46.0, 39.0, 36.0, 31.0, 30.0, 21.0, 21.0, 19.0, 18.0, 17.0, 14.0, 14.0, 5.0, 10.0, 3.0, 11.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.14736175537109375, -0.1425018310546875, -0.13764190673828125, -0.132781982421875, -0.12792205810546875, -0.1230621337890625, -0.11820220947265625, -0.11334228515625, -0.10848236083984375, -0.1036224365234375, -0.09876251220703125, -0.093902587890625, -0.08904266357421875, -0.0841827392578125, -0.07932281494140625, -0.074462890625, -0.06960296630859375, -0.0647430419921875, -0.05988311767578125, -0.055023193359375, -0.05016326904296875, -0.0453033447265625, -0.04044342041015625, -0.03558349609375, -0.03072357177734375, -0.0258636474609375, -0.02100372314453125, -0.016143798828125, -0.01128387451171875, -0.0064239501953125, -0.00156402587890625, 0.0032958984375, 0.00815582275390625, 0.0130157470703125, 0.01787567138671875, 0.022735595703125, 0.02759552001953125, 0.0324554443359375, 0.03731536865234375, 0.04217529296875, 0.04703521728515625, 0.0518951416015625, 0.05675506591796875, 0.061614990234375, 0.06647491455078125, 0.0713348388671875, 0.07619476318359375, 0.0810546875, 0.08591461181640625, 0.0907745361328125, 0.09563446044921875, 0.100494384765625, 0.10535430908203125, 0.1102142333984375, 0.11507415771484375, 0.11993408203125, 0.12479400634765625, 0.1296539306640625, 0.13451385498046875, 0.139373779296875, 0.14423370361328125, 0.1490936279296875, 0.15395355224609375, 0.1588134765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 8.0, 15.0, 22.0, 37.0, 60.0, 80.0, 156.0, 253.0, 437.0, 648.0, 1133.0, 1839.0, 2944.0, 4822.0, 7853.0, 13739.0, 27855.0, 69603.0, 217873.0, 393962.0, 187463.0, 61206.0, 24736.0, 12752.0, 7392.0, 4511.0, 2759.0, 1717.0, 1083.0, 610.0, 346.0, 224.0, 147.0, 88.0, 53.0, 43.0, 28.0, 19.0, 12.0, 2.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.045928955078125, -0.0445551872253418, -0.043181419372558594, -0.04180765151977539, -0.04043388366699219, -0.039060115814208984, -0.03768634796142578, -0.03631258010864258, -0.034938812255859375, -0.03356504440307617, -0.03219127655029297, -0.030817508697509766, -0.029443740844726562, -0.02806997299194336, -0.026696205139160156, -0.025322437286376953, -0.02394866943359375, -0.022574901580810547, -0.021201133728027344, -0.01982736587524414, -0.018453598022460938, -0.017079830169677734, -0.01570606231689453, -0.014332294464111328, -0.012958526611328125, -0.011584758758544922, -0.010210990905761719, -0.008837223052978516, -0.0074634552001953125, -0.006089687347412109, -0.004715919494628906, -0.003342151641845703, -0.0019683837890625, -0.0005946159362792969, 0.0007791519165039062, 0.0021529197692871094, 0.0035266876220703125, 0.004900455474853516, 0.006274223327636719, 0.007647991180419922, 0.009021759033203125, 0.010395526885986328, 0.011769294738769531, 0.013143062591552734, 0.014516830444335938, 0.01589059829711914, 0.017264366149902344, 0.018638134002685547, 0.02001190185546875, 0.021385669708251953, 0.022759437561035156, 0.02413320541381836, 0.025506973266601562, 0.026880741119384766, 0.02825450897216797, 0.029628276824951172, 0.031002044677734375, 0.03237581253051758, 0.03374958038330078, 0.035123348236083984, 0.03649711608886719, 0.03787088394165039, 0.039244651794433594, 0.0406184196472168, 0.0419921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 14.0, 22.0, 21.0, 33.0, 53.0, 80.0, 92.0, 117.0, 109.0, 112.0, 98.0, 60.0, 35.0, 40.0, 17.0, 19.0, 5.0, 10.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0205974578857422e-05, -1.955777406692505e-05, -1.8909573554992676e-05, -1.8261373043060303e-05, -1.761317253112793e-05, -1.6964972019195557e-05, -1.6316771507263184e-05, -1.566857099533081e-05, -1.5020370483398438e-05, -1.4372169971466064e-05, -1.3723969459533691e-05, -1.3075768947601318e-05, -1.2427568435668945e-05, -1.1779367923736572e-05, -1.11311674118042e-05, -1.0482966899871826e-05, -9.834766387939453e-06, -9.18656587600708e-06, -8.538365364074707e-06, -7.890164852142334e-06, -7.241964340209961e-06, -6.593763828277588e-06, -5.945563316345215e-06, -5.297362804412842e-06, -4.649162292480469e-06, -4.000961780548096e-06, -3.3527612686157227e-06, -2.7045607566833496e-06, -2.0563602447509766e-06, -1.4081597328186035e-06, -7.599592208862305e-07, -1.1175870895385742e-07, 5.364418029785156e-07, 1.1846423149108887e-06, 1.8328428268432617e-06, 2.4810433387756348e-06, 3.129243850708008e-06, 3.777444362640381e-06, 4.425644874572754e-06, 5.073845386505127e-06, 5.7220458984375e-06, 6.370246410369873e-06, 7.018446922302246e-06, 7.666647434234619e-06, 8.314847946166992e-06, 8.963048458099365e-06, 9.611248970031738e-06, 1.0259449481964111e-05, 1.0907649993896484e-05, 1.1555850505828857e-05, 1.220405101776123e-05, 1.2852251529693604e-05, 1.3500452041625977e-05, 1.414865255355835e-05, 1.4796853065490723e-05, 1.5445053577423096e-05, 1.609325408935547e-05, 1.6741454601287842e-05, 1.7389655113220215e-05, 1.8037855625152588e-05, 1.868605613708496e-05, 1.9334256649017334e-05, 1.9982457160949707e-05, 2.063065767288208e-05, 2.1278858184814453e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 10.0, 8.0, 19.0, 17.0, 32.0, 43.0, 70.0, 103.0, 166.0, 255.0, 425.0, 875.0, 1705.0, 3175.0, 6099.0, 12757.0, 28552.0, 81552.0, 247954.0, 377174.0, 184813.0, 59467.0, 22002.0, 10272.0, 5183.0, 2708.0, 1338.0, 731.0, 401.0, 211.0, 144.0, 81.0, 57.0, 39.0, 25.0, 15.0, 19.0, 5.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.04620361328125, -0.044730186462402344, -0.04325675964355469, -0.04178333282470703, -0.040309906005859375, -0.03883647918701172, -0.03736305236816406, -0.035889625549316406, -0.03441619873046875, -0.032942771911621094, -0.03146934509277344, -0.02999591827392578, -0.028522491455078125, -0.02704906463623047, -0.025575637817382812, -0.024102210998535156, -0.0226287841796875, -0.021155357360839844, -0.019681930541992188, -0.01820850372314453, -0.016735076904296875, -0.015261650085449219, -0.013788223266601562, -0.012314796447753906, -0.01084136962890625, -0.009367942810058594, -0.007894515991210938, -0.006421089172363281, -0.004947662353515625, -0.0034742355346679688, -0.0020008087158203125, -0.0005273818969726562, 0.000946044921875, 0.0024194717407226562, 0.0038928985595703125, 0.005366325378417969, 0.006839752197265625, 0.008313179016113281, 0.009786605834960938, 0.011260032653808594, 0.01273345947265625, 0.014206886291503906, 0.015680313110351562, 0.01715373992919922, 0.018627166748046875, 0.02010059356689453, 0.021574020385742188, 0.023047447204589844, 0.0245208740234375, 0.025994300842285156, 0.027467727661132812, 0.02894115447998047, 0.030414581298828125, 0.03188800811767578, 0.03336143493652344, 0.034834861755371094, 0.03630828857421875, 0.037781715393066406, 0.03925514221191406, 0.04072856903076172, 0.042201995849609375, 0.04367542266845703, 0.04514884948730469, 0.046622276306152344, 0.048095703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 9.0, 6.0, 9.0, 12.0, 9.0, 14.0, 26.0, 43.0, 41.0, 75.0, 77.0, 76.0, 95.0, 93.0, 85.0, 74.0, 54.0, 36.0, 36.0, 20.0, 20.0, 18.0, 18.0, 17.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.041228294372558594, -0.03970146179199219, -0.03817462921142578, -0.036647796630859375, -0.03512096405029297, -0.03359413146972656, -0.032067298889160156, -0.03054046630859375, -0.029013633728027344, -0.027486801147460938, -0.02595996856689453, -0.024433135986328125, -0.02290630340576172, -0.021379470825195312, -0.019852638244628906, -0.0183258056640625, -0.016798973083496094, -0.015272140502929688, -0.013745307922363281, -0.012218475341796875, -0.010691642761230469, -0.009164810180664062, -0.007637977600097656, -0.00611114501953125, -0.004584312438964844, -0.0030574798583984375, -0.0015306472778320312, -3.814697265625e-06, 0.0015230178833007812, 0.0030498504638671875, 0.004576683044433594, 0.006103515625, 0.007630348205566406, 0.009157180786132812, 0.010684013366699219, 0.012210845947265625, 0.013737678527832031, 0.015264511108398438, 0.016791343688964844, 0.01831817626953125, 0.019845008850097656, 0.021371841430664062, 0.02289867401123047, 0.024425506591796875, 0.02595233917236328, 0.027479171752929688, 0.029006004333496094, 0.0305328369140625, 0.032059669494628906, 0.03358650207519531, 0.03511333465576172, 0.036640167236328125, 0.03816699981689453, 0.03969383239746094, 0.041220664978027344, 0.04274749755859375, 0.044274330139160156, 0.04580116271972656, 0.04732799530029297, 0.048854827880859375, 0.05038166046142578, 0.05190849304199219, 0.053435325622558594, 0.054962158203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 10.0, 32.0, 48.0, 78.0, 103.0, 144.0, 135.0, 138.0, 113.0, 73.0, 51.0, 28.0, 16.0, 12.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.9762471914291382, -0.9521121382713318, -0.9279770851135254, -0.9038420915603638, -0.8797070384025574, -0.855571985244751, -0.8314369916915894, -0.807301938533783, -0.7831668853759766, -0.7590318322181702, -0.7348967790603638, -0.7107617855072021, -0.6866267323493958, -0.6624916791915894, -0.6383566856384277, -0.6142216324806213, -0.5900865793228149, -0.5659515261650085, -0.5418164730072021, -0.5176814794540405, -0.49354642629623413, -0.46941137313842773, -0.4452763497829437, -0.4211413264274597, -0.3970062732696533, -0.3728712201118469, -0.3487361967563629, -0.3246011734008789, -0.3004661202430725, -0.2763310670852661, -0.2521960437297821, -0.2280610054731369, -0.2039259672164917, -0.1797909289598465, -0.1556558907032013, -0.1315208524465561, -0.10738581418991089, -0.08325077593326569, -0.05911573767662048, -0.03498069941997528, -0.010845661163330078, 0.013289377093315125, 0.03742441534996033, 0.06155945360660553, 0.08569449186325073, 0.10982953011989594, 0.13396456837654114, 0.15809960663318634, 0.18223464488983154, 0.20636968314647675, 0.23050472140312195, 0.25463974475860596, 0.27877479791641235, 0.30290985107421875, 0.32704487442970276, 0.35117989778518677, 0.37531495094299316, 0.39945000410079956, 0.42358502745628357, 0.4477200508117676, 0.471855103969574, 0.49599015712738037, 0.520125150680542, 0.5442602038383484, 0.5683952569961548]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 2.0, 7.0, 8.0, 17.0, 11.0, 18.0, 14.0, 18.0, 19.0, 22.0, 27.0, 34.0, 21.0, 30.0, 40.0, 44.0, 46.0, 40.0, 45.0, 51.0, 51.0, 42.0, 46.0, 43.0, 40.0, 40.0, 27.0, 23.0, 34.0, 18.0, 25.0, 18.0, 18.0, 10.0, 11.0, 8.0, 7.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4616820216178894, -0.4485746920108795, -0.43546736240386963, -0.42236006259918213, -0.40925273299217224, -0.39614540338516235, -0.38303810358047485, -0.36993077397346497, -0.3568234443664551, -0.3437161147594452, -0.3306087851524353, -0.3175014853477478, -0.3043941557407379, -0.291286826133728, -0.2781795263290405, -0.26507219672203064, -0.25196486711502075, -0.23885753750801086, -0.22575022280216217, -0.21264290809631348, -0.1995355784893036, -0.1864282488822937, -0.173320934176445, -0.1602136194705963, -0.14710628986358643, -0.13399896025657654, -0.12089164555072784, -0.10778432339429855, -0.09467700123786926, -0.08156967908143997, -0.06846235692501068, -0.05535503476858139, -0.0422477126121521, -0.02914039045572281, -0.016033068299293518, -0.0029257461428642273, 0.010181576013565063, 0.023288898169994354, 0.036396220326423645, 0.049503542482852936, 0.06261086463928223, 0.07571818679571152, 0.08882550895214081, 0.1019328311085701, 0.11504015326499939, 0.12814748287200928, 0.14125479757785797, 0.15436211228370667, 0.16746944189071655, 0.18057677149772644, 0.19368408620357513, 0.20679140090942383, 0.21989873051643372, 0.2330060601234436, 0.2461133748292923, 0.259220689535141, 0.2723280191421509, 0.28543534874916077, 0.29854267835617065, 0.31164997816085815, 0.32475730776786804, 0.33786463737487793, 0.35097193717956543, 0.3640792667865753, 0.3771865963935852]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 1.0, 7.0, 7.0, 6.0, 9.0, 14.0, 27.0, 29.0, 63.0, 65.0, 107.0, 193.0, 314.0, 557.0, 1065.0, 2066.0, 4127.0, 8268.0, 17335.0, 37143.0, 85546.0, 227379.0, 765036.0, 1733876.0, 880342.0, 260882.0, 94215.0, 39942.0, 18259.0, 8618.0, 4225.0, 2092.0, 1048.0, 555.0, 323.0, 192.0, 117.0, 71.0, 55.0, 34.0, 22.0, 21.0, 15.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08978271484375, -0.08710670471191406, -0.08443069458007812, -0.08175468444824219, -0.07907867431640625, -0.07640266418457031, -0.07372665405273438, -0.07105064392089844, -0.0683746337890625, -0.06569862365722656, -0.06302261352539062, -0.06034660339355469, -0.05767059326171875, -0.05499458312988281, -0.052318572998046875, -0.04964256286621094, -0.046966552734375, -0.04429054260253906, -0.041614532470703125, -0.03893852233886719, -0.03626251220703125, -0.03358650207519531, -0.030910491943359375, -0.028234481811523438, -0.0255584716796875, -0.022882461547851562, -0.020206451416015625, -0.017530441284179688, -0.01485443115234375, -0.012178421020507812, -0.009502410888671875, -0.0068264007568359375, -0.004150390625, -0.0014743804931640625, 0.001201629638671875, 0.0038776397705078125, 0.00655364990234375, 0.009229660034179688, 0.011905670166015625, 0.014581680297851562, 0.0172576904296875, 0.019933700561523438, 0.022609710693359375, 0.025285720825195312, 0.02796173095703125, 0.030637741088867188, 0.033313751220703125, 0.03598976135253906, 0.038665771484375, 0.04134178161621094, 0.044017791748046875, 0.04669380187988281, 0.04936981201171875, 0.05204582214355469, 0.054721832275390625, 0.05739784240722656, 0.0600738525390625, 0.06274986267089844, 0.06542587280273438, 0.06810188293457031, 0.07077789306640625, 0.07345390319824219, 0.07612991333007812, 0.07880592346191406, 0.08148193359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 5.0, 5.0, 11.0, 16.0, 17.0, 18.0, 24.0, 23.0, 18.0, 31.0, 25.0, 30.0, 33.0, 47.0, 32.0, 34.0, 46.0, 38.0, 41.0, 44.0, 29.0, 40.0, 28.0, 44.0, 29.0, 32.0, 27.0, 34.0, 32.0, 22.0, 18.0, 25.0, 9.0, 13.0, 16.0, 11.0, 8.0, 5.0, 10.0, 1.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0631103515625, -0.06129598617553711, -0.05948162078857422, -0.05766725540161133, -0.05585289001464844, -0.05403852462768555, -0.052224159240722656, -0.050409793853759766, -0.048595428466796875, -0.046781063079833984, -0.044966697692871094, -0.0431523323059082, -0.04133796691894531, -0.03952360153198242, -0.03770923614501953, -0.03589487075805664, -0.03408050537109375, -0.03226613998413086, -0.03045177459716797, -0.028637409210205078, -0.026823043823242188, -0.025008678436279297, -0.023194313049316406, -0.021379947662353516, -0.019565582275390625, -0.017751216888427734, -0.015936851501464844, -0.014122486114501953, -0.012308120727539062, -0.010493755340576172, -0.008679389953613281, -0.006865024566650391, -0.0050506591796875, -0.0032362937927246094, -0.0014219284057617188, 0.0003924369812011719, 0.0022068023681640625, 0.004021167755126953, 0.005835533142089844, 0.007649898529052734, 0.009464263916015625, 0.011278629302978516, 0.013092994689941406, 0.014907360076904297, 0.016721725463867188, 0.018536090850830078, 0.02035045623779297, 0.02216482162475586, 0.02397918701171875, 0.02579355239868164, 0.02760791778564453, 0.029422283172607422, 0.031236648559570312, 0.0330510139465332, 0.034865379333496094, 0.036679744720458984, 0.038494110107421875, 0.040308475494384766, 0.042122840881347656, 0.04393720626831055, 0.04575157165527344, 0.04756593704223633, 0.04938030242919922, 0.05119466781616211, 0.053009033203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 17.0, 20.0, 43.0, 68.0, 93.0, 176.0, 322.0, 611.0, 1131.0, 2183.0, 4725.0, 10273.0, 23629.0, 56655.0, 144599.0, 445675.0, 1743557.0, 1257429.0, 314668.0, 109739.0, 43657.0, 18850.0, 8223.0, 3829.0, 1869.0, 960.0, 522.0, 250.0, 178.0, 102.0, 62.0, 52.0, 35.0, 16.0, 16.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09344196319580078, -0.09020423889160156, -0.08696651458740234, -0.08372879028320312, -0.0804910659790039, -0.07725334167480469, -0.07401561737060547, -0.07077789306640625, -0.06754016876220703, -0.06430244445800781, -0.061064720153808594, -0.057826995849609375, -0.054589271545410156, -0.05135154724121094, -0.04811382293701172, -0.0448760986328125, -0.04163837432861328, -0.03840065002441406, -0.035162925720214844, -0.031925201416015625, -0.028687477111816406, -0.025449752807617188, -0.02221202850341797, -0.01897430419921875, -0.01573657989501953, -0.012498855590820312, -0.009261131286621094, -0.006023406982421875, -0.0027856826782226562, 0.0004520416259765625, 0.0036897659301757812, 0.006927490234375, 0.010165214538574219, 0.013402938842773438, 0.016640663146972656, 0.019878387451171875, 0.023116111755371094, 0.026353836059570312, 0.02959156036376953, 0.03282928466796875, 0.03606700897216797, 0.03930473327636719, 0.042542457580566406, 0.045780181884765625, 0.049017906188964844, 0.05225563049316406, 0.05549335479736328, 0.0587310791015625, 0.06196880340576172, 0.06520652770996094, 0.06844425201416016, 0.07168197631835938, 0.0749197006225586, 0.07815742492675781, 0.08139514923095703, 0.08463287353515625, 0.08787059783935547, 0.09110832214355469, 0.0943460464477539, 0.09758377075195312, 0.10082149505615234, 0.10405921936035156, 0.10729694366455078, 0.11053466796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 3.0, 8.0, 14.0, 18.0, 17.0, 26.0, 34.0, 44.0, 60.0, 60.0, 92.0, 112.0, 162.0, 228.0, 347.0, 487.0, 524.0, 503.0, 373.0, 257.0, 184.0, 111.0, 74.0, 83.0, 52.0, 38.0, 34.0, 25.0, 13.0, 21.0, 14.0, 15.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12353515625, -0.1197509765625, -0.115966796875, -0.1121826171875, -0.1083984375, -0.1046142578125, -0.100830078125, -0.0970458984375, -0.09326171875, -0.0894775390625, -0.085693359375, -0.0819091796875, -0.078125, -0.0743408203125, -0.070556640625, -0.0667724609375, -0.06298828125, -0.0592041015625, -0.055419921875, -0.0516357421875, -0.0478515625, -0.0440673828125, -0.040283203125, -0.0364990234375, -0.03271484375, -0.0289306640625, -0.025146484375, -0.0213623046875, -0.017578125, -0.0137939453125, -0.010009765625, -0.0062255859375, -0.00244140625, 0.0013427734375, 0.005126953125, 0.0089111328125, 0.0126953125, 0.0164794921875, 0.020263671875, 0.0240478515625, 0.02783203125, 0.0316162109375, 0.035400390625, 0.0391845703125, 0.04296875, 0.0467529296875, 0.050537109375, 0.0543212890625, 0.05810546875, 0.0618896484375, 0.065673828125, 0.0694580078125, 0.0732421875, 0.0770263671875, 0.080810546875, 0.0845947265625, 0.08837890625, 0.0921630859375, 0.095947265625, 0.0997314453125, 0.103515625, 0.1072998046875, 0.111083984375, 0.1148681640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 3.0, 6.0, 7.0, 16.0, 23.0, 42.0, 65.0, 73.0, 99.0, 122.0, 145.0, 114.0, 98.0, 71.0, 58.0, 28.0, 12.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8450343608856201, -0.8171789050102234, -0.7893233895301819, -0.7614679336547852, -0.7336124181747437, -0.7057569622993469, -0.6779014468193054, -0.6500459909439087, -0.6221904754638672, -0.5943350195884705, -0.566479504108429, -0.5386240482330322, -0.5107685327529907, -0.482913076877594, -0.4550575613975525, -0.42720210552215576, -0.39934661984443665, -0.37149113416671753, -0.3436356484889984, -0.3157801628112793, -0.2879246771335602, -0.26006919145584106, -0.23221372067928314, -0.20435823500156403, -0.1765027493238449, -0.1486472636461258, -0.12079177796840668, -0.09293629974126816, -0.06508081406354904, -0.03722533583641052, -0.009369850158691406, 0.01848563551902771, 0.046341121196746826, 0.07419660687446594, 0.10205209255218506, 0.12990757822990417, 0.1577630639076233, 0.1856185346841812, 0.21347402036190033, 0.24132950603961945, 0.26918500661849976, 0.29704049229621887, 0.324895977973938, 0.3527514636516571, 0.3806069493293762, 0.40846240520477295, 0.43631792068481445, 0.4641733765602112, 0.4920288622379303, 0.5198843479156494, 0.5477398037910461, 0.5755953192710876, 0.6034507751464844, 0.6313062906265259, 0.6591617465019226, 0.6870172619819641, 0.7148727178573608, 0.7427281737327576, 0.7705836892127991, 0.7984391450881958, 0.8262946605682373, 0.854150116443634, 0.8820056319236755, 0.9098610877990723, 0.9377166032791138]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 7.0, 8.0, 8.0, 12.0, 12.0, 12.0, 25.0, 17.0, 22.0, 21.0, 30.0, 36.0, 32.0, 42.0, 44.0, 38.0, 52.0, 39.0, 47.0, 36.0, 37.0, 44.0, 51.0, 40.0, 47.0, 30.0, 36.0, 26.0, 21.0, 15.0, 25.0, 19.0, 11.0, 15.0, 8.0, 14.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36221349239349365, -0.34868741035461426, -0.3351612985134125, -0.3216352164745331, -0.3081091046333313, -0.2945830225944519, -0.2810569405555725, -0.2675308287143707, -0.25400471687316895, -0.24047861993312836, -0.22695252299308777, -0.21342644095420837, -0.1999003291130066, -0.1863742470741272, -0.1728481501340866, -0.15932205319404602, -0.14579597115516663, -0.13226987421512604, -0.11874377727508545, -0.10521768778562546, -0.09169159084558487, -0.07816549390554428, -0.06463940441608429, -0.0511133074760437, -0.03758721053600311, -0.024061115458607674, -0.010535020381212234, 0.0029910728335380554, 0.016517169773578644, 0.030043266713619232, 0.043569356203079224, 0.05709545314311981, 0.0706215500831604, 0.08414764702320099, 0.09767374396324158, 0.11119983345270157, 0.12472593039274216, 0.13825201988220215, 0.15177811682224274, 0.16530421376228333, 0.1788303107023239, 0.1923564076423645, 0.2058825045824051, 0.21940860152244568, 0.23293468356132507, 0.24646079540252686, 0.25998687744140625, 0.27351295948028564, 0.2870390713214874, 0.3005651533603668, 0.3140912652015686, 0.327617347240448, 0.3411434590816498, 0.3546695411205292, 0.36819565296173096, 0.38172173500061035, 0.39524781703948975, 0.40877389907836914, 0.4223000109195709, 0.4358260929584503, 0.4493522047996521, 0.4628782868385315, 0.4764043688774109, 0.48993048071861267, 0.5034565925598145]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 21.0, 33.0, 49.0, 66.0, 95.0, 187.0, 254.0, 426.0, 602.0, 977.0, 1592.0, 2457.0, 3802.0, 5673.0, 8589.0, 12920.0, 19648.0, 32807.0, 71819.0, 196762.0, 330310.0, 196810.0, 72198.0, 33051.0, 19482.0, 13009.0, 8688.0, 5676.0, 3753.0, 2361.0, 1576.0, 1011.0, 709.0, 402.0, 252.0, 147.0, 116.0, 69.0, 30.0, 39.0, 25.0, 11.0, 9.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09515380859375, -0.09222602844238281, -0.08929824829101562, -0.08637046813964844, -0.08344268798828125, -0.08051490783691406, -0.07758712768554688, -0.07465934753417969, -0.0717315673828125, -0.06880378723144531, -0.06587600708007812, -0.06294822692871094, -0.06002044677734375, -0.05709266662597656, -0.054164886474609375, -0.05123710632324219, -0.048309326171875, -0.04538154602050781, -0.042453765869140625, -0.03952598571777344, -0.03659820556640625, -0.03367042541503906, -0.030742645263671875, -0.027814865112304688, -0.0248870849609375, -0.021959304809570312, -0.019031524658203125, -0.016103744506835938, -0.01317596435546875, -0.010248184204101562, -0.007320404052734375, -0.0043926239013671875, -0.00146484375, 0.0014629364013671875, 0.004390716552734375, 0.0073184967041015625, 0.01024627685546875, 0.013174057006835938, 0.016101837158203125, 0.019029617309570312, 0.0219573974609375, 0.024885177612304688, 0.027812957763671875, 0.030740737915039062, 0.03366851806640625, 0.03659629821777344, 0.039524078369140625, 0.04245185852050781, 0.045379638671875, 0.04830741882324219, 0.051235198974609375, 0.05416297912597656, 0.05709075927734375, 0.06001853942871094, 0.06294631958007812, 0.06587409973144531, 0.0688018798828125, 0.07172966003417969, 0.07465744018554688, 0.07758522033691406, 0.08051300048828125, 0.08344078063964844, 0.08636856079101562, 0.08929634094238281, 0.09222412109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 11.0, 15.0, 17.0, 15.0, 19.0, 17.0, 19.0, 29.0, 31.0, 29.0, 44.0, 44.0, 38.0, 44.0, 52.0, 45.0, 45.0, 44.0, 52.0, 49.0, 48.0, 45.0, 32.0, 40.0, 40.0, 22.0, 11.0, 18.0, 18.0, 9.0, 7.0, 9.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0743408203125, -0.07226181030273438, -0.07018280029296875, -0.06810379028320312, -0.0660247802734375, -0.06394577026367188, -0.06186676025390625, -0.059787750244140625, -0.057708740234375, -0.055629730224609375, -0.05355072021484375, -0.051471710205078125, -0.0493927001953125, -0.047313690185546875, -0.04523468017578125, -0.043155670166015625, -0.04107666015625, -0.038997650146484375, -0.03691864013671875, -0.034839630126953125, -0.0327606201171875, -0.030681610107421875, -0.02860260009765625, -0.026523590087890625, -0.024444580078125, -0.022365570068359375, -0.02028656005859375, -0.018207550048828125, -0.0161285400390625, -0.014049530029296875, -0.01197052001953125, -0.009891510009765625, -0.0078125, -0.005733489990234375, -0.00365447998046875, -0.001575469970703125, 0.0005035400390625, 0.002582550048828125, 0.00466156005859375, 0.006740570068359375, 0.008819580078125, 0.010898590087890625, 0.01297760009765625, 0.015056610107421875, 0.0171356201171875, 0.019214630126953125, 0.02129364013671875, 0.023372650146484375, 0.02545166015625, 0.027530670166015625, 0.02960968017578125, 0.031688690185546875, 0.0337677001953125, 0.035846710205078125, 0.03792572021484375, 0.040004730224609375, 0.042083740234375, 0.044162750244140625, 0.04624176025390625, 0.048320770263671875, 0.0503997802734375, 0.052478790283203125, 0.05455780029296875, 0.056636810302734375, 0.0587158203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 12.0, 4.0, 13.0, 14.0, 32.0, 58.0, 94.0, 121.0, 201.0, 364.0, 690.0, 1836.0, 5647.0, 19490.0, 75789.0, 534318.0, 337566.0, 51728.0, 13879.0, 4007.0, 1342.0, 557.0, 303.0, 180.0, 103.0, 61.0, 45.0, 35.0, 22.0, 16.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21400070190429688, -0.20632171630859375, -0.19864273071289062, -0.1909637451171875, -0.18328475952148438, -0.17560577392578125, -0.16792678833007812, -0.160247802734375, -0.15256881713867188, -0.14488983154296875, -0.13721084594726562, -0.1295318603515625, -0.12185287475585938, -0.11417388916015625, -0.10649490356445312, -0.09881591796875, -0.09113693237304688, -0.08345794677734375, -0.07577896118164062, -0.0680999755859375, -0.060420989990234375, -0.05274200439453125, -0.045063018798828125, -0.037384033203125, -0.029705047607421875, -0.02202606201171875, -0.014347076416015625, -0.0066680908203125, 0.001010894775390625, 0.00868988037109375, 0.016368865966796875, 0.0240478515625, 0.031726837158203125, 0.03940582275390625, 0.047084808349609375, 0.0547637939453125, 0.062442779541015625, 0.07012176513671875, 0.07780075073242188, 0.085479736328125, 0.09315872192382812, 0.10083770751953125, 0.10851669311523438, 0.1161956787109375, 0.12387466430664062, 0.13155364990234375, 0.13923263549804688, 0.14691162109375, 0.15459060668945312, 0.16226959228515625, 0.16994857788085938, 0.1776275634765625, 0.18530654907226562, 0.19298553466796875, 0.20066452026367188, 0.208343505859375, 0.21602249145507812, 0.22370147705078125, 0.23138046264648438, 0.2390594482421875, 0.24673843383789062, 0.25441741943359375, 0.2620964050292969, 0.269775390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 13.0, 13.0, 16.0, 19.0, 22.0, 20.0, 24.0, 25.0, 26.0, 41.0, 44.0, 38.0, 44.0, 54.0, 36.0, 40.0, 41.0, 47.0, 38.0, 42.0, 37.0, 38.0, 36.0, 30.0, 25.0, 20.0, 14.0, 11.0, 21.0, 16.0, 17.0, 7.0, 13.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16368484497070312, -0.15818023681640625, -0.15267562866210938, -0.1471710205078125, -0.14166641235351562, -0.13616180419921875, -0.13065719604492188, -0.125152587890625, -0.11964797973632812, -0.11414337158203125, -0.10863876342773438, -0.1031341552734375, -0.09762954711914062, -0.09212493896484375, -0.08662033081054688, -0.08111572265625, -0.07561111450195312, -0.07010650634765625, -0.06460189819335938, -0.0590972900390625, -0.053592681884765625, -0.04808807373046875, -0.042583465576171875, -0.037078857421875, -0.031574249267578125, -0.02606964111328125, -0.020565032958984375, -0.0150604248046875, -0.009555816650390625, -0.00405120849609375, 0.001453399658203125, 0.0069580078125, 0.012462615966796875, 0.01796722412109375, 0.023471832275390625, 0.0289764404296875, 0.034481048583984375, 0.03998565673828125, 0.045490264892578125, 0.050994873046875, 0.056499481201171875, 0.06200408935546875, 0.06750869750976562, 0.0730133056640625, 0.07851791381835938, 0.08402252197265625, 0.08952713012695312, 0.09503173828125, 0.10053634643554688, 0.10604095458984375, 0.11154556274414062, 0.1170501708984375, 0.12255477905273438, 0.12805938720703125, 0.13356399536132812, 0.139068603515625, 0.14457321166992188, 0.15007781982421875, 0.15558242797851562, 0.1610870361328125, 0.16659164428710938, 0.17209625244140625, 0.17760086059570312, 0.18310546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 8.0, 7.0, 18.0, 42.0, 57.0, 60.0, 106.0, 205.0, 403.0, 723.0, 1383.0, 2758.0, 5527.0, 10717.0, 20390.0, 40584.0, 105673.0, 392825.0, 312707.0, 82529.0, 34791.0, 17985.0, 9288.0, 4696.0, 2394.0, 1221.0, 606.0, 374.0, 204.0, 96.0, 55.0, 37.0, 19.0, 16.0, 12.0, 9.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.057861328125, -0.05610227584838867, -0.054343223571777344, -0.052584171295166016, -0.05082511901855469, -0.04906606674194336, -0.04730701446533203, -0.0455479621887207, -0.043788909912109375, -0.04202985763549805, -0.04027080535888672, -0.03851175308227539, -0.03675270080566406, -0.034993648529052734, -0.033234596252441406, -0.03147554397583008, -0.02971649169921875, -0.027957439422607422, -0.026198387145996094, -0.024439334869384766, -0.022680282592773438, -0.02092123031616211, -0.01916217803955078, -0.017403125762939453, -0.015644073486328125, -0.013885021209716797, -0.012125968933105469, -0.01036691665649414, -0.008607864379882812, -0.006848812103271484, -0.005089759826660156, -0.003330707550048828, -0.0015716552734375, 0.00018739700317382812, 0.0019464492797851562, 0.0037055015563964844, 0.0054645538330078125, 0.007223606109619141, 0.008982658386230469, 0.010741710662841797, 0.012500762939453125, 0.014259815216064453, 0.01601886749267578, 0.01777791976928711, 0.019536972045898438, 0.021296024322509766, 0.023055076599121094, 0.024814128875732422, 0.02657318115234375, 0.028332233428955078, 0.030091285705566406, 0.031850337982177734, 0.03360939025878906, 0.03536844253540039, 0.03712749481201172, 0.03888654708862305, 0.040645599365234375, 0.0424046516418457, 0.04416370391845703, 0.04592275619506836, 0.04768180847167969, 0.049440860748291016, 0.051199913024902344, 0.05295896530151367, 0.054718017578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 6.0, 3.0, 9.0, 11.0, 10.0, 19.0, 20.0, 34.0, 66.0, 77.0, 108.0, 135.0, 118.0, 94.0, 71.0, 54.0, 31.0, 17.0, 18.0, 10.0, 13.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1338462829589844e-05, -2.055242657661438e-05, -1.9766390323638916e-05, -1.8980354070663452e-05, -1.8194317817687988e-05, -1.7408281564712524e-05, -1.662224531173706e-05, -1.5836209058761597e-05, -1.5050172805786133e-05, -1.4264136552810669e-05, -1.3478100299835205e-05, -1.2692064046859741e-05, -1.1906027793884277e-05, -1.1119991540908813e-05, -1.033395528793335e-05, -9.547919034957886e-06, -8.761882781982422e-06, -7.975846529006958e-06, -7.189810276031494e-06, -6.40377402305603e-06, -5.617737770080566e-06, -4.8317015171051025e-06, -4.045665264129639e-06, -3.259629011154175e-06, -2.473592758178711e-06, -1.687556505203247e-06, -9.015202522277832e-07, -1.1548399925231934e-07, 6.705522537231445e-07, 1.4565885066986084e-06, 2.2426247596740723e-06, 3.028661012649536e-06, 3.814697265625e-06, 4.600733518600464e-06, 5.386769771575928e-06, 6.172806024551392e-06, 6.9588422775268555e-06, 7.74487853050232e-06, 8.530914783477783e-06, 9.316951036453247e-06, 1.0102987289428711e-05, 1.0889023542404175e-05, 1.1675059795379639e-05, 1.2461096048355103e-05, 1.3247132301330566e-05, 1.403316855430603e-05, 1.4819204807281494e-05, 1.5605241060256958e-05, 1.6391277313232422e-05, 1.7177313566207886e-05, 1.796334981918335e-05, 1.8749386072158813e-05, 1.9535422325134277e-05, 2.032145857810974e-05, 2.1107494831085205e-05, 2.189353108406067e-05, 2.2679567337036133e-05, 2.3465603590011597e-05, 2.425163984298706e-05, 2.5037676095962524e-05, 2.5823712348937988e-05, 2.6609748601913452e-05, 2.7395784854888916e-05, 2.818182110786438e-05, 2.8967857360839844e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 7.0, 7.0, 8.0, 4.0, 18.0, 19.0, 30.0, 47.0, 51.0, 82.0, 148.0, 217.0, 403.0, 651.0, 1297.0, 2756.0, 6824.0, 17497.0, 44681.0, 133912.0, 440771.0, 274384.0, 76494.0, 28506.0, 11200.0, 4502.0, 1904.0, 931.0, 450.0, 272.0, 173.0, 93.0, 62.0, 42.0, 36.0, 26.0, 13.0, 12.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06610107421875, -0.06419944763183594, -0.062297821044921875, -0.06039619445800781, -0.05849456787109375, -0.05659294128417969, -0.054691314697265625, -0.05278968811035156, -0.0508880615234375, -0.04898643493652344, -0.047084808349609375, -0.04518318176269531, -0.04328155517578125, -0.04137992858886719, -0.039478302001953125, -0.03757667541503906, -0.035675048828125, -0.03377342224121094, -0.031871795654296875, -0.029970169067382812, -0.02806854248046875, -0.026166915893554688, -0.024265289306640625, -0.022363662719726562, -0.0204620361328125, -0.018560409545898438, -0.016658782958984375, -0.014757156372070312, -0.01285552978515625, -0.010953903198242188, -0.009052276611328125, -0.0071506500244140625, -0.0052490234375, -0.0033473968505859375, -0.001445770263671875, 0.0004558563232421875, 0.00235748291015625, 0.0042591094970703125, 0.006160736083984375, 0.008062362670898438, 0.0099639892578125, 0.011865615844726562, 0.013767242431640625, 0.015668869018554688, 0.01757049560546875, 0.019472122192382812, 0.021373748779296875, 0.023275375366210938, 0.025177001953125, 0.027078628540039062, 0.028980255126953125, 0.030881881713867188, 0.03278350830078125, 0.03468513488769531, 0.036586761474609375, 0.03848838806152344, 0.0403900146484375, 0.04229164123535156, 0.044193267822265625, 0.04609489440917969, 0.04799652099609375, 0.04989814758300781, 0.051799774169921875, 0.05370140075683594, 0.05560302734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 11.0, 6.0, 7.0, 5.0, 14.0, 7.0, 14.0, 18.0, 21.0, 28.0, 29.0, 35.0, 62.0, 55.0, 74.0, 77.0, 85.0, 72.0, 53.0, 53.0, 44.0, 36.0, 31.0, 22.0, 19.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 4.0, 4.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.046112060546875, -0.044704437255859375, -0.04329681396484375, -0.041889190673828125, -0.0404815673828125, -0.039073944091796875, -0.03766632080078125, -0.036258697509765625, -0.03485107421875, -0.033443450927734375, -0.03203582763671875, -0.030628204345703125, -0.0292205810546875, -0.027812957763671875, -0.02640533447265625, -0.024997711181640625, -0.023590087890625, -0.022182464599609375, -0.02077484130859375, -0.019367218017578125, -0.0179595947265625, -0.016551971435546875, -0.01514434814453125, -0.013736724853515625, -0.0123291015625, -0.010921478271484375, -0.00951385498046875, -0.008106231689453125, -0.0066986083984375, -0.005290985107421875, -0.00388336181640625, -0.002475738525390625, -0.001068115234375, 0.000339508056640625, 0.00174713134765625, 0.003154754638671875, 0.0045623779296875, 0.005970001220703125, 0.00737762451171875, 0.008785247802734375, 0.01019287109375, 0.011600494384765625, 0.01300811767578125, 0.014415740966796875, 0.0158233642578125, 0.017230987548828125, 0.01863861083984375, 0.020046234130859375, 0.021453857421875, 0.022861480712890625, 0.02426910400390625, 0.025676727294921875, 0.0270843505859375, 0.028491973876953125, 0.02989959716796875, 0.031307220458984375, 0.03271484375, 0.034122467041015625, 0.03553009033203125, 0.036937713623046875, 0.0383453369140625, 0.039752960205078125, 0.04116058349609375, 0.042568206787109375, 0.043975830078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 13.0, 18.0, 65.0, 125.0, 194.0, 226.0, 178.0, 108.0, 34.0, 13.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7120633125305176, -1.6716995239257812, -1.6313356161117554, -1.5909717082977295, -1.5506079196929932, -1.5102441310882568, -1.469880223274231, -1.429516315460205, -1.3891525268554688, -1.3487887382507324, -1.3084248304367065, -1.2680609226226807, -1.2276971340179443, -1.187333345413208, -1.1469694375991821, -1.1066055297851562, -1.06624174118042, -1.0258779525756836, -0.9855140447616577, -0.9451501965522766, -0.9047863483428955, -0.8644225001335144, -0.8240586519241333, -0.7836948037147522, -0.7433309555053711, -0.70296710729599, -0.6626032590866089, -0.6222394108772278, -0.5818755626678467, -0.5415117144584656, -0.5011478662490845, -0.46078401803970337, -0.4204202890396118, -0.3800564408302307, -0.3396925926208496, -0.2993287444114685, -0.2589648962020874, -0.2186010479927063, -0.1782371997833252, -0.1378733515739441, -0.09750950336456299, -0.057145655155181885, -0.01678180694580078, 0.023582041263580322, 0.06394588947296143, 0.10430973768234253, 0.14467358589172363, 0.18503743410110474, 0.22540128231048584, 0.26576513051986694, 0.30612897872924805, 0.34649282693862915, 0.38685667514801025, 0.42722052335739136, 0.46758437156677246, 0.5079482197761536, 0.5483120679855347, 0.5886759161949158, 0.6290397644042969, 0.669403612613678, 0.7097674608230591, 0.7501313090324402, 0.7904951572418213, 0.8308590054512024, 0.8712228536605835]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 9.0, 2.0, 5.0, 4.0, 5.0, 9.0, 11.0, 11.0, 16.0, 11.0, 29.0, 25.0, 27.0, 20.0, 29.0, 23.0, 34.0, 22.0, 31.0, 32.0, 25.0, 45.0, 40.0, 55.0, 51.0, 40.0, 32.0, 39.0, 33.0, 39.0, 19.0, 26.0, 24.0, 26.0, 17.0, 25.0, 14.0, 18.0, 14.0, 9.0, 19.0, 9.0, 13.0, 2.0, 4.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.39768993854522705, -0.38538652658462524, -0.37308311462402344, -0.36077970266342163, -0.3484762907028198, -0.336172878742218, -0.3238694667816162, -0.311566025018692, -0.2992626130580902, -0.2869592010974884, -0.2746557891368866, -0.2623523771762848, -0.250048965215683, -0.23774553835391998, -0.22544212639331818, -0.21313869953155518, -0.20083530247211456, -0.18853189051151276, -0.17622847855091095, -0.16392505168914795, -0.15162163972854614, -0.13931822776794434, -0.12701481580734253, -0.11471139639616013, -0.10240798443555832, -0.09010457247495651, -0.07780115306377411, -0.0654977411031723, -0.0531943254172802, -0.04089090973138809, -0.028587497770786285, -0.016284078359603882, -0.003980666399002075, 0.008322748355567455, 0.020626163110136986, 0.03292957693338394, 0.04523299261927605, 0.05753640830516815, 0.06983982026576996, 0.08214323967695236, 0.09444665163755417, 0.10675006359815598, 0.11905348300933838, 0.13135689496994019, 0.143660306930542, 0.1559637188911438, 0.1682671308517456, 0.1805705577135086, 0.1928739696741104, 0.20517738163471222, 0.21748079359531403, 0.22978422045707703, 0.24208763241767883, 0.25439104437828064, 0.26669445633888245, 0.27899786829948425, 0.29130128026008606, 0.30360469222068787, 0.3159081041812897, 0.3282115161418915, 0.3405149281024933, 0.3528183698654175, 0.3651217818260193, 0.3774251937866211, 0.3897286057472229]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 8.0, 5.0, 15.0, 22.0, 32.0, 65.0, 93.0, 174.0, 294.0, 560.0, 984.0, 1824.0, 3371.0, 6430.0, 12408.0, 23788.0, 47052.0, 99021.0, 236291.0, 614397.0, 1224278.0, 1075287.0, 487142.0, 195678.0, 83788.0, 39640.0, 20012.0, 10292.0, 5323.0, 2788.0, 1460.0, 765.0, 443.0, 261.0, 127.0, 73.0, 36.0, 22.0, 15.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.080078125, -0.07796382904052734, -0.07584953308105469, -0.07373523712158203, -0.07162094116210938, -0.06950664520263672, -0.06739234924316406, -0.0652780532836914, -0.06316375732421875, -0.061049461364746094, -0.05893516540527344, -0.05682086944580078, -0.054706573486328125, -0.05259227752685547, -0.05047798156738281, -0.048363685607910156, -0.0462493896484375, -0.044135093688964844, -0.04202079772949219, -0.03990650177001953, -0.037792205810546875, -0.03567790985107422, -0.03356361389160156, -0.031449317932128906, -0.02933502197265625, -0.027220726013183594, -0.025106430053710938, -0.02299213409423828, -0.020877838134765625, -0.01876354217529297, -0.016649246215820312, -0.014534950256347656, -0.012420654296875, -0.010306358337402344, -0.008192062377929688, -0.006077766418457031, -0.003963470458984375, -0.0018491744995117188, 0.0002651214599609375, 0.0023794174194335938, 0.00449371337890625, 0.006608009338378906, 0.008722305297851562, 0.010836601257324219, 0.012950897216796875, 0.015065193176269531, 0.017179489135742188, 0.019293785095214844, 0.0214080810546875, 0.023522377014160156, 0.025636672973632812, 0.02775096893310547, 0.029865264892578125, 0.03197956085205078, 0.03409385681152344, 0.036208152770996094, 0.03832244873046875, 0.040436744689941406, 0.04255104064941406, 0.04466533660888672, 0.046779632568359375, 0.04889392852783203, 0.05100822448730469, 0.053122520446777344, 0.05523681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 9.0, 4.0, 8.0, 12.0, 18.0, 6.0, 21.0, 21.0, 25.0, 21.0, 26.0, 32.0, 30.0, 32.0, 37.0, 41.0, 42.0, 40.0, 61.0, 50.0, 43.0, 50.0, 40.0, 39.0, 36.0, 34.0, 38.0, 24.0, 20.0, 21.0, 22.0, 16.0, 18.0, 16.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06402587890625, -0.06201171875, -0.05999755859375, -0.0579833984375, -0.05596923828125, -0.053955078125, -0.05194091796875, -0.0499267578125, -0.04791259765625, -0.0458984375, -0.04388427734375, -0.0418701171875, -0.03985595703125, -0.037841796875, -0.03582763671875, -0.0338134765625, -0.03179931640625, -0.02978515625, -0.02777099609375, -0.0257568359375, -0.02374267578125, -0.021728515625, -0.01971435546875, -0.0177001953125, -0.01568603515625, -0.013671875, -0.01165771484375, -0.0096435546875, -0.00762939453125, -0.005615234375, -0.00360107421875, -0.0015869140625, 0.00042724609375, 0.00244140625, 0.00445556640625, 0.0064697265625, 0.00848388671875, 0.010498046875, 0.01251220703125, 0.0145263671875, 0.01654052734375, 0.0185546875, 0.02056884765625, 0.0225830078125, 0.02459716796875, 0.026611328125, 0.02862548828125, 0.0306396484375, 0.03265380859375, 0.03466796875, 0.03668212890625, 0.0386962890625, 0.04071044921875, 0.042724609375, 0.04473876953125, 0.0467529296875, 0.04876708984375, 0.05078125, 0.05279541015625, 0.0548095703125, 0.05682373046875, 0.058837890625, 0.06085205078125, 0.0628662109375, 0.06488037109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 4.0, 16.0, 17.0, 22.0, 26.0, 44.0, 66.0, 106.0, 150.0, 285.0, 452.0, 896.0, 1895.0, 4609.0, 12672.0, 35699.0, 106722.0, 360781.0, 1574127.0, 1570973.0, 360427.0, 106471.0, 35830.0, 13016.0, 4843.0, 1892.0, 935.0, 473.0, 313.0, 183.0, 118.0, 77.0, 46.0, 29.0, 19.0, 13.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1297607421875, -0.1259441375732422, -0.12212753295898438, -0.11831092834472656, -0.11449432373046875, -0.11067771911621094, -0.10686111450195312, -0.10304450988769531, -0.0992279052734375, -0.09541130065917969, -0.09159469604492188, -0.08777809143066406, -0.08396148681640625, -0.08014488220214844, -0.07632827758789062, -0.07251167297363281, -0.068695068359375, -0.06487846374511719, -0.061061859130859375, -0.05724525451660156, -0.05342864990234375, -0.04961204528808594, -0.045795440673828125, -0.04197883605957031, -0.0381622314453125, -0.03434562683105469, -0.030529022216796875, -0.026712417602539062, -0.02289581298828125, -0.019079208374023438, -0.015262603759765625, -0.011445999145507812, -0.00762939453125, -0.0038127899169921875, 3.814697265625e-06, 0.0038204193115234375, 0.00763702392578125, 0.011453628540039062, 0.015270233154296875, 0.019086837768554688, 0.0229034423828125, 0.026720046997070312, 0.030536651611328125, 0.03435325622558594, 0.03816986083984375, 0.04198646545410156, 0.045803070068359375, 0.04961967468261719, 0.053436279296875, 0.05725288391113281, 0.061069488525390625, 0.06488609313964844, 0.06870269775390625, 0.07251930236816406, 0.07633590698242188, 0.08015251159667969, 0.0839691162109375, 0.08778572082519531, 0.09160232543945312, 0.09541893005371094, 0.09923553466796875, 0.10305213928222656, 0.10686874389648438, 0.11068534851074219, 0.114501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 8.0, 14.0, 11.0, 17.0, 29.0, 31.0, 41.0, 64.0, 62.0, 93.0, 105.0, 145.0, 210.0, 276.0, 375.0, 411.0, 452.0, 361.0, 286.0, 239.0, 208.0, 124.0, 89.0, 77.0, 63.0, 52.0, 47.0, 37.0, 29.0, 18.0, 14.0, 18.0, 13.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09564208984375, -0.09200382232666016, -0.08836555480957031, -0.08472728729248047, -0.08108901977539062, -0.07745075225830078, -0.07381248474121094, -0.0701742172241211, -0.06653594970703125, -0.0628976821899414, -0.05925941467285156, -0.05562114715576172, -0.051982879638671875, -0.04834461212158203, -0.04470634460449219, -0.041068077087402344, -0.0374298095703125, -0.033791542053222656, -0.030153274536132812, -0.02651500701904297, -0.022876739501953125, -0.01923847198486328, -0.015600204467773438, -0.011961936950683594, -0.00832366943359375, -0.004685401916503906, -0.0010471343994140625, 0.0025911331176757812, 0.006229400634765625, 0.009867668151855469, 0.013505935668945312, 0.017144203186035156, 0.020782470703125, 0.024420738220214844, 0.028059005737304688, 0.03169727325439453, 0.035335540771484375, 0.03897380828857422, 0.04261207580566406, 0.046250343322753906, 0.04988861083984375, 0.053526878356933594, 0.05716514587402344, 0.06080341339111328, 0.06444168090820312, 0.06807994842529297, 0.07171821594238281, 0.07535648345947266, 0.0789947509765625, 0.08263301849365234, 0.08627128601074219, 0.08990955352783203, 0.09354782104492188, 0.09718608856201172, 0.10082435607910156, 0.1044626235961914, 0.10810089111328125, 0.1117391586303711, 0.11537742614746094, 0.11901569366455078, 0.12265396118164062, 0.12629222869873047, 0.1299304962158203, 0.13356876373291016, 0.13720703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 9.0, 14.0, 44.0, 71.0, 142.0, 187.0, 197.0, 165.0, 82.0, 54.0, 19.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8802762031555176, -1.837556004524231, -1.7948358058929443, -1.7521157264709473, -1.7093955278396606, -1.666675329208374, -1.623955249786377, -1.5812350511550903, -1.5385148525238037, -1.495794653892517, -1.4530744552612305, -1.4103543758392334, -1.3676341772079468, -1.3249139785766602, -1.282193899154663, -1.2394737005233765, -1.1967535018920898, -1.1540333032608032, -1.1113131046295166, -1.0685930252075195, -1.025872826576233, -0.9831526279449463, -0.9404324889183044, -0.8977123498916626, -0.854992151260376, -0.8122719526290894, -0.7695518136024475, -0.7268316745758057, -0.684111475944519, -0.6413912773132324, -0.5986711382865906, -0.5559509992599487, -0.5132307410240173, -0.4705105721950531, -0.42779040336608887, -0.38507023453712463, -0.3423500657081604, -0.29962989687919617, -0.25690972805023193, -0.2141895592212677, -0.17146939039230347, -0.12874922156333923, -0.086029052734375, -0.04330888390541077, -0.0005887150764465332, 0.0421314537525177, 0.08485162258148193, 0.12757179141044617, 0.1702919602394104, 0.21301212906837463, 0.25573229789733887, 0.2984524667263031, 0.34117263555526733, 0.38389280438423157, 0.4266129732131958, 0.46933314204216003, 0.5120533108711243, 0.5547734498977661, 0.5974936485290527, 0.6402138471603394, 0.6829339861869812, 0.725654125213623, 0.7683743238449097, 0.8110945224761963, 0.8538146615028381]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 9.0, 3.0, 12.0, 8.0, 16.0, 9.0, 17.0, 16.0, 11.0, 22.0, 18.0, 28.0, 29.0, 35.0, 30.0, 36.0, 34.0, 36.0, 39.0, 30.0, 41.0, 44.0, 33.0, 43.0, 40.0, 40.0, 37.0, 29.0, 31.0, 24.0, 28.0, 24.0, 23.0, 17.0, 18.0, 21.0, 11.0, 11.0, 6.0, 10.0, 5.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3717927932739258, -0.359464555978775, -0.3471362888813019, -0.3348080515861511, -0.322479784488678, -0.3101515471935272, -0.29782330989837646, -0.2854950428009033, -0.27316680550575256, -0.2608385682106018, -0.24851030111312866, -0.2361820638179779, -0.22385381162166595, -0.211525559425354, -0.19919732213020325, -0.1868690699338913, -0.17454081773757935, -0.1622125655412674, -0.14988431334495544, -0.1375560760498047, -0.12522782385349274, -0.11289957165718079, -0.10057132691144943, -0.08824308216571808, -0.07591482996940613, -0.06358657777309418, -0.051258333027362823, -0.03893008455634117, -0.02660183608531952, -0.014273587614297867, -0.0019453391432762146, 0.01038290560245514, 0.02271115779876709, 0.03503940626978874, 0.047367654740810394, 0.059695903211832047, 0.0720241516828537, 0.08435240387916565, 0.096680648624897, 0.10900889337062836, 0.12133714556694031, 0.13366539776325226, 0.1459936499595642, 0.15832188725471497, 0.17065013945102692, 0.18297839164733887, 0.19530662894248962, 0.20763488113880157, 0.21996313333511353, 0.23229138553142548, 0.24461963772773743, 0.2569478750228882, 0.26927614212036133, 0.2816043794155121, 0.29393261671066284, 0.306260883808136, 0.31858912110328674, 0.3309173583984375, 0.34324562549591064, 0.3555738627910614, 0.36790210008621216, 0.3802303671836853, 0.39255860447883606, 0.4048868417739868, 0.41721510887145996]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 17.0, 18.0, 38.0, 50.0, 94.0, 136.0, 253.0, 435.0, 686.0, 1268.0, 2372.0, 4338.0, 7748.0, 13839.0, 23824.0, 44284.0, 96363.0, 230495.0, 311308.0, 164630.0, 68521.0, 33980.0, 18844.0, 10986.0, 6158.0, 3393.0, 1929.0, 1063.0, 553.0, 351.0, 215.0, 117.0, 78.0, 36.0, 42.0, 25.0, 13.0, 12.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09552001953125, -0.09236717224121094, -0.08921432495117188, -0.08606147766113281, -0.08290863037109375, -0.07975578308105469, -0.07660293579101562, -0.07345008850097656, -0.0702972412109375, -0.06714439392089844, -0.06399154663085938, -0.06083869934082031, -0.05768585205078125, -0.05453300476074219, -0.051380157470703125, -0.04822731018066406, -0.045074462890625, -0.04192161560058594, -0.038768768310546875, -0.03561592102050781, -0.03246307373046875, -0.029310226440429688, -0.026157379150390625, -0.023004531860351562, -0.0198516845703125, -0.016698837280273438, -0.013545989990234375, -0.010393142700195312, -0.00724029541015625, -0.0040874481201171875, -0.000934600830078125, 0.0022182464599609375, 0.00537109375, 0.008523941040039062, 0.011676788330078125, 0.014829635620117188, 0.01798248291015625, 0.021135330200195312, 0.024288177490234375, 0.027441024780273438, 0.0305938720703125, 0.03374671936035156, 0.036899566650390625, 0.04005241394042969, 0.04320526123046875, 0.04635810852050781, 0.049510955810546875, 0.05266380310058594, 0.055816650390625, 0.05896949768066406, 0.062122344970703125, 0.06527519226074219, 0.06842803955078125, 0.07158088684082031, 0.07473373413085938, 0.07788658142089844, 0.0810394287109375, 0.08419227600097656, 0.08734512329101562, 0.09049797058105469, 0.09365081787109375, 0.09680366516113281, 0.09995651245117188, 0.10310935974121094, 0.10626220703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 9.0, 11.0, 11.0, 15.0, 19.0, 15.0, 20.0, 15.0, 21.0, 30.0, 34.0, 22.0, 29.0, 35.0, 24.0, 42.0, 37.0, 41.0, 31.0, 35.0, 35.0, 34.0, 27.0, 31.0, 39.0, 27.0, 34.0, 23.0, 40.0, 29.0, 23.0, 20.0, 19.0, 20.0, 12.0, 12.0, 15.0, 14.0, 7.0, 8.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0562744140625, -0.05449390411376953, -0.05271339416503906, -0.050932884216308594, -0.049152374267578125, -0.047371864318847656, -0.04559135437011719, -0.04381084442138672, -0.04203033447265625, -0.04024982452392578, -0.03846931457519531, -0.036688804626464844, -0.034908294677734375, -0.033127784729003906, -0.03134727478027344, -0.02956676483154297, -0.0277862548828125, -0.02600574493408203, -0.024225234985351562, -0.022444725036621094, -0.020664215087890625, -0.018883705139160156, -0.017103195190429688, -0.015322685241699219, -0.01354217529296875, -0.011761665344238281, -0.009981155395507812, -0.008200645446777344, -0.006420135498046875, -0.004639625549316406, -0.0028591156005859375, -0.0010786056518554688, 0.000701904296875, 0.0024824142456054688, 0.0042629241943359375, 0.006043434143066406, 0.007823944091796875, 0.009604454040527344, 0.011384963989257812, 0.013165473937988281, 0.01494598388671875, 0.01672649383544922, 0.018507003784179688, 0.020287513732910156, 0.022068023681640625, 0.023848533630371094, 0.025629043579101562, 0.02740955352783203, 0.0291900634765625, 0.03097057342529297, 0.03275108337402344, 0.034531593322753906, 0.036312103271484375, 0.038092613220214844, 0.03987312316894531, 0.04165363311767578, 0.04343414306640625, 0.04521465301513672, 0.04699516296386719, 0.048775672912597656, 0.050556182861328125, 0.052336692810058594, 0.05411720275878906, 0.05589771270751953, 0.05767822265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 8.0, 6.0, 8.0, 19.0, 24.0, 37.0, 36.0, 55.0, 90.0, 112.0, 165.0, 282.0, 463.0, 736.0, 1518.0, 3513.0, 8957.0, 23760.0, 66787.0, 238742.0, 471313.0, 154519.0, 47705.0, 17349.0, 6609.0, 2732.0, 1226.0, 629.0, 371.0, 230.0, 176.0, 116.0, 77.0, 48.0, 32.0, 26.0, 22.0, 18.0, 7.0, 5.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18408203125, -0.1783905029296875, -0.172698974609375, -0.1670074462890625, -0.16131591796875, -0.1556243896484375, -0.149932861328125, -0.1442413330078125, -0.1385498046875, -0.1328582763671875, -0.127166748046875, -0.1214752197265625, -0.11578369140625, -0.1100921630859375, -0.104400634765625, -0.0987091064453125, -0.093017578125, -0.0873260498046875, -0.081634521484375, -0.0759429931640625, -0.07025146484375, -0.0645599365234375, -0.058868408203125, -0.0531768798828125, -0.0474853515625, -0.0417938232421875, -0.036102294921875, -0.0304107666015625, -0.02471923828125, -0.0190277099609375, -0.013336181640625, -0.0076446533203125, -0.001953125, 0.0037384033203125, 0.009429931640625, 0.0151214599609375, 0.02081298828125, 0.0265045166015625, 0.032196044921875, 0.0378875732421875, 0.0435791015625, 0.0492706298828125, 0.054962158203125, 0.0606536865234375, 0.06634521484375, 0.0720367431640625, 0.077728271484375, 0.0834197998046875, 0.089111328125, 0.0948028564453125, 0.100494384765625, 0.1061859130859375, 0.11187744140625, 0.1175689697265625, 0.123260498046875, 0.1289520263671875, 0.1346435546875, 0.1403350830078125, 0.146026611328125, 0.1517181396484375, 0.15740966796875, 0.1631011962890625, 0.168792724609375, 0.1744842529296875, 0.18017578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 6.0, 8.0, 11.0, 9.0, 18.0, 8.0, 16.0, 19.0, 25.0, 28.0, 38.0, 28.0, 31.0, 39.0, 47.0, 43.0, 43.0, 55.0, 35.0, 57.0, 40.0, 41.0, 38.0, 31.0, 31.0, 32.0, 22.0, 35.0, 25.0, 22.0, 11.0, 17.0, 13.0, 20.0, 5.0, 8.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2109375, -0.20474815368652344, -0.19855880737304688, -0.1923694610595703, -0.18618011474609375, -0.1799907684326172, -0.17380142211914062, -0.16761207580566406, -0.1614227294921875, -0.15523338317871094, -0.14904403686523438, -0.1428546905517578, -0.13666534423828125, -0.1304759979248047, -0.12428665161132812, -0.11809730529785156, -0.111907958984375, -0.10571861267089844, -0.09952926635742188, -0.09333992004394531, -0.08715057373046875, -0.08096122741699219, -0.07477188110351562, -0.06858253479003906, -0.0623931884765625, -0.05620384216308594, -0.050014495849609375, -0.04382514953613281, -0.03763580322265625, -0.03144645690917969, -0.025257110595703125, -0.019067764282226562, -0.01287841796875, -0.0066890716552734375, -0.000499725341796875, 0.0056896209716796875, 0.01187896728515625, 0.018068313598632812, 0.024257659912109375, 0.030447006225585938, 0.0366363525390625, 0.04282569885253906, 0.049015045166015625, 0.05520439147949219, 0.06139373779296875, 0.06758308410644531, 0.07377243041992188, 0.07996177673339844, 0.086151123046875, 0.09234046936035156, 0.09852981567382812, 0.10471916198730469, 0.11090850830078125, 0.11709785461425781, 0.12328720092773438, 0.12947654724121094, 0.1356658935546875, 0.14185523986816406, 0.14804458618164062, 0.1542339324951172, 0.16042327880859375, 0.1666126251220703, 0.17280197143554688, 0.17899131774902344, 0.1851806640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 17.0, 18.0, 39.0, 50.0, 68.0, 102.0, 201.0, 320.0, 608.0, 1150.0, 2204.0, 4389.0, 8763.0, 17548.0, 36897.0, 89578.0, 247247.0, 357992.0, 165990.0, 61607.0, 26822.0, 13114.0, 6589.0, 3425.0, 1702.0, 938.0, 473.0, 273.0, 152.0, 99.0, 54.0, 43.0, 27.0, 11.0, 11.0, 14.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.04784870147705078, -0.04631996154785156, -0.044791221618652344, -0.043262481689453125, -0.041733741760253906, -0.04020500183105469, -0.03867626190185547, -0.03714752197265625, -0.03561878204345703, -0.03409004211425781, -0.032561302185058594, -0.031032562255859375, -0.029503822326660156, -0.027975082397460938, -0.02644634246826172, -0.0249176025390625, -0.02338886260986328, -0.021860122680664062, -0.020331382751464844, -0.018802642822265625, -0.017273902893066406, -0.015745162963867188, -0.014216423034667969, -0.01268768310546875, -0.011158943176269531, -0.009630203247070312, -0.008101463317871094, -0.006572723388671875, -0.005043983459472656, -0.0035152435302734375, -0.0019865036010742188, -0.000457763671875, 0.0010709762573242188, 0.0025997161865234375, 0.004128456115722656, 0.005657196044921875, 0.007185935974121094, 0.008714675903320312, 0.010243415832519531, 0.01177215576171875, 0.013300895690917969, 0.014829635620117188, 0.016358375549316406, 0.017887115478515625, 0.019415855407714844, 0.020944595336914062, 0.02247333526611328, 0.0240020751953125, 0.02553081512451172, 0.027059555053710938, 0.028588294982910156, 0.030117034912109375, 0.031645774841308594, 0.03317451477050781, 0.03470325469970703, 0.03623199462890625, 0.03776073455810547, 0.03928947448730469, 0.040818214416503906, 0.042346954345703125, 0.043875694274902344, 0.04540443420410156, 0.04693317413330078, 0.0484619140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 4.0, 8.0, 11.0, 13.0, 13.0, 13.0, 11.0, 25.0, 24.0, 33.0, 49.0, 53.0, 67.0, 73.0, 94.0, 76.0, 81.0, 58.0, 60.0, 50.0, 36.0, 23.0, 19.0, 16.0, 8.0, 16.0, 14.0, 5.0, 14.0, 10.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.627206802368164e-05, -1.5676021575927734e-05, -1.5079975128173828e-05, -1.4483928680419922e-05, -1.3887882232666016e-05, -1.329183578491211e-05, -1.2695789337158203e-05, -1.2099742889404297e-05, -1.150369644165039e-05, -1.0907649993896484e-05, -1.0311603546142578e-05, -9.715557098388672e-06, -9.119510650634766e-06, -8.52346420288086e-06, -7.927417755126953e-06, -7.331371307373047e-06, -6.735324859619141e-06, -6.139278411865234e-06, -5.543231964111328e-06, -4.947185516357422e-06, -4.351139068603516e-06, -3.7550926208496094e-06, -3.159046173095703e-06, -2.562999725341797e-06, -1.9669532775878906e-06, -1.3709068298339844e-06, -7.748603820800781e-07, -1.7881393432617188e-07, 4.172325134277344e-07, 1.0132789611816406e-06, 1.6093254089355469e-06, 2.205371856689453e-06, 2.8014183044433594e-06, 3.3974647521972656e-06, 3.993511199951172e-06, 4.589557647705078e-06, 5.185604095458984e-06, 5.781650543212891e-06, 6.377696990966797e-06, 6.973743438720703e-06, 7.569789886474609e-06, 8.165836334228516e-06, 8.761882781982422e-06, 9.357929229736328e-06, 9.953975677490234e-06, 1.055002212524414e-05, 1.1146068572998047e-05, 1.1742115020751953e-05, 1.233816146850586e-05, 1.2934207916259766e-05, 1.3530254364013672e-05, 1.4126300811767578e-05, 1.4722347259521484e-05, 1.531839370727539e-05, 1.5914440155029297e-05, 1.6510486602783203e-05, 1.710653305053711e-05, 1.7702579498291016e-05, 1.8298625946044922e-05, 1.8894672393798828e-05, 1.9490718841552734e-05, 2.008676528930664e-05, 2.0682811737060547e-05, 2.1278858184814453e-05, 2.187490463256836e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 15.0, 11.0, 13.0, 27.0, 23.0, 49.0, 100.0, 194.0, 486.0, 966.0, 2924.0, 10916.0, 50079.0, 252132.0, 521887.0, 164309.0, 33173.0, 7625.0, 2110.0, 764.0, 364.0, 170.0, 85.0, 54.0, 34.0, 16.0, 15.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.0598602294921875, -0.057403564453125, -0.0549468994140625, -0.052490234375, -0.0500335693359375, -0.047576904296875, -0.0451202392578125, -0.04266357421875, -0.0402069091796875, -0.037750244140625, -0.0352935791015625, -0.0328369140625, -0.0303802490234375, -0.027923583984375, -0.0254669189453125, -0.02301025390625, -0.0205535888671875, -0.018096923828125, -0.0156402587890625, -0.01318359375, -0.0107269287109375, -0.008270263671875, -0.0058135986328125, -0.00335693359375, -0.0009002685546875, 0.001556396484375, 0.0040130615234375, 0.0064697265625, 0.0089263916015625, 0.011383056640625, 0.0138397216796875, 0.01629638671875, 0.0187530517578125, 0.021209716796875, 0.0236663818359375, 0.026123046875, 0.0285797119140625, 0.031036376953125, 0.0334930419921875, 0.03594970703125, 0.0384063720703125, 0.040863037109375, 0.0433197021484375, 0.0457763671875, 0.0482330322265625, 0.050689697265625, 0.0531463623046875, 0.05560302734375, 0.0580596923828125, 0.060516357421875, 0.0629730224609375, 0.0654296875, 0.0678863525390625, 0.070343017578125, 0.0727996826171875, 0.07525634765625, 0.0777130126953125, 0.080169677734375, 0.0826263427734375, 0.0850830078125, 0.0875396728515625, 0.089996337890625, 0.0924530029296875, 0.09490966796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 2.0, 7.0, 7.0, 12.0, 23.0, 23.0, 23.0, 25.0, 32.0, 33.0, 50.0, 37.0, 60.0, 51.0, 58.0, 58.0, 63.0, 57.0, 66.0, 46.0, 46.0, 42.0, 34.0, 22.0, 19.0, 14.0, 11.0, 11.0, 16.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.046722412109375, -0.04535865783691406, -0.043994903564453125, -0.04263114929199219, -0.04126739501953125, -0.03990364074707031, -0.038539886474609375, -0.03717613220214844, -0.0358123779296875, -0.03444862365722656, -0.033084869384765625, -0.03172111511230469, -0.03035736083984375, -0.028993606567382812, -0.027629852294921875, -0.026266098022460938, -0.02490234375, -0.023538589477539062, -0.022174835205078125, -0.020811080932617188, -0.01944732666015625, -0.018083572387695312, -0.016719818115234375, -0.015356063842773438, -0.0139923095703125, -0.012628555297851562, -0.011264801025390625, -0.009901046752929688, -0.00853729248046875, -0.0071735382080078125, -0.005809783935546875, -0.0044460296630859375, -0.003082275390625, -0.0017185211181640625, -0.000354766845703125, 0.0010089874267578125, 0.00237274169921875, 0.0037364959716796875, 0.005100250244140625, 0.0064640045166015625, 0.0078277587890625, 0.009191513061523438, 0.010555267333984375, 0.011919021606445312, 0.01328277587890625, 0.014646530151367188, 0.016010284423828125, 0.017374038696289062, 0.01873779296875, 0.020101547241210938, 0.021465301513671875, 0.022829055786132812, 0.02419281005859375, 0.025556564331054688, 0.026920318603515625, 0.028284072875976562, 0.0296478271484375, 0.031011581420898438, 0.032375335693359375, 0.03373908996582031, 0.03510284423828125, 0.03646659851074219, 0.037830352783203125, 0.03919410705566406, 0.040557861328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 28.0, 42.0, 80.0, 159.0, 208.0, 177.0, 135.0, 79.0, 48.0, 18.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.45541250705719, -1.4207514524459839, -1.3860903978347778, -1.3514293432235718, -1.3167684078216553, -1.2821073532104492, -1.2474462985992432, -1.212785243988037, -1.178124189376831, -1.143463134765625, -1.108802080154419, -1.074141025543213, -1.0394799709320068, -1.0048190355300903, -0.9701579809188843, -0.9354969263076782, -0.9008358716964722, -0.8661748170852661, -0.8315137624740601, -0.7968527674674988, -0.7621917128562927, -0.7275306582450867, -0.6928696632385254, -0.6582086086273193, -0.6235475540161133, -0.5888864994049072, -0.5542254447937012, -0.5195644497871399, -0.48490339517593384, -0.4502423405647278, -0.4155813157558441, -0.38092029094696045, -0.3462591767311096, -0.31159812211990356, -0.2769370973110199, -0.24227605760097504, -0.20761501789093018, -0.17295397818088531, -0.13829293847084045, -0.1036318987607956, -0.06897085905075073, -0.03430981934070587, 0.00035122036933898926, 0.03501226007938385, 0.06967329978942871, 0.10433433949947357, 0.13899537920951843, 0.1736564189195633, 0.20831745862960815, 0.24297849833965302, 0.2776395380496979, 0.31230056285858154, 0.3469616174697876, 0.38162267208099365, 0.4162836968898773, 0.450944721698761, 0.48560577630996704, 0.5202668309211731, 0.5549278259277344, 0.5895888805389404, 0.6242499351501465, 0.6589109897613525, 0.6935720443725586, 0.7282330393791199, 0.7628940939903259]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 12.0, 7.0, 9.0, 18.0, 16.0, 15.0, 21.0, 28.0, 22.0, 26.0, 33.0, 37.0, 43.0, 34.0, 38.0, 38.0, 32.0, 37.0, 47.0, 40.0, 46.0, 39.0, 31.0, 30.0, 37.0, 31.0, 32.0, 25.0, 22.0, 14.0, 15.0, 26.0, 16.0, 15.0, 15.0, 6.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0], "bins": [-0.516281008720398, -0.502227783203125, -0.48817455768585205, -0.4741213321685791, -0.46006810665130615, -0.4460148811340332, -0.43196165561676025, -0.4179084002971649, -0.40385517477989197, -0.389801949262619, -0.37574872374534607, -0.3616954982280731, -0.34764227271080017, -0.33358901739120483, -0.3195357918739319, -0.30548256635665894, -0.291429340839386, -0.27737611532211304, -0.2633228898048401, -0.24926966428756714, -0.235216423869133, -0.22116319835186005, -0.2071099728345871, -0.19305673241615295, -0.1790035367012024, -0.16495031118392944, -0.1508970856666565, -0.13684386014938354, -0.1227906197309494, -0.10873739421367645, -0.0946841686964035, -0.08063093572854996, -0.06657770276069641, -0.05252447351813316, -0.038471244275569916, -0.024418018758296967, -0.010364789515733719, 0.003688439726829529, 0.017741665244102478, 0.031794898211956024, 0.04584812372922897, 0.05990135297179222, 0.07395458221435547, 0.08800780773162842, 0.10206103324890137, 0.11611426621675491, 0.13016748428344727, 0.1442207247018814, 0.15827395021915436, 0.1723271757364273, 0.18638040125370026, 0.2004336416721344, 0.21448686718940735, 0.2285400927066803, 0.24259331822395325, 0.2566465437412262, 0.27069976925849915, 0.2847529947757721, 0.29880622029304504, 0.312859445810318, 0.32691267132759094, 0.3409659266471863, 0.35501915216445923, 0.3690723776817322, 0.3831256031990051]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 31.0, 51.0, 88.0, 162.0, 244.0, 500.0, 876.0, 1651.0, 3106.0, 5664.0, 10591.0, 19699.0, 38737.0, 79944.0, 182147.0, 447510.0, 968942.0, 1191834.0, 708654.0, 295909.0, 122571.0, 55991.0, 28014.0, 14610.0, 7643.0, 4181.0, 2208.0, 1182.0, 639.0, 367.0, 196.0, 115.0, 64.0, 41.0, 33.0, 19.0, 10.0, 3.0, 4.0, 2.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06622314453125, -0.06423234939575195, -0.062241554260253906, -0.06025075912475586, -0.05825996398925781, -0.056269168853759766, -0.05427837371826172, -0.05228757858276367, -0.050296783447265625, -0.04830598831176758, -0.04631519317626953, -0.044324398040771484, -0.04233360290527344, -0.04034280776977539, -0.038352012634277344, -0.0363612174987793, -0.03437042236328125, -0.0323796272277832, -0.030388832092285156, -0.02839803695678711, -0.026407241821289062, -0.024416446685791016, -0.02242565155029297, -0.020434856414794922, -0.018444061279296875, -0.016453266143798828, -0.014462471008300781, -0.012471675872802734, -0.010480880737304688, -0.00849008560180664, -0.006499290466308594, -0.004508495330810547, -0.0025177001953125, -0.0005269050598144531, 0.0014638900756835938, 0.0034546852111816406, 0.0054454803466796875, 0.007436275482177734, 0.009427070617675781, 0.011417865753173828, 0.013408660888671875, 0.015399456024169922, 0.01739025115966797, 0.019381046295166016, 0.021371841430664062, 0.02336263656616211, 0.025353431701660156, 0.027344226837158203, 0.02933502197265625, 0.0313258171081543, 0.033316612243652344, 0.03530740737915039, 0.03729820251464844, 0.039288997650146484, 0.04127979278564453, 0.04327058792114258, 0.045261383056640625, 0.04725217819213867, 0.04924297332763672, 0.051233768463134766, 0.05322456359863281, 0.05521535873413086, 0.057206153869628906, 0.05919694900512695, 0.061187744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 8.0, 17.0, 14.0, 16.0, 11.0, 22.0, 22.0, 23.0, 31.0, 29.0, 39.0, 34.0, 34.0, 31.0, 34.0, 37.0, 43.0, 53.0, 51.0, 42.0, 36.0, 37.0, 35.0, 38.0, 23.0, 36.0, 23.0, 18.0, 19.0, 16.0, 10.0, 13.0, 14.0, 15.0, 9.0, 10.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06463623046875, -0.06268692016601562, -0.06073760986328125, -0.058788299560546875, -0.0568389892578125, -0.054889678955078125, -0.05294036865234375, -0.050991058349609375, -0.049041748046875, -0.047092437744140625, -0.04514312744140625, -0.043193817138671875, -0.0412445068359375, -0.039295196533203125, -0.03734588623046875, -0.035396575927734375, -0.033447265625, -0.031497955322265625, -0.02954864501953125, -0.027599334716796875, -0.0256500244140625, -0.023700714111328125, -0.02175140380859375, -0.019802093505859375, -0.017852783203125, -0.015903472900390625, -0.01395416259765625, -0.012004852294921875, -0.0100555419921875, -0.008106231689453125, -0.00615692138671875, -0.004207611083984375, -0.00225830078125, -0.000308990478515625, 0.00164031982421875, 0.003589630126953125, 0.0055389404296875, 0.007488250732421875, 0.00943756103515625, 0.011386871337890625, 0.013336181640625, 0.015285491943359375, 0.01723480224609375, 0.019184112548828125, 0.0211334228515625, 0.023082733154296875, 0.02503204345703125, 0.026981353759765625, 0.0289306640625, 0.030879974365234375, 0.03282928466796875, 0.034778594970703125, 0.0367279052734375, 0.038677215576171875, 0.04062652587890625, 0.042575836181640625, 0.044525146484375, 0.046474456787109375, 0.04842376708984375, 0.050373077392578125, 0.0523223876953125, 0.054271697998046875, 0.05622100830078125, 0.058170318603515625, 0.06011962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 16.0, 22.0, 31.0, 31.0, 66.0, 89.0, 138.0, 222.0, 317.0, 495.0, 848.0, 1539.0, 2971.0, 6687.0, 15964.0, 42078.0, 117197.0, 373415.0, 1570194.0, 1519390.0, 359837.0, 113633.0, 40892.0, 15264.0, 6351.0, 2860.0, 1476.0, 809.0, 491.0, 295.0, 195.0, 143.0, 109.0, 61.0, 41.0, 27.0, 27.0, 17.0, 7.0, 9.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1109619140625, -0.10738086700439453, -0.10379981994628906, -0.1002187728881836, -0.09663772583007812, -0.09305667877197266, -0.08947563171386719, -0.08589458465576172, -0.08231353759765625, -0.07873249053955078, -0.07515144348144531, -0.07157039642333984, -0.06798934936523438, -0.0644083023071289, -0.06082725524902344, -0.05724620819091797, -0.0536651611328125, -0.05008411407470703, -0.04650306701660156, -0.042922019958496094, -0.039340972900390625, -0.035759925842285156, -0.03217887878417969, -0.02859783172607422, -0.02501678466796875, -0.02143573760986328, -0.017854690551757812, -0.014273643493652344, -0.010692596435546875, -0.007111549377441406, -0.0035305023193359375, 5.054473876953125e-05, 0.003631591796875, 0.007212638854980469, 0.010793685913085938, 0.014374732971191406, 0.017955780029296875, 0.021536827087402344, 0.025117874145507812, 0.02869892120361328, 0.03227996826171875, 0.03586101531982422, 0.03944206237792969, 0.043023109436035156, 0.046604156494140625, 0.050185203552246094, 0.05376625061035156, 0.05734729766845703, 0.0609283447265625, 0.06450939178466797, 0.06809043884277344, 0.0716714859008789, 0.07525253295898438, 0.07883358001708984, 0.08241462707519531, 0.08599567413330078, 0.08957672119140625, 0.09315776824951172, 0.09673881530761719, 0.10031986236572266, 0.10390090942382812, 0.1074819564819336, 0.11106300354003906, 0.11464405059814453, 0.11822509765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 6.0, 15.0, 13.0, 17.0, 30.0, 48.0, 47.0, 53.0, 105.0, 98.0, 158.0, 212.0, 277.0, 410.0, 523.0, 517.0, 387.0, 323.0, 225.0, 144.0, 92.0, 84.0, 72.0, 39.0, 41.0, 30.0, 24.0, 19.0, 14.0, 11.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1416015625, -0.13732337951660156, -0.13304519653320312, -0.1287670135498047, -0.12448883056640625, -0.12021064758300781, -0.11593246459960938, -0.11165428161621094, -0.1073760986328125, -0.10309791564941406, -0.09881973266601562, -0.09454154968261719, -0.09026336669921875, -0.08598518371582031, -0.08170700073242188, -0.07742881774902344, -0.073150634765625, -0.06887245178222656, -0.06459426879882812, -0.06031608581542969, -0.05603790283203125, -0.05175971984863281, -0.047481536865234375, -0.04320335388183594, -0.0389251708984375, -0.03464698791503906, -0.030368804931640625, -0.026090621948242188, -0.02181243896484375, -0.017534255981445312, -0.013256072998046875, -0.008977890014648438, -0.00469970703125, -0.0004215240478515625, 0.003856658935546875, 0.008134841918945312, 0.01241302490234375, 0.016691207885742188, 0.020969390869140625, 0.025247573852539062, 0.0295257568359375, 0.03380393981933594, 0.038082122802734375, 0.04236030578613281, 0.04663848876953125, 0.05091667175292969, 0.055194854736328125, 0.05947303771972656, 0.063751220703125, 0.06802940368652344, 0.07230758666992188, 0.07658576965332031, 0.08086395263671875, 0.08514213562011719, 0.08942031860351562, 0.09369850158691406, 0.0979766845703125, 0.10225486755371094, 0.10653305053710938, 0.11081123352050781, 0.11508941650390625, 0.11936759948730469, 0.12364578247070312, 0.12792396545410156, 0.1322021484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 75.0, 156.0, 297.0, 274.0, 111.0, 44.0, 14.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3617911338806152, -3.291457414627075, -3.221123695373535, -3.150789976119995, -3.080456256866455, -3.010122537612915, -2.939788818359375, -2.869455099105835, -2.799121379852295, -2.728787660598755, -2.658453941345215, -2.588120222091675, -2.5177865028381348, -2.4474527835845947, -2.3771190643310547, -2.3067853450775146, -2.2364516258239746, -2.1661179065704346, -2.0957841873168945, -2.0254504680633545, -1.9551167488098145, -1.8847830295562744, -1.8144493103027344, -1.7441155910491943, -1.6737818717956543, -1.6034481525421143, -1.5331144332885742, -1.4627807140350342, -1.3924469947814941, -1.322113275527954, -1.251779556274414, -1.181445837020874, -1.1111118793487549, -1.0407781600952148, -0.9704444408416748, -0.9001107215881348, -0.8297770023345947, -0.7594432830810547, -0.6891095638275146, -0.6187758445739746, -0.5484421253204346, -0.47810840606689453, -0.4077746868133545, -0.33744096755981445, -0.2671072483062744, -0.19677352905273438, -0.12643980979919434, -0.0561060905456543, 0.014227628707885742, 0.08456134796142578, 0.15489506721496582, 0.22522878646850586, 0.2955625057220459, 0.36589622497558594, 0.436229944229126, 0.506563663482666, 0.576897382736206, 0.6472311019897461, 0.7175648212432861, 0.7878985404968262, 0.8582322597503662, 0.9285659790039062, 0.9988996982574463, 1.0692334175109863, 1.1395671367645264]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 8.0, 14.0, 15.0, 10.0, 24.0, 29.0, 30.0, 21.0, 34.0, 29.0, 44.0, 43.0, 49.0, 45.0, 46.0, 44.0, 44.0, 44.0, 46.0, 39.0, 45.0, 28.0, 33.0, 33.0, 26.0, 25.0, 16.0, 23.0, 18.0, 16.0, 14.0, 14.0, 7.0, 4.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43745726346969604, -0.4223458170890808, -0.40723440051078796, -0.3921229839324951, -0.3770115375518799, -0.36190009117126465, -0.3467886745929718, -0.33167725801467896, -0.3165658116340637, -0.3014543652534485, -0.28634294867515564, -0.2712315320968628, -0.25612008571624756, -0.24100865423679352, -0.22589722275733948, -0.21078579127788544, -0.1956743597984314, -0.18056292831897736, -0.16545149683952332, -0.15034006536006927, -0.13522863388061523, -0.1201172024011612, -0.10500577092170715, -0.08989433944225311, -0.07478290796279907, -0.05967147648334503, -0.04456004500389099, -0.02944861352443695, -0.01433718204498291, 0.0007742494344711304, 0.01588568091392517, 0.03099711239337921, 0.04610854387283325, 0.06121997535228729, 0.07633140683174133, 0.09144283831119537, 0.10655426979064941, 0.12166570127010345, 0.1367771327495575, 0.15188856422901154, 0.16699999570846558, 0.18211142718791962, 0.19722285866737366, 0.2123342901468277, 0.22744572162628174, 0.24255715310573578, 0.2576685845851898, 0.27278000116348267, 0.2878914475440979, 0.30300289392471313, 0.318114310503006, 0.33322572708129883, 0.34833717346191406, 0.3634486198425293, 0.37856003642082214, 0.393671452999115, 0.4087828993797302, 0.42389434576034546, 0.4390057623386383, 0.45411717891693115, 0.4692286252975464, 0.4843400716781616, 0.49945148825645447, 0.5145629048347473, 0.5296743512153625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 15.0, 22.0, 38.0, 72.0, 152.0, 303.0, 761.0, 1803.0, 4963.0, 13239.0, 40368.0, 120689.0, 280762.0, 325106.0, 170883.0, 58862.0, 19273.0, 6765.0, 2579.0, 1065.0, 426.0, 209.0, 96.0, 40.0, 25.0, 11.0, 9.0, 2.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09881591796875, -0.095428466796875, -0.092041015625, -0.088653564453125, -0.08526611328125, -0.081878662109375, -0.0784912109375, -0.075103759765625, -0.07171630859375, -0.068328857421875, -0.06494140625, -0.061553955078125, -0.05816650390625, -0.054779052734375, -0.0513916015625, -0.048004150390625, -0.04461669921875, -0.041229248046875, -0.037841796875, -0.034454345703125, -0.03106689453125, -0.027679443359375, -0.0242919921875, -0.020904541015625, -0.01751708984375, -0.014129638671875, -0.0107421875, -0.007354736328125, -0.00396728515625, -0.000579833984375, 0.0028076171875, 0.006195068359375, 0.00958251953125, 0.012969970703125, 0.016357421875, 0.019744873046875, 0.02313232421875, 0.026519775390625, 0.0299072265625, 0.033294677734375, 0.03668212890625, 0.040069580078125, 0.04345703125, 0.046844482421875, 0.05023193359375, 0.053619384765625, 0.0570068359375, 0.060394287109375, 0.06378173828125, 0.067169189453125, 0.070556640625, 0.073944091796875, 0.07733154296875, 0.080718994140625, 0.0841064453125, 0.087493896484375, 0.09088134765625, 0.094268798828125, 0.09765625, 0.101043701171875, 0.10443115234375, 0.107818603515625, 0.1112060546875, 0.114593505859375, 0.11798095703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 10.0, 19.0, 19.0, 14.0, 18.0, 20.0, 29.0, 24.0, 30.0, 23.0, 29.0, 38.0, 36.0, 29.0, 51.0, 37.0, 41.0, 42.0, 39.0, 31.0, 40.0, 30.0, 33.0, 31.0, 37.0, 27.0, 23.0, 34.0, 21.0, 12.0, 21.0, 16.0, 14.0, 11.0, 11.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061370849609375, -0.05946063995361328, -0.05755043029785156, -0.055640220642089844, -0.053730010986328125, -0.051819801330566406, -0.04990959167480469, -0.04799938201904297, -0.04608917236328125, -0.04417896270751953, -0.04226875305175781, -0.040358543395996094, -0.038448333740234375, -0.036538124084472656, -0.03462791442871094, -0.03271770477294922, -0.0308074951171875, -0.02889728546142578, -0.026987075805664062, -0.025076866149902344, -0.023166656494140625, -0.021256446838378906, -0.019346237182617188, -0.01743602752685547, -0.01552581787109375, -0.013615608215332031, -0.011705398559570312, -0.009795188903808594, -0.007884979248046875, -0.005974769592285156, -0.0040645599365234375, -0.0021543502807617188, -0.000244140625, 0.0016660690307617188, 0.0035762786865234375, 0.005486488342285156, 0.007396697998046875, 0.009306907653808594, 0.011217117309570312, 0.013127326965332031, 0.01503753662109375, 0.01694774627685547, 0.018857955932617188, 0.020768165588378906, 0.022678375244140625, 0.024588584899902344, 0.026498794555664062, 0.02840900421142578, 0.0303192138671875, 0.03222942352294922, 0.03413963317871094, 0.036049842834472656, 0.037960052490234375, 0.039870262145996094, 0.04178047180175781, 0.04369068145751953, 0.04560089111328125, 0.04751110076904297, 0.04942131042480469, 0.051331520080566406, 0.053241729736328125, 0.055151939392089844, 0.05706214904785156, 0.05897235870361328, 0.060882568359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 4.0, 6.0, 12.0, 7.0, 16.0, 28.0, 39.0, 59.0, 100.0, 180.0, 310.0, 620.0, 1474.0, 3523.0, 9792.0, 32014.0, 116894.0, 350410.0, 359764.0, 123045.0, 33333.0, 10305.0, 3745.0, 1476.0, 628.0, 304.0, 181.0, 99.0, 64.0, 40.0, 15.0, 12.0, 11.0, 13.0, 11.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13134765625, -0.12697219848632812, -0.12259674072265625, -0.11822128295898438, -0.1138458251953125, -0.10947036743164062, -0.10509490966796875, -0.10071945190429688, -0.096343994140625, -0.09196853637695312, -0.08759307861328125, -0.08321762084960938, -0.0788421630859375, -0.07446670532226562, -0.07009124755859375, -0.06571578979492188, -0.06134033203125, -0.056964874267578125, -0.05258941650390625, -0.048213958740234375, -0.0438385009765625, -0.039463043212890625, -0.03508758544921875, -0.030712127685546875, -0.026336669921875, -0.021961212158203125, -0.01758575439453125, -0.013210296630859375, -0.0088348388671875, -0.004459381103515625, -8.392333984375e-05, 0.004291534423828125, 0.0086669921875, 0.013042449951171875, 0.01741790771484375, 0.021793365478515625, 0.0261688232421875, 0.030544281005859375, 0.03491973876953125, 0.039295196533203125, 0.043670654296875, 0.048046112060546875, 0.05242156982421875, 0.056797027587890625, 0.0611724853515625, 0.06554794311523438, 0.06992340087890625, 0.07429885864257812, 0.07867431640625, 0.08304977416992188, 0.08742523193359375, 0.09180068969726562, 0.0961761474609375, 0.10055160522460938, 0.10492706298828125, 0.10930252075195312, 0.113677978515625, 0.11805343627929688, 0.12242889404296875, 0.12680435180664062, 0.1311798095703125, 0.13555526733398438, 0.13993072509765625, 0.14430618286132812, 0.148681640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 12.0, 16.0, 12.0, 9.0, 16.0, 20.0, 12.0, 25.0, 33.0, 32.0, 33.0, 30.0, 47.0, 34.0, 40.0, 47.0, 38.0, 55.0, 59.0, 49.0, 49.0, 44.0, 33.0, 37.0, 28.0, 28.0, 33.0, 23.0, 15.0, 15.0, 14.0, 10.0, 15.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2204437255859375, -0.213714599609375, -0.2069854736328125, -0.20025634765625, -0.1935272216796875, -0.186798095703125, -0.1800689697265625, -0.17333984375, -0.1666107177734375, -0.159881591796875, -0.1531524658203125, -0.14642333984375, -0.1396942138671875, -0.132965087890625, -0.1262359619140625, -0.1195068359375, -0.1127777099609375, -0.106048583984375, -0.0993194580078125, -0.09259033203125, -0.0858612060546875, -0.079132080078125, -0.0724029541015625, -0.065673828125, -0.0589447021484375, -0.052215576171875, -0.0454864501953125, -0.03875732421875, -0.0320281982421875, -0.025299072265625, -0.0185699462890625, -0.0118408203125, -0.0051116943359375, 0.001617431640625, 0.0083465576171875, 0.01507568359375, 0.0218048095703125, 0.028533935546875, 0.0352630615234375, 0.0419921875, 0.0487213134765625, 0.055450439453125, 0.0621795654296875, 0.06890869140625, 0.0756378173828125, 0.082366943359375, 0.0890960693359375, 0.0958251953125, 0.1025543212890625, 0.109283447265625, 0.1160125732421875, 0.12274169921875, 0.1294708251953125, 0.136199951171875, 0.1429290771484375, 0.149658203125, 0.1563873291015625, 0.163116455078125, 0.1698455810546875, 0.17657470703125, 0.1833038330078125, 0.190032958984375, 0.1967620849609375, 0.2034912109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 13.0, 8.0, 21.0, 28.0, 58.0, 85.0, 122.0, 229.0, 452.0, 750.0, 1346.0, 2403.0, 4616.0, 9050.0, 19051.0, 40490.0, 90230.0, 184651.0, 266941.0, 217008.0, 113153.0, 50991.0, 23342.0, 11177.0, 5600.0, 2967.0, 1702.0, 872.0, 495.0, 286.0, 161.0, 92.0, 58.0, 40.0, 13.0, 17.0, 7.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0416259765625, -0.04045820236206055, -0.039290428161621094, -0.03812265396118164, -0.03695487976074219, -0.035787105560302734, -0.03461933135986328, -0.03345155715942383, -0.032283782958984375, -0.031116008758544922, -0.02994823455810547, -0.028780460357666016, -0.027612686157226562, -0.02644491195678711, -0.025277137756347656, -0.024109363555908203, -0.02294158935546875, -0.021773815155029297, -0.020606040954589844, -0.01943826675415039, -0.018270492553710938, -0.017102718353271484, -0.01593494415283203, -0.014767169952392578, -0.013599395751953125, -0.012431621551513672, -0.011263847351074219, -0.010096073150634766, -0.008928298950195312, -0.007760524749755859, -0.006592750549316406, -0.005424976348876953, -0.0042572021484375, -0.003089427947998047, -0.0019216537475585938, -0.0007538795471191406, 0.0004138946533203125, 0.0015816688537597656, 0.0027494430541992188, 0.003917217254638672, 0.005084991455078125, 0.006252765655517578, 0.007420539855957031, 0.008588314056396484, 0.009756088256835938, 0.01092386245727539, 0.012091636657714844, 0.013259410858154297, 0.01442718505859375, 0.015594959259033203, 0.016762733459472656, 0.01793050765991211, 0.019098281860351562, 0.020266056060791016, 0.02143383026123047, 0.022601604461669922, 0.023769378662109375, 0.024937152862548828, 0.02610492706298828, 0.027272701263427734, 0.028440475463867188, 0.02960824966430664, 0.030776023864746094, 0.03194379806518555, 0.033111572265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 14.0, 12.0, 18.0, 20.0, 19.0, 45.0, 44.0, 47.0, 48.0, 49.0, 62.0, 74.0, 69.0, 69.0, 57.0, 51.0, 42.0, 31.0, 52.0, 24.0, 24.0, 22.0, 19.0, 15.0, 6.0, 7.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.2993812561035156e-05, -1.2588687241077423e-05, -1.218356192111969e-05, -1.1778436601161957e-05, -1.1373311281204224e-05, -1.096818596124649e-05, -1.0563060641288757e-05, -1.0157935321331024e-05, -9.752810001373291e-06, -9.347684681415558e-06, -8.942559361457825e-06, -8.537434041500092e-06, -8.132308721542358e-06, -7.727183401584625e-06, -7.322058081626892e-06, -6.916932761669159e-06, -6.511807441711426e-06, -6.106682121753693e-06, -5.7015568017959595e-06, -5.296431481838226e-06, -4.891306161880493e-06, -4.48618084192276e-06, -4.081055521965027e-06, -3.6759302020072937e-06, -3.2708048820495605e-06, -2.8656795620918274e-06, -2.4605542421340942e-06, -2.055428922176361e-06, -1.650303602218628e-06, -1.2451782822608948e-06, -8.400529623031616e-07, -4.3492764234542847e-07, -2.9802322387695312e-08, 3.7532299757003784e-07, 7.80448317527771e-07, 1.1855736374855042e-06, 1.5906989574432373e-06, 1.9958242774009705e-06, 2.4009495973587036e-06, 2.8060749173164368e-06, 3.21120023727417e-06, 3.616325557231903e-06, 4.021450877189636e-06, 4.426576197147369e-06, 4.8317015171051025e-06, 5.236826837062836e-06, 5.641952157020569e-06, 6.047077476978302e-06, 6.452202796936035e-06, 6.857328116893768e-06, 7.2624534368515015e-06, 7.667578756809235e-06, 8.072704076766968e-06, 8.477829396724701e-06, 8.882954716682434e-06, 9.288080036640167e-06, 9.6932053565979e-06, 1.0098330676555634e-05, 1.0503455996513367e-05, 1.09085813164711e-05, 1.1313706636428833e-05, 1.1718831956386566e-05, 1.21239572763443e-05, 1.2529082596302032e-05, 1.2934207916259766e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 12.0, 12.0, 11.0, 19.0, 27.0, 39.0, 65.0, 100.0, 123.0, 232.0, 437.0, 823.0, 1611.0, 3301.0, 7370.0, 16391.0, 35982.0, 77572.0, 155302.0, 243021.0, 234690.0, 141499.0, 70231.0, 32109.0, 14551.0, 6612.0, 3140.0, 1464.0, 785.0, 379.0, 222.0, 133.0, 90.0, 57.0, 43.0, 29.0, 21.0, 18.0, 11.0, 3.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.042388916015625, -0.04120922088623047, -0.04002952575683594, -0.038849830627441406, -0.037670135498046875, -0.036490440368652344, -0.03531074523925781, -0.03413105010986328, -0.03295135498046875, -0.03177165985107422, -0.030591964721679688, -0.029412269592285156, -0.028232574462890625, -0.027052879333496094, -0.025873184204101562, -0.02469348907470703, -0.0235137939453125, -0.02233409881591797, -0.021154403686523438, -0.019974708557128906, -0.018795013427734375, -0.017615318298339844, -0.016435623168945312, -0.015255928039550781, -0.01407623291015625, -0.012896537780761719, -0.011716842651367188, -0.010537147521972656, -0.009357452392578125, -0.008177757263183594, -0.0069980621337890625, -0.005818367004394531, -0.004638671875, -0.0034589767456054688, -0.0022792816162109375, -0.0010995864868164062, 8.0108642578125e-05, 0.0012598037719726562, 0.0024394989013671875, 0.0036191940307617188, 0.00479888916015625, 0.005978584289550781, 0.0071582794189453125, 0.008337974548339844, 0.009517669677734375, 0.010697364807128906, 0.011877059936523438, 0.013056755065917969, 0.0142364501953125, 0.015416145324707031, 0.016595840454101562, 0.017775535583496094, 0.018955230712890625, 0.020134925842285156, 0.021314620971679688, 0.02249431610107422, 0.02367401123046875, 0.02485370635986328, 0.026033401489257812, 0.027213096618652344, 0.028392791748046875, 0.029572486877441406, 0.030752182006835938, 0.03193187713623047, 0.033111572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 15.0, 28.0, 22.0, 40.0, 48.0, 50.0, 65.0, 74.0, 78.0, 84.0, 91.0, 62.0, 66.0, 58.0, 46.0, 33.0, 43.0, 17.0, 17.0, 16.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.074951171875, -0.07318258285522461, -0.07141399383544922, -0.06964540481567383, -0.06787681579589844, -0.06610822677612305, -0.06433963775634766, -0.06257104873657227, -0.060802459716796875, -0.059033870697021484, -0.057265281677246094, -0.0554966926574707, -0.05372810363769531, -0.05195951461791992, -0.05019092559814453, -0.04842233657836914, -0.04665374755859375, -0.04488515853881836, -0.04311656951904297, -0.04134798049926758, -0.03957939147949219, -0.0378108024597168, -0.036042213439941406, -0.034273624420166016, -0.032505035400390625, -0.030736446380615234, -0.028967857360839844, -0.027199268341064453, -0.025430679321289062, -0.023662090301513672, -0.02189350128173828, -0.02012491226196289, -0.0183563232421875, -0.01658773422241211, -0.014819145202636719, -0.013050556182861328, -0.011281967163085938, -0.009513378143310547, -0.007744789123535156, -0.005976200103759766, -0.004207611083984375, -0.0024390220642089844, -0.0006704330444335938, 0.0010981559753417969, 0.0028667449951171875, 0.004635334014892578, 0.006403923034667969, 0.00817251205444336, 0.00994110107421875, 0.01170969009399414, 0.013478279113769531, 0.015246868133544922, 0.017015457153320312, 0.018784046173095703, 0.020552635192871094, 0.022321224212646484, 0.024089813232421875, 0.025858402252197266, 0.027626991271972656, 0.029395580291748047, 0.031164169311523438, 0.03293275833129883, 0.03470134735107422, 0.03646993637084961, 0.038238525390625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 20.0, 65.0, 261.0, 354.0, 197.0, 65.0, 19.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4630708694458008, -1.4112446308135986, -1.359418272972107, -1.3075919151306152, -1.255765676498413, -1.203939437866211, -1.1521130800247192, -1.1002867221832275, -1.0484604835510254, -0.9966341853141785, -0.9448078870773315, -0.8929815888404846, -0.8411552906036377, -0.7893289923667908, -0.7375026941299438, -0.6856763958930969, -0.63385009765625, -0.5820237994194031, -0.5301975011825562, -0.47837120294570923, -0.4265449047088623, -0.3747186064720154, -0.32289230823516846, -0.27106600999832153, -0.2192397117614746, -0.16741341352462769, -0.11558711528778076, -0.06376081705093384, -0.011934518814086914, 0.03989177942276001, 0.09171807765960693, 0.14354437589645386, 0.19537067413330078, 0.2471969723701477, 0.29902327060699463, 0.35084956884384155, 0.4026758670806885, 0.4545021653175354, 0.5063284635543823, 0.5581547617912292, 0.6099810600280762, 0.6618073582649231, 0.71363365650177, 0.7654599547386169, 0.8172862529754639, 0.8691125512123108, 0.9209388494491577, 0.9727651476860046, 1.0245914459228516, 1.0764176845550537, 1.1282440423965454, 1.180070400238037, 1.2318966388702393, 1.2837228775024414, 1.335549235343933, 1.3873755931854248, 1.439201831817627, 1.491028070449829, 1.5428544282913208, 1.5946807861328125, 1.6465070247650146, 1.6983332633972168, 1.7501596212387085, 1.8019859790802002, 1.8538122177124023]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 8.0, 13.0, 9.0, 15.0, 15.0, 22.0, 23.0, 28.0, 31.0, 25.0, 33.0, 37.0, 35.0, 37.0, 38.0, 42.0, 47.0, 39.0, 32.0, 50.0, 40.0, 32.0, 38.0, 38.0, 31.0, 33.0, 30.0, 38.0, 29.0, 17.0, 16.0, 11.0, 9.0, 7.0, 7.0, 3.0, 8.0, 5.0, 6.0, 3.0, 0.0, 8.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.526828944683075, -0.510692834854126, -0.494556725025177, -0.478420615196228, -0.46228450536727905, -0.4461483955383301, -0.4300122857093811, -0.41387617588043213, -0.39774006605148315, -0.3816039562225342, -0.3654678463935852, -0.34933173656463623, -0.33319562673568726, -0.3170595169067383, -0.3009234070777893, -0.28478729724884033, -0.26865118741989136, -0.2525150775909424, -0.2363789677619934, -0.22024285793304443, -0.20410674810409546, -0.18797063827514648, -0.1718345284461975, -0.15569841861724854, -0.13956230878829956, -0.12342619895935059, -0.10729008913040161, -0.09115397930145264, -0.07501786947250366, -0.05888175964355469, -0.04274564981460571, -0.02660953998565674, -0.010473489761352539, 0.0056626200675964355, 0.02179872989654541, 0.037934839725494385, 0.05407094955444336, 0.07020705938339233, 0.08634316921234131, 0.10247927904129028, 0.11861538887023926, 0.13475149869918823, 0.1508876085281372, 0.16702371835708618, 0.18315982818603516, 0.19929593801498413, 0.2154320478439331, 0.23156815767288208, 0.24770426750183105, 0.26384037733078003, 0.279976487159729, 0.296112596988678, 0.31224870681762695, 0.3283848166465759, 0.3445209264755249, 0.3606570363044739, 0.37679314613342285, 0.3929292559623718, 0.4090653657913208, 0.4252014756202698, 0.44133758544921875, 0.4574736952781677, 0.4736098051071167, 0.4897459149360657, 0.5058820247650146]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 9.0, 4.0, 3.0, 10.0, 18.0, 21.0, 24.0, 30.0, 56.0, 74.0, 107.0, 197.0, 344.0, 675.0, 1326.0, 2766.0, 6573.0, 16170.0, 42554.0, 129119.0, 408932.0, 1074726.0, 1438208.0, 718799.0, 235044.0, 73527.0, 25957.0, 10413.0, 4282.0, 2010.0, 999.0, 501.0, 276.0, 188.0, 112.0, 70.0, 47.0, 26.0, 23.0, 18.0, 15.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08326339721679688, -0.08083343505859375, -0.07840347290039062, -0.0759735107421875, -0.07354354858398438, -0.07111358642578125, -0.06868362426757812, -0.066253662109375, -0.06382369995117188, -0.06139373779296875, -0.058963775634765625, -0.0565338134765625, -0.054103851318359375, -0.05167388916015625, -0.049243927001953125, -0.04681396484375, -0.044384002685546875, -0.04195404052734375, -0.039524078369140625, -0.0370941162109375, -0.034664154052734375, -0.03223419189453125, -0.029804229736328125, -0.027374267578125, -0.024944305419921875, -0.02251434326171875, -0.020084381103515625, -0.0176544189453125, -0.015224456787109375, -0.01279449462890625, -0.010364532470703125, -0.0079345703125, -0.005504608154296875, -0.00307464599609375, -0.000644683837890625, 0.0017852783203125, 0.004215240478515625, 0.00664520263671875, 0.009075164794921875, 0.011505126953125, 0.013935089111328125, 0.01636505126953125, 0.018795013427734375, 0.0212249755859375, 0.023654937744140625, 0.02608489990234375, 0.028514862060546875, 0.03094482421875, 0.033374786376953125, 0.03580474853515625, 0.038234710693359375, 0.0406646728515625, 0.043094635009765625, 0.04552459716796875, 0.047954559326171875, 0.050384521484375, 0.052814483642578125, 0.05524444580078125, 0.057674407958984375, 0.0601043701171875, 0.06253433227539062, 0.06496429443359375, 0.06739425659179688, 0.06982421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 3.0, 8.0, 6.0, 12.0, 19.0, 11.0, 13.0, 18.0, 8.0, 24.0, 25.0, 28.0, 27.0, 37.0, 39.0, 40.0, 44.0, 48.0, 34.0, 39.0, 41.0, 37.0, 45.0, 35.0, 33.0, 31.0, 37.0, 34.0, 37.0, 20.0, 15.0, 15.0, 21.0, 18.0, 16.0, 7.0, 17.0, 12.0, 8.0, 8.0, 8.0, 6.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.07056522369384766, -0.06831550598144531, -0.06606578826904297, -0.06381607055664062, -0.06156635284423828, -0.05931663513183594, -0.057066917419433594, -0.05481719970703125, -0.052567481994628906, -0.05031776428222656, -0.04806804656982422, -0.045818328857421875, -0.04356861114501953, -0.04131889343261719, -0.039069175720214844, -0.0368194580078125, -0.034569740295410156, -0.03232002258300781, -0.03007030487060547, -0.027820587158203125, -0.02557086944580078, -0.023321151733398438, -0.021071434020996094, -0.01882171630859375, -0.016571998596191406, -0.014322280883789062, -0.012072563171386719, -0.009822845458984375, -0.007573127746582031, -0.0053234100341796875, -0.0030736923217773438, -0.000823974609375, 0.0014257431030273438, 0.0036754608154296875, 0.005925178527832031, 0.008174896240234375, 0.010424613952636719, 0.012674331665039062, 0.014924049377441406, 0.01717376708984375, 0.019423484802246094, 0.021673202514648438, 0.02392292022705078, 0.026172637939453125, 0.02842235565185547, 0.030672073364257812, 0.032921791076660156, 0.0351715087890625, 0.037421226501464844, 0.03967094421386719, 0.04192066192626953, 0.044170379638671875, 0.04642009735107422, 0.04866981506347656, 0.050919532775878906, 0.05316925048828125, 0.055418968200683594, 0.05766868591308594, 0.05991840362548828, 0.062168121337890625, 0.06441783905029297, 0.06666755676269531, 0.06891727447509766, 0.0711669921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 15.0, 23.0, 38.0, 72.0, 140.0, 209.0, 458.0, 889.0, 2276.0, 6793.0, 26063.0, 123595.0, 923294.0, 2633868.0, 388153.0, 65760.0, 15101.0, 4476.0, 1601.0, 689.0, 314.0, 187.0, 101.0, 49.0, 30.0, 17.0, 19.0, 12.0, 10.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1746196746826172, -0.16967391967773438, -0.16472816467285156, -0.15978240966796875, -0.15483665466308594, -0.14989089965820312, -0.1449451446533203, -0.1399993896484375, -0.1350536346435547, -0.13010787963867188, -0.12516212463378906, -0.12021636962890625, -0.11527061462402344, -0.11032485961914062, -0.10537910461425781, -0.100433349609375, -0.09548759460449219, -0.09054183959960938, -0.08559608459472656, -0.08065032958984375, -0.07570457458496094, -0.07075881958007812, -0.06581306457519531, -0.0608673095703125, -0.05592155456542969, -0.050975799560546875, -0.04603004455566406, -0.04108428955078125, -0.03613853454589844, -0.031192779541015625, -0.026247024536132812, -0.02130126953125, -0.016355514526367188, -0.011409759521484375, -0.0064640045166015625, -0.00151824951171875, 0.0034275054931640625, 0.008373260498046875, 0.013319015502929688, 0.0182647705078125, 0.023210525512695312, 0.028156280517578125, 0.03310203552246094, 0.03804779052734375, 0.04299354553222656, 0.047939300537109375, 0.05288505554199219, 0.057830810546875, 0.06277656555175781, 0.06772232055664062, 0.07266807556152344, 0.07761383056640625, 0.08255958557128906, 0.08750534057617188, 0.09245109558105469, 0.0973968505859375, 0.10234260559082031, 0.10728836059570312, 0.11223411560058594, 0.11717987060546875, 0.12212562561035156, 0.12707138061523438, 0.1320171356201172, 0.136962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 23.0, 18.0, 31.0, 38.0, 52.0, 83.0, 110.0, 161.0, 239.0, 365.0, 408.0, 531.0, 527.0, 404.0, 300.0, 193.0, 126.0, 101.0, 73.0, 53.0, 37.0, 35.0, 27.0, 21.0, 11.0, 13.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09765625, -0.093719482421875, -0.08978271484375, -0.085845947265625, -0.0819091796875, -0.077972412109375, -0.07403564453125, -0.070098876953125, -0.066162109375, -0.062225341796875, -0.05828857421875, -0.054351806640625, -0.0504150390625, -0.046478271484375, -0.04254150390625, -0.038604736328125, -0.03466796875, -0.030731201171875, -0.02679443359375, -0.022857666015625, -0.0189208984375, -0.014984130859375, -0.01104736328125, -0.007110595703125, -0.003173828125, 0.000762939453125, 0.00469970703125, 0.008636474609375, 0.0125732421875, 0.016510009765625, 0.02044677734375, 0.024383544921875, 0.0283203125, 0.032257080078125, 0.03619384765625, 0.040130615234375, 0.0440673828125, 0.048004150390625, 0.05194091796875, 0.055877685546875, 0.059814453125, 0.063751220703125, 0.06768798828125, 0.071624755859375, 0.0755615234375, 0.079498291015625, 0.08343505859375, 0.087371826171875, 0.09130859375, 0.095245361328125, 0.09918212890625, 0.103118896484375, 0.1070556640625, 0.110992431640625, 0.11492919921875, 0.118865966796875, 0.122802734375, 0.126739501953125, 0.13067626953125, 0.134613037109375, 0.1385498046875, 0.142486572265625, 0.14642333984375, 0.150360107421875, 0.154296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 14.0, 20.0, 38.0, 78.0, 92.0, 116.0, 152.0, 126.0, 114.0, 84.0, 65.0, 39.0, 16.0, 14.0, 9.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0181869268417358, -0.9925392866134644, -0.9668917059898376, -0.9412440657615662, -0.9155964851379395, -0.889948844909668, -0.8643012046813965, -0.8386536240577698, -0.8130060434341431, -0.7873584032058716, -0.7617108225822449, -0.7360631823539734, -0.7104156017303467, -0.6847679615020752, -0.6591203212738037, -0.633472740650177, -0.6078251004219055, -0.582177460193634, -0.5565298795700073, -0.5308822393417358, -0.5052346587181091, -0.47958701848983765, -0.45393940806388855, -0.42829179763793945, -0.40264418721199036, -0.37699657678604126, -0.35134896636009216, -0.32570135593414307, -0.3000537157058716, -0.2744061350822449, -0.2487584948539734, -0.2231108844280243, -0.1974632740020752, -0.1718156635761261, -0.146168053150177, -0.12052042782306671, -0.09487281739711761, -0.06922520697116852, -0.04357758164405823, -0.01792997121810913, 0.007717639207839966, 0.03336525335907936, 0.059012867510318756, 0.08466048538684845, 0.11030809581279755, 0.13595570623874664, 0.16160333156585693, 0.18725094199180603, 0.21289855241775513, 0.23854616284370422, 0.2641937732696533, 0.2898414134979248, 0.3154889941215515, 0.341136634349823, 0.3667842447757721, 0.3924318552017212, 0.4180794656276703, 0.4437270760536194, 0.4693746864795685, 0.4950222969055176, 0.5206699371337891, 0.5463175177574158, 0.5719651579856873, 0.597612738609314, 0.6232603788375854]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 7.0, 3.0, 9.0, 16.0, 15.0, 19.0, 18.0, 28.0, 25.0, 35.0, 25.0, 40.0, 40.0, 43.0, 66.0, 55.0, 47.0, 46.0, 43.0, 41.0, 41.0, 54.0, 38.0, 41.0, 32.0, 24.0, 32.0, 31.0, 18.0, 12.0, 12.0, 17.0, 6.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5241436958312988, -0.5090140700340271, -0.49388444423675537, -0.47875481843948364, -0.4636251926422119, -0.4484955668449402, -0.43336591124534607, -0.41823628544807434, -0.4031066596508026, -0.3879770338535309, -0.37284740805625916, -0.3577177822589874, -0.3425881266593933, -0.3274585008621216, -0.31232887506484985, -0.2971992492675781, -0.2820696234703064, -0.26693999767303467, -0.25181037187576294, -0.23668073117733002, -0.2215511053800583, -0.20642147958278656, -0.19129183888435364, -0.1761622130870819, -0.16103258728981018, -0.14590296149253845, -0.13077333569526672, -0.1156436949968338, -0.10051406919956207, -0.08538444340229034, -0.07025481015443802, -0.05512517690658569, -0.039995551109313965, -0.024865921586751938, -0.009736292064189911, 0.005393337458372116, 0.020522966980934143, 0.03565259277820587, 0.0507822260260582, 0.06591185927391052, 0.08104148507118225, 0.09617111086845398, 0.1113007441163063, 0.12643037736415863, 0.14156000316143036, 0.1566896289587021, 0.171819269657135, 0.18694889545440674, 0.20207852125167847, 0.2172081470489502, 0.23233777284622192, 0.24746741354465485, 0.2625970244407654, 0.2777266502380371, 0.2928563058376312, 0.30798593163490295, 0.3231155574321747, 0.3382451832294464, 0.35337480902671814, 0.36850443482398987, 0.383634090423584, 0.3987637162208557, 0.41389334201812744, 0.42902296781539917, 0.4441525936126709]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 13.0, 31.0, 44.0, 69.0, 136.0, 260.0, 561.0, 1209.0, 3088.0, 8227.0, 23399.0, 85583.0, 346571.0, 415748.0, 117054.0, 29958.0, 10119.0, 3811.0, 1454.0, 562.0, 291.0, 158.0, 75.0, 50.0, 29.0, 14.0, 14.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15087890625, -0.14569473266601562, -0.14051055908203125, -0.13532638549804688, -0.1301422119140625, -0.12495803833007812, -0.11977386474609375, -0.11458969116210938, -0.109405517578125, -0.10422134399414062, -0.09903717041015625, -0.09385299682617188, -0.0886688232421875, -0.08348464965820312, -0.07830047607421875, -0.07311630249023438, -0.06793212890625, -0.06274795532226562, -0.05756378173828125, -0.052379608154296875, -0.0471954345703125, -0.042011260986328125, -0.03682708740234375, -0.031642913818359375, -0.026458740234375, -0.021274566650390625, -0.01609039306640625, -0.010906219482421875, -0.0057220458984375, -0.000537872314453125, 0.00464630126953125, 0.009830474853515625, 0.0150146484375, 0.020198822021484375, 0.02538299560546875, 0.030567169189453125, 0.0357513427734375, 0.040935516357421875, 0.04611968994140625, 0.051303863525390625, 0.056488037109375, 0.061672210693359375, 0.06685638427734375, 0.07204055786132812, 0.0772247314453125, 0.08240890502929688, 0.08759307861328125, 0.09277725219726562, 0.09796142578125, 0.10314559936523438, 0.10832977294921875, 0.11351394653320312, 0.1186981201171875, 0.12388229370117188, 0.12906646728515625, 0.13425064086914062, 0.139434814453125, 0.14461898803710938, 0.14980316162109375, 0.15498733520507812, 0.1601715087890625, 0.16535568237304688, 0.17053985595703125, 0.17572402954101562, 0.180908203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 4.0, 10.0, 17.0, 8.0, 9.0, 16.0, 17.0, 15.0, 21.0, 27.0, 28.0, 26.0, 26.0, 36.0, 29.0, 37.0, 29.0, 40.0, 43.0, 45.0, 38.0, 39.0, 38.0, 50.0, 38.0, 37.0, 38.0, 29.0, 27.0, 35.0, 13.0, 21.0, 13.0, 18.0, 13.0, 8.0, 11.0, 9.0, 7.0, 9.0, 2.0, 8.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06804466247558594, -0.06583786010742188, -0.06363105773925781, -0.06142425537109375, -0.05921745300292969, -0.057010650634765625, -0.05480384826660156, -0.0525970458984375, -0.05039024353027344, -0.048183441162109375, -0.04597663879394531, -0.04376983642578125, -0.04156303405761719, -0.039356231689453125, -0.03714942932128906, -0.034942626953125, -0.03273582458496094, -0.030529022216796875, -0.028322219848632812, -0.02611541748046875, -0.023908615112304688, -0.021701812744140625, -0.019495010375976562, -0.0172882080078125, -0.015081405639648438, -0.012874603271484375, -0.010667800903320312, -0.00846099853515625, -0.0062541961669921875, -0.004047393798828125, -0.0018405914306640625, 0.0003662109375, 0.0025730133056640625, 0.004779815673828125, 0.0069866180419921875, 0.00919342041015625, 0.011400222778320312, 0.013607025146484375, 0.015813827514648438, 0.0180206298828125, 0.020227432250976562, 0.022434234619140625, 0.024641036987304688, 0.02684783935546875, 0.029054641723632812, 0.031261444091796875, 0.03346824645996094, 0.035675048828125, 0.03788185119628906, 0.040088653564453125, 0.04229545593261719, 0.04450225830078125, 0.04670906066894531, 0.048915863037109375, 0.05112266540527344, 0.0533294677734375, 0.05553627014160156, 0.057743072509765625, 0.05994987487792969, 0.06215667724609375, 0.06436347961425781, 0.06657028198242188, 0.06877708435058594, 0.07098388671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 16.0, 27.0, 35.0, 53.0, 110.0, 132.0, 247.0, 442.0, 783.0, 1503.0, 3004.0, 5923.0, 12502.0, 29141.0, 84162.0, 263428.0, 389729.0, 166566.0, 52456.0, 19851.0, 9011.0, 4497.0, 2216.0, 1156.0, 639.0, 293.0, 239.0, 117.0, 72.0, 51.0, 40.0, 26.0, 18.0, 12.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.124786376953125, -0.12066650390625, -0.116546630859375, -0.1124267578125, -0.108306884765625, -0.10418701171875, -0.100067138671875, -0.095947265625, -0.091827392578125, -0.08770751953125, -0.083587646484375, -0.0794677734375, -0.075347900390625, -0.07122802734375, -0.067108154296875, -0.06298828125, -0.058868408203125, -0.05474853515625, -0.050628662109375, -0.0465087890625, -0.042388916015625, -0.03826904296875, -0.034149169921875, -0.030029296875, -0.025909423828125, -0.02178955078125, -0.017669677734375, -0.0135498046875, -0.009429931640625, -0.00531005859375, -0.001190185546875, 0.0029296875, 0.007049560546875, 0.01116943359375, 0.015289306640625, 0.0194091796875, 0.023529052734375, 0.02764892578125, 0.031768798828125, 0.035888671875, 0.040008544921875, 0.04412841796875, 0.048248291015625, 0.0523681640625, 0.056488037109375, 0.06060791015625, 0.064727783203125, 0.06884765625, 0.072967529296875, 0.07708740234375, 0.081207275390625, 0.0853271484375, 0.089447021484375, 0.09356689453125, 0.097686767578125, 0.101806640625, 0.105926513671875, 0.11004638671875, 0.114166259765625, 0.1182861328125, 0.122406005859375, 0.12652587890625, 0.130645751953125, 0.134765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 9.0, 12.0, 11.0, 16.0, 21.0, 26.0, 29.0, 38.0, 35.0, 49.0, 37.0, 43.0, 50.0, 59.0, 59.0, 46.0, 54.0, 41.0, 44.0, 41.0, 38.0, 29.0, 37.0, 30.0, 21.0, 21.0, 14.0, 16.0, 19.0, 14.0, 5.0, 7.0, 8.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.21668243408203125, -0.2087554931640625, -0.20082855224609375, -0.192901611328125, -0.18497467041015625, -0.1770477294921875, -0.16912078857421875, -0.16119384765625, -0.15326690673828125, -0.1453399658203125, -0.13741302490234375, -0.129486083984375, -0.12155914306640625, -0.1136322021484375, -0.10570526123046875, -0.0977783203125, -0.08985137939453125, -0.0819244384765625, -0.07399749755859375, -0.066070556640625, -0.05814361572265625, -0.0502166748046875, -0.04228973388671875, -0.03436279296875, -0.02643585205078125, -0.0185089111328125, -0.01058197021484375, -0.002655029296875, 0.00527191162109375, 0.0131988525390625, 0.02112579345703125, 0.029052734375, 0.03697967529296875, 0.0449066162109375, 0.05283355712890625, 0.060760498046875, 0.06868743896484375, 0.0766143798828125, 0.08454132080078125, 0.09246826171875, 0.10039520263671875, 0.1083221435546875, 0.11624908447265625, 0.124176025390625, 0.13210296630859375, 0.1400299072265625, 0.14795684814453125, 0.1558837890625, 0.16381072998046875, 0.1717376708984375, 0.17966461181640625, 0.187591552734375, 0.19551849365234375, 0.2034454345703125, 0.21137237548828125, 0.21929931640625, 0.22722625732421875, 0.2351531982421875, 0.24308013916015625, 0.251007080078125, 0.25893402099609375, 0.2668609619140625, 0.27478790283203125, 0.28271484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 15.0, 21.0, 37.0, 63.0, 77.0, 134.0, 194.0, 358.0, 525.0, 737.0, 1244.0, 1880.0, 3006.0, 5016.0, 8043.0, 13878.0, 25436.0, 50556.0, 110948.0, 233992.0, 281047.0, 161020.0, 71570.0, 33647.0, 18107.0, 10282.0, 6241.0, 3813.0, 2337.0, 1442.0, 986.0, 632.0, 421.0, 288.0, 176.0, 126.0, 90.0, 46.0, 36.0, 18.0, 13.0, 11.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03343963623046875, -0.0323333740234375, -0.03122711181640625, -0.030120849609375, -0.02901458740234375, -0.0279083251953125, -0.02680206298828125, -0.02569580078125, -0.02458953857421875, -0.0234832763671875, -0.02237701416015625, -0.021270751953125, -0.02016448974609375, -0.0190582275390625, -0.01795196533203125, -0.016845703125, -0.01573944091796875, -0.0146331787109375, -0.01352691650390625, -0.012420654296875, -0.01131439208984375, -0.0102081298828125, -0.00910186767578125, -0.00799560546875, -0.00688934326171875, -0.0057830810546875, -0.00467681884765625, -0.003570556640625, -0.00246429443359375, -0.0013580322265625, -0.00025177001953125, 0.0008544921875, 0.00196075439453125, 0.0030670166015625, 0.00417327880859375, 0.005279541015625, 0.00638580322265625, 0.0074920654296875, 0.00859832763671875, 0.00970458984375, 0.01081085205078125, 0.0119171142578125, 0.01302337646484375, 0.014129638671875, 0.01523590087890625, 0.0163421630859375, 0.01744842529296875, 0.0185546875, 0.01966094970703125, 0.0207672119140625, 0.02187347412109375, 0.022979736328125, 0.02408599853515625, 0.0251922607421875, 0.02629852294921875, 0.02740478515625, 0.02851104736328125, 0.0296173095703125, 0.03072357177734375, 0.031829833984375, 0.03293609619140625, 0.0340423583984375, 0.03514862060546875, 0.0362548828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 10.0, 9.0, 22.0, 24.0, 22.0, 39.0, 67.0, 94.0, 92.0, 99.0, 95.0, 82.0, 85.0, 63.0, 48.0, 35.0, 21.0, 17.0, 15.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.4842487871646881e-05, -1.424737274646759e-05, -1.36522576212883e-05, -1.3057142496109009e-05, -1.2462027370929718e-05, -1.1866912245750427e-05, -1.1271797120571136e-05, -1.0676681995391846e-05, -1.0081566870212555e-05, -9.486451745033264e-06, -8.891336619853973e-06, -8.296221494674683e-06, -7.701106369495392e-06, -7.105991244316101e-06, -6.51087611913681e-06, -5.9157609939575195e-06, -5.320645868778229e-06, -4.725530743598938e-06, -4.130415618419647e-06, -3.5353004932403564e-06, -2.9401853680610657e-06, -2.345070242881775e-06, -1.7499551177024841e-06, -1.1548399925231934e-06, -5.597248673439026e-07, 3.5390257835388184e-08, 6.30505383014679e-07, 1.2256205081939697e-06, 1.8207356333732605e-06, 2.4158507585525513e-06, 3.010965883731842e-06, 3.606081008911133e-06, 4.201196134090424e-06, 4.796311259269714e-06, 5.391426384449005e-06, 5.986541509628296e-06, 6.581656634807587e-06, 7.1767717599868774e-06, 7.771886885166168e-06, 8.367002010345459e-06, 8.96211713552475e-06, 9.55723226070404e-06, 1.0152347385883331e-05, 1.0747462511062622e-05, 1.1342577636241913e-05, 1.1937692761421204e-05, 1.2532807886600494e-05, 1.3127923011779785e-05, 1.3723038136959076e-05, 1.4318153262138367e-05, 1.4913268387317657e-05, 1.5508383512496948e-05, 1.610349863767624e-05, 1.669861376285553e-05, 1.729372888803482e-05, 1.788884401321411e-05, 1.8483959138393402e-05, 1.9079074263572693e-05, 1.9674189388751984e-05, 2.0269304513931274e-05, 2.0864419639110565e-05, 2.1459534764289856e-05, 2.2054649889469147e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 9.0, 12.0, 14.0, 37.0, 48.0, 92.0, 186.0, 383.0, 823.0, 1720.0, 3894.0, 9033.0, 20306.0, 47786.0, 122532.0, 278443.0, 309787.0, 151562.0, 58031.0, 24335.0, 10696.0, 4774.0, 2086.0, 981.0, 435.0, 243.0, 125.0, 70.0, 37.0, 25.0, 8.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03765869140625, -0.0362696647644043, -0.034880638122558594, -0.03349161148071289, -0.03210258483886719, -0.030713558197021484, -0.02932453155517578, -0.027935504913330078, -0.026546478271484375, -0.025157451629638672, -0.02376842498779297, -0.022379398345947266, -0.020990371704101562, -0.01960134506225586, -0.018212318420410156, -0.016823291778564453, -0.01543426513671875, -0.014045238494873047, -0.012656211853027344, -0.01126718521118164, -0.009878158569335938, -0.008489131927490234, -0.007100105285644531, -0.005711078643798828, -0.004322052001953125, -0.002933025360107422, -0.0015439987182617188, -0.00015497207641601562, 0.0012340545654296875, 0.0026230812072753906, 0.004012107849121094, 0.005401134490966797, 0.0067901611328125, 0.008179187774658203, 0.009568214416503906, 0.01095724105834961, 0.012346267700195312, 0.013735294342041016, 0.015124320983886719, 0.016513347625732422, 0.017902374267578125, 0.019291400909423828, 0.02068042755126953, 0.022069454193115234, 0.023458480834960938, 0.02484750747680664, 0.026236534118652344, 0.027625560760498047, 0.02901458740234375, 0.030403614044189453, 0.031792640686035156, 0.03318166732788086, 0.03457069396972656, 0.035959720611572266, 0.03734874725341797, 0.03873777389526367, 0.040126800537109375, 0.04151582717895508, 0.04290485382080078, 0.044293880462646484, 0.04568290710449219, 0.04707193374633789, 0.048460960388183594, 0.0498499870300293, 0.051239013671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 2.0, 4.0, 8.0, 9.0, 17.0, 22.0, 24.0, 38.0, 35.0, 52.0, 49.0, 71.0, 80.0, 60.0, 72.0, 66.0, 53.0, 58.0, 49.0, 30.0, 33.0, 28.0, 18.0, 14.0, 24.0, 9.0, 11.0, 6.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.045257568359375, -0.043843746185302734, -0.04242992401123047, -0.0410161018371582, -0.03960227966308594, -0.03818845748901367, -0.036774635314941406, -0.03536081314086914, -0.033946990966796875, -0.03253316879272461, -0.031119346618652344, -0.029705524444580078, -0.028291702270507812, -0.026877880096435547, -0.02546405792236328, -0.024050235748291016, -0.02263641357421875, -0.021222591400146484, -0.01980876922607422, -0.018394947052001953, -0.016981124877929688, -0.015567302703857422, -0.014153480529785156, -0.01273965835571289, -0.011325836181640625, -0.00991201400756836, -0.008498191833496094, -0.007084369659423828, -0.0056705474853515625, -0.004256725311279297, -0.0028429031372070312, -0.0014290809631347656, -1.52587890625e-05, 0.0013985633850097656, 0.0028123855590820312, 0.004226207733154297, 0.0056400299072265625, 0.007053852081298828, 0.008467674255371094, 0.00988149642944336, 0.011295318603515625, 0.01270914077758789, 0.014122962951660156, 0.015536785125732422, 0.016950607299804688, 0.018364429473876953, 0.01977825164794922, 0.021192073822021484, 0.02260589599609375, 0.024019718170166016, 0.02543354034423828, 0.026847362518310547, 0.028261184692382812, 0.029675006866455078, 0.031088829040527344, 0.03250265121459961, 0.033916473388671875, 0.03533029556274414, 0.036744117736816406, 0.03815793991088867, 0.03957176208496094, 0.0409855842590332, 0.04239940643310547, 0.043813228607177734, 0.04522705078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 19.0, 50.0, 98.0, 166.0, 201.0, 178.0, 143.0, 70.0, 39.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5278503894805908, -1.4943004846572876, -1.4607505798339844, -1.4272006750106812, -1.393650770187378, -1.3601009845733643, -1.326551079750061, -1.2930011749267578, -1.2594512701034546, -1.2259013652801514, -1.1923514604568481, -1.158801555633545, -1.1252517700195312, -1.091701865196228, -1.0581519603729248, -1.0246020555496216, -0.9910521507263184, -0.9575022459030151, -0.9239523410797119, -0.8904024958610535, -0.8568525910377502, -0.823302686214447, -0.7897528409957886, -0.7562029361724854, -0.7226530313491821, -0.6891031265258789, -0.6555532217025757, -0.6220033764839172, -0.588453471660614, -0.5549035668373108, -0.5213537216186523, -0.4878038167953491, -0.4542539119720459, -0.4207040071487427, -0.38715413212776184, -0.353604257106781, -0.3200543522834778, -0.28650444746017456, -0.2529545724391937, -0.2194046825170517, -0.18585479259490967, -0.15230490267276764, -0.11875501275062561, -0.08520512282848358, -0.05165523290634155, -0.018105342984199524, 0.015444546937942505, 0.048994436860084534, 0.08254432678222656, 0.11609421670436859, 0.14964410662651062, 0.18319399654865265, 0.21674388647079468, 0.2502937912940979, 0.28384366631507874, 0.31739354133605957, 0.3509434461593628, 0.384493350982666, 0.41804322600364685, 0.4515931010246277, 0.4851430058479309, 0.5186929106712341, 0.5522427558898926, 0.5857926607131958, 0.619342565536499]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 13.0, 20.0, 21.0, 18.0, 27.0, 26.0, 29.0, 37.0, 44.0, 36.0, 43.0, 43.0, 53.0, 44.0, 56.0, 49.0, 37.0, 46.0, 51.0, 38.0, 31.0, 28.0, 33.0, 23.0, 20.0, 18.0, 21.0, 21.0, 7.0, 17.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5830000638961792, -0.5650597214698792, -0.5471193194389343, -0.5291789770126343, -0.5112386345863342, -0.4932982325553894, -0.47535789012908936, -0.4574175179004669, -0.4394771456718445, -0.42153677344322205, -0.403596431016922, -0.38565605878829956, -0.3677156865596771, -0.3497753143310547, -0.33183497190475464, -0.3138945996761322, -0.29595425724983215, -0.2780138850212097, -0.26007354259490967, -0.24213317036628723, -0.2241927981376648, -0.20625244081020355, -0.1883120834827423, -0.17037171125411987, -0.15243135392665863, -0.1344909965991974, -0.11655062437057495, -0.09861026704311371, -0.08066990226507187, -0.06272953748703003, -0.04478918015956879, -0.02684880793094635, -0.008908450603485107, 0.009031912311911583, 0.026972275227308273, 0.044912636280059814, 0.06285300105810165, 0.0807933658361435, 0.09873372316360474, 0.11667409539222717, 0.13461445271968842, 0.15255481004714966, 0.1704951822757721, 0.18843553960323334, 0.20637589693069458, 0.22431626915931702, 0.24225662648677826, 0.2601969838142395, 0.27813735604286194, 0.2960777282714844, 0.3140180706977844, 0.33195844292640686, 0.3498988151550293, 0.36783915758132935, 0.3857795298099518, 0.4037199020385742, 0.42166024446487427, 0.4396006166934967, 0.45754095911979675, 0.4754813313484192, 0.4934217035770416, 0.5113620758056641, 0.5293024182319641, 0.5472427606582642, 0.565183162689209]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 20.0, 21.0, 29.0, 53.0, 94.0, 167.0, 262.0, 476.0, 891.0, 1803.0, 3472.0, 7926.0, 18723.0, 45754.0, 114271.0, 279064.0, 599656.0, 977980.0, 1004317.0, 627732.0, 298477.0, 125389.0, 50570.0, 20235.0, 8923.0, 4029.0, 1853.0, 953.0, 515.0, 248.0, 138.0, 81.0, 51.0, 27.0, 13.0, 20.0, 9.0, 7.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05782794952392578, -0.05590248107910156, -0.053977012634277344, -0.052051544189453125, -0.050126075744628906, -0.04820060729980469, -0.04627513885498047, -0.04434967041015625, -0.04242420196533203, -0.04049873352050781, -0.038573265075683594, -0.036647796630859375, -0.034722328186035156, -0.03279685974121094, -0.03087139129638672, -0.0289459228515625, -0.02702045440673828, -0.025094985961914062, -0.023169517517089844, -0.021244049072265625, -0.019318580627441406, -0.017393112182617188, -0.015467643737792969, -0.01354217529296875, -0.011616706848144531, -0.009691238403320312, -0.007765769958496094, -0.005840301513671875, -0.003914833068847656, -0.0019893646240234375, -6.389617919921875e-05, 0.001861572265625, 0.0037870407104492188, 0.0057125091552734375, 0.007637977600097656, 0.009563446044921875, 0.011488914489746094, 0.013414382934570312, 0.015339851379394531, 0.01726531982421875, 0.01919078826904297, 0.021116256713867188, 0.023041725158691406, 0.024967193603515625, 0.026892662048339844, 0.028818130493164062, 0.03074359893798828, 0.0326690673828125, 0.03459453582763672, 0.03652000427246094, 0.038445472717285156, 0.040370941162109375, 0.042296409606933594, 0.04422187805175781, 0.04614734649658203, 0.04807281494140625, 0.04999828338623047, 0.05192375183105469, 0.053849220275878906, 0.055774688720703125, 0.057700157165527344, 0.05962562561035156, 0.06155109405517578, 0.0634765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 7.0, 8.0, 12.0, 17.0, 16.0, 17.0, 24.0, 12.0, 27.0, 30.0, 26.0, 32.0, 28.0, 37.0, 45.0, 57.0, 56.0, 54.0, 38.0, 42.0, 36.0, 24.0, 47.0, 38.0, 24.0, 30.0, 22.0, 23.0, 31.0, 22.0, 13.0, 12.0, 17.0, 7.0, 12.0, 11.0, 4.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07668399810791016, -0.07426643371582031, -0.07184886932373047, -0.06943130493164062, -0.06701374053955078, -0.06459617614746094, -0.062178611755371094, -0.05976104736328125, -0.057343482971191406, -0.05492591857910156, -0.05250835418701172, -0.050090789794921875, -0.04767322540283203, -0.04525566101074219, -0.042838096618652344, -0.0404205322265625, -0.038002967834472656, -0.03558540344238281, -0.03316783905029297, -0.030750274658203125, -0.02833271026611328, -0.025915145874023438, -0.023497581481933594, -0.02108001708984375, -0.018662452697753906, -0.016244888305664062, -0.013827323913574219, -0.011409759521484375, -0.008992195129394531, -0.0065746307373046875, -0.004157066345214844, -0.001739501953125, 0.0006780624389648438, 0.0030956268310546875, 0.005513191223144531, 0.007930755615234375, 0.010348320007324219, 0.012765884399414062, 0.015183448791503906, 0.01760101318359375, 0.020018577575683594, 0.022436141967773438, 0.02485370635986328, 0.027271270751953125, 0.02968883514404297, 0.03210639953613281, 0.034523963928222656, 0.0369415283203125, 0.039359092712402344, 0.04177665710449219, 0.04419422149658203, 0.046611785888671875, 0.04902935028076172, 0.05144691467285156, 0.053864479064941406, 0.05628204345703125, 0.058699607849121094, 0.06111717224121094, 0.06353473663330078, 0.06595230102539062, 0.06836986541748047, 0.07078742980957031, 0.07320499420166016, 0.07562255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 10.0, 19.0, 22.0, 43.0, 74.0, 120.0, 336.0, 847.0, 3084.0, 14582.0, 98381.0, 1059179.0, 2670946.0, 301412.0, 36396.0, 6313.0, 1552.0, 488.0, 201.0, 131.0, 44.0, 41.0, 17.0, 8.0, 14.0, 11.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14208984375, -0.13597869873046875, -0.1298675537109375, -0.12375640869140625, -0.117645263671875, -0.11153411865234375, -0.1054229736328125, -0.09931182861328125, -0.09320068359375, -0.08708953857421875, -0.0809783935546875, -0.07486724853515625, -0.068756103515625, -0.06264495849609375, -0.0565338134765625, -0.05042266845703125, -0.0443115234375, -0.03820037841796875, -0.0320892333984375, -0.02597808837890625, -0.019866943359375, -0.01375579833984375, -0.0076446533203125, -0.00153350830078125, 0.00457763671875, 0.01068878173828125, 0.0167999267578125, 0.02291107177734375, 0.029022216796875, 0.03513336181640625, 0.0412445068359375, 0.04735565185546875, 0.053466796875, 0.05957794189453125, 0.0656890869140625, 0.07180023193359375, 0.077911376953125, 0.08402252197265625, 0.0901336669921875, 0.09624481201171875, 0.10235595703125, 0.10846710205078125, 0.1145782470703125, 0.12068939208984375, 0.126800537109375, 0.13291168212890625, 0.1390228271484375, 0.14513397216796875, 0.1512451171875, 0.15735626220703125, 0.1634674072265625, 0.16957855224609375, 0.175689697265625, 0.18180084228515625, 0.1879119873046875, 0.19402313232421875, 0.20013427734375, 0.20624542236328125, 0.2123565673828125, 0.21846771240234375, 0.224578857421875, 0.23069000244140625, 0.2368011474609375, 0.24291229248046875, 0.2490234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 2.0, 14.0, 17.0, 43.0, 54.0, 68.0, 144.0, 200.0, 314.0, 578.0, 730.0, 710.0, 484.0, 262.0, 157.0, 106.0, 63.0, 50.0, 34.0, 14.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12238693237304688, -0.11586761474609375, -0.10934829711914062, -0.1028289794921875, -0.09630966186523438, -0.08979034423828125, -0.08327102661132812, -0.076751708984375, -0.07023239135742188, -0.06371307373046875, -0.057193756103515625, -0.0506744384765625, -0.044155120849609375, -0.03763580322265625, -0.031116485595703125, -0.02459716796875, -0.018077850341796875, -0.01155853271484375, -0.005039215087890625, 0.0014801025390625, 0.007999420166015625, 0.01451873779296875, 0.021038055419921875, 0.027557373046875, 0.034076690673828125, 0.04059600830078125, 0.047115325927734375, 0.0536346435546875, 0.060153961181640625, 0.06667327880859375, 0.07319259643554688, 0.0797119140625, 0.08623123168945312, 0.09275054931640625, 0.09926986694335938, 0.1057891845703125, 0.11230850219726562, 0.11882781982421875, 0.12534713745117188, 0.131866455078125, 0.13838577270507812, 0.14490509033203125, 0.15142440795898438, 0.1579437255859375, 0.16446304321289062, 0.17098236083984375, 0.17750167846679688, 0.18402099609375, 0.19054031372070312, 0.19705963134765625, 0.20357894897460938, 0.2100982666015625, 0.21661758422851562, 0.22313690185546875, 0.22965621948242188, 0.236175537109375, 0.24269485473632812, 0.24921417236328125, 0.2557334899902344, 0.2622528076171875, 0.2687721252441406, 0.27529144287109375, 0.2818107604980469, 0.288330078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 24.0, 36.0, 69.0, 115.0, 157.0, 178.0, 163.0, 100.0, 78.0, 42.0, 13.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4230341911315918, -1.3887436389923096, -1.3544529676437378, -1.3201624155044556, -1.2858717441558838, -1.2515811920166016, -1.2172906398773193, -1.1829999685287476, -1.1487094163894653, -1.114418864250183, -1.0801281929016113, -1.045837640762329, -1.0115470886230469, -0.9772564172744751, -0.9429658651351929, -0.9086752533912659, -0.8743846416473389, -0.8400940299034119, -0.8058034181594849, -0.7715128660202026, -0.7372222542762756, -0.7029316425323486, -0.6686410903930664, -0.6343504786491394, -0.6000598669052124, -0.5657692551612854, -0.5314786434173584, -0.49718809127807617, -0.46289747953414917, -0.42860686779022217, -0.39431628584861755, -0.36002570390701294, -0.3257349729537964, -0.2914443612098694, -0.25715377926826477, -0.22286318242549896, -0.18857258558273315, -0.15428198873996735, -0.11999139189720154, -0.08570079505443573, -0.05141019821166992, -0.017119601368904114, 0.017170995473861694, 0.0514615923166275, 0.08575218915939331, 0.12004278600215912, 0.15433338284492493, 0.18862397968769073, 0.22291457653045654, 0.25720518827438354, 0.29149577021598816, 0.3257863521575928, 0.3600769639015198, 0.3943675756454468, 0.4286581575870514, 0.462948739528656, 0.497239351272583, 0.53152996301651, 0.565820574760437, 0.6001111268997192, 0.6344017386436462, 0.6686923503875732, 0.7029829025268555, 0.7372735142707825, 0.7715641260147095]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 11.0, 6.0, 10.0, 18.0, 22.0, 23.0, 25.0, 25.0, 35.0, 19.0, 30.0, 45.0, 44.0, 44.0, 41.0, 36.0, 57.0, 67.0, 48.0, 44.0, 33.0, 45.0, 32.0, 35.0, 36.0, 18.0, 28.0, 24.0, 19.0, 20.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5732724666595459, -0.5583806037902832, -0.5434887409210205, -0.5285968780517578, -0.5137050151824951, -0.4988131523132324, -0.4839212894439697, -0.46902942657470703, -0.45413756370544434, -0.43924570083618164, -0.42435383796691895, -0.40946197509765625, -0.39457011222839355, -0.37967824935913086, -0.36478638648986816, -0.34989452362060547, -0.3350026309490204, -0.3201107680797577, -0.305218905210495, -0.2903270423412323, -0.2754351794719696, -0.2605433166027069, -0.24565143883228302, -0.23075957596302032, -0.21586771309375763, -0.20097585022449493, -0.18608398735523224, -0.17119210958480835, -0.15630024671554565, -0.14140838384628296, -0.12651652097702026, -0.11162465810775757, -0.09673279523849487, -0.08184093236923218, -0.06694906949996948, -0.05205719918012619, -0.037165336310863495, -0.0222734734416008, -0.007381603121757507, 0.007510259747505188, 0.022402122616767883, 0.03729398548603058, 0.05218585208058357, 0.06707771867513657, 0.08196958154439926, 0.09686144441366196, 0.11175331473350525, 0.12664517760276794, 0.14153704047203064, 0.15642890334129333, 0.17132076621055603, 0.18621262907981873, 0.20110449194908142, 0.21599635481834412, 0.230888232588768, 0.2457800954580307, 0.2606719732284546, 0.2755638360977173, 0.29045569896698, 0.3053475618362427, 0.32023942470550537, 0.33513128757476807, 0.35002315044403076, 0.36491501331329346, 0.37980687618255615]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 3.0, 12.0, 13.0, 14.0, 19.0, 35.0, 43.0, 67.0, 100.0, 172.0, 253.0, 395.0, 690.0, 1235.0, 1961.0, 3538.0, 5916.0, 10722.0, 21564.0, 52332.0, 142322.0, 285459.0, 284515.0, 139946.0, 51052.0, 21175.0, 10476.0, 5839.0, 3623.0, 2093.0, 1135.0, 667.0, 386.0, 264.0, 186.0, 96.0, 69.0, 40.0, 37.0, 28.0, 18.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.12109375, -0.11742305755615234, -0.11375236511230469, -0.11008167266845703, -0.10641098022460938, -0.10274028778076172, -0.09906959533691406, -0.0953989028930664, -0.09172821044921875, -0.0880575180053711, -0.08438682556152344, -0.08071613311767578, -0.07704544067382812, -0.07337474822998047, -0.06970405578613281, -0.06603336334228516, -0.0623626708984375, -0.058691978454589844, -0.05502128601074219, -0.05135059356689453, -0.047679901123046875, -0.04400920867919922, -0.04033851623535156, -0.036667823791503906, -0.03299713134765625, -0.029326438903808594, -0.025655746459960938, -0.02198505401611328, -0.018314361572265625, -0.014643669128417969, -0.010972976684570312, -0.007302284240722656, -0.003631591796875, 3.910064697265625e-05, 0.0037097930908203125, 0.007380485534667969, 0.011051177978515625, 0.014721870422363281, 0.018392562866210938, 0.022063255310058594, 0.02573394775390625, 0.029404640197753906, 0.03307533264160156, 0.03674602508544922, 0.040416717529296875, 0.04408740997314453, 0.04775810241699219, 0.051428794860839844, 0.0550994873046875, 0.058770179748535156, 0.06244087219238281, 0.06611156463623047, 0.06978225708007812, 0.07345294952392578, 0.07712364196777344, 0.0807943344116211, 0.08446502685546875, 0.0881357192993164, 0.09180641174316406, 0.09547710418701172, 0.09914779663085938, 0.10281848907470703, 0.10648918151855469, 0.11015987396240234, 0.11383056640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 10.0, 14.0, 10.0, 16.0, 17.0, 14.0, 22.0, 22.0, 22.0, 45.0, 31.0, 28.0, 36.0, 40.0, 38.0, 39.0, 38.0, 51.0, 52.0, 46.0, 49.0, 36.0, 44.0, 35.0, 28.0, 27.0, 29.0, 30.0, 28.0, 17.0, 12.0, 14.0, 9.0, 15.0, 5.0, 1.0, 6.0, 4.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0970458984375, -0.09445381164550781, -0.09186172485351562, -0.08926963806152344, -0.08667755126953125, -0.08408546447753906, -0.08149337768554688, -0.07890129089355469, -0.0763092041015625, -0.07371711730957031, -0.07112503051757812, -0.06853294372558594, -0.06594085693359375, -0.06334877014160156, -0.060756683349609375, -0.05816459655761719, -0.055572509765625, -0.05298042297363281, -0.050388336181640625, -0.04779624938964844, -0.04520416259765625, -0.04261207580566406, -0.040019989013671875, -0.03742790222167969, -0.0348358154296875, -0.03224372863769531, -0.029651641845703125, -0.027059555053710938, -0.02446746826171875, -0.021875381469726562, -0.019283294677734375, -0.016691207885742188, -0.01409912109375, -0.011507034301757812, -0.008914947509765625, -0.0063228607177734375, -0.00373077392578125, -0.0011386871337890625, 0.001453399658203125, 0.0040454864501953125, 0.0066375732421875, 0.009229660034179688, 0.011821746826171875, 0.014413833618164062, 0.01700592041015625, 0.019598007202148438, 0.022190093994140625, 0.024782180786132812, 0.027374267578125, 0.029966354370117188, 0.032558441162109375, 0.03515052795410156, 0.03774261474609375, 0.04033470153808594, 0.042926788330078125, 0.04551887512207031, 0.0481109619140625, 0.05070304870605469, 0.053295135498046875, 0.05588722229003906, 0.05847930908203125, 0.06107139587402344, 0.06366348266601562, 0.06625556945800781, 0.06884765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 14.0, 6.0, 16.0, 16.0, 38.0, 54.0, 61.0, 113.0, 217.0, 444.0, 1079.0, 2435.0, 5749.0, 14822.0, 43081.0, 183488.0, 491992.0, 224954.0, 51644.0, 16868.0, 6573.0, 2672.0, 1139.0, 489.0, 226.0, 138.0, 77.0, 49.0, 34.0, 19.0, 12.0, 12.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171630859375, -0.1654052734375, -0.1591796875, -0.1529541015625, -0.146728515625, -0.1405029296875, -0.13427734375, -0.1280517578125, -0.121826171875, -0.1156005859375, -0.109375, -0.1031494140625, -0.096923828125, -0.0906982421875, -0.08447265625, -0.0782470703125, -0.072021484375, -0.0657958984375, -0.0595703125, -0.0533447265625, -0.047119140625, -0.0408935546875, -0.03466796875, -0.0284423828125, -0.022216796875, -0.0159912109375, -0.009765625, -0.0035400390625, 0.002685546875, 0.0089111328125, 0.01513671875, 0.0213623046875, 0.027587890625, 0.0338134765625, 0.0400390625, 0.0462646484375, 0.052490234375, 0.0587158203125, 0.06494140625, 0.0711669921875, 0.077392578125, 0.0836181640625, 0.08984375, 0.0960693359375, 0.102294921875, 0.1085205078125, 0.11474609375, 0.1209716796875, 0.127197265625, 0.1334228515625, 0.1396484375, 0.1458740234375, 0.152099609375, 0.1583251953125, 0.16455078125, 0.1707763671875, 0.177001953125, 0.1832275390625, 0.189453125, 0.1956787109375, 0.201904296875, 0.2081298828125, 0.21435546875, 0.2205810546875, 0.226806640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 5.0, 9.0, 7.0, 12.0, 7.0, 20.0, 16.0, 25.0, 23.0, 28.0, 31.0, 32.0, 40.0, 37.0, 35.0, 35.0, 51.0, 40.0, 41.0, 57.0, 47.0, 46.0, 39.0, 45.0, 44.0, 29.0, 15.0, 21.0, 26.0, 26.0, 24.0, 12.0, 18.0, 9.0, 9.0, 5.0, 6.0, 8.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2489013671875, -0.24129676818847656, -0.23369216918945312, -0.2260875701904297, -0.21848297119140625, -0.2108783721923828, -0.20327377319335938, -0.19566917419433594, -0.1880645751953125, -0.18045997619628906, -0.17285537719726562, -0.1652507781982422, -0.15764617919921875, -0.1500415802001953, -0.14243698120117188, -0.13483238220214844, -0.127227783203125, -0.11962318420410156, -0.11201858520507812, -0.10441398620605469, -0.09680938720703125, -0.08920478820800781, -0.08160018920898438, -0.07399559020996094, -0.0663909912109375, -0.05878639221191406, -0.051181793212890625, -0.04357719421386719, -0.03597259521484375, -0.028367996215820312, -0.020763397216796875, -0.013158798217773438, -0.00555419921875, 0.0020503997802734375, 0.009654998779296875, 0.017259597778320312, 0.02486419677734375, 0.03246879577636719, 0.040073394775390625, 0.04767799377441406, 0.0552825927734375, 0.06288719177246094, 0.07049179077148438, 0.07809638977050781, 0.08570098876953125, 0.09330558776855469, 0.10091018676757812, 0.10851478576660156, 0.116119384765625, 0.12372398376464844, 0.13132858276367188, 0.1389331817626953, 0.14653778076171875, 0.1541423797607422, 0.16174697875976562, 0.16935157775878906, 0.1769561767578125, 0.18456077575683594, 0.19216537475585938, 0.1997699737548828, 0.20737457275390625, 0.2149791717529297, 0.22258377075195312, 0.23018836975097656, 0.23779296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 10.0, 11.0, 17.0, 31.0, 51.0, 77.0, 122.0, 205.0, 422.0, 662.0, 1382.0, 2260.0, 4401.0, 7696.0, 14093.0, 27671.0, 64560.0, 183192.0, 368363.0, 226191.0, 78963.0, 32355.0, 16214.0, 8721.0, 4872.0, 2648.0, 1513.0, 807.0, 479.0, 240.0, 129.0, 90.0, 38.0, 27.0, 15.0, 12.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049468994140625, -0.047951698303222656, -0.04643440246582031, -0.04491710662841797, -0.043399810791015625, -0.04188251495361328, -0.04036521911621094, -0.038847923278808594, -0.03733062744140625, -0.035813331604003906, -0.03429603576660156, -0.03277873992919922, -0.031261444091796875, -0.02974414825439453, -0.028226852416992188, -0.026709556579589844, -0.0251922607421875, -0.023674964904785156, -0.022157669067382812, -0.02064037322998047, -0.019123077392578125, -0.01760578155517578, -0.016088485717773438, -0.014571189880371094, -0.01305389404296875, -0.011536598205566406, -0.010019302368164062, -0.008502006530761719, -0.006984710693359375, -0.005467414855957031, -0.0039501190185546875, -0.0024328231811523438, -0.00091552734375, 0.0006017684936523438, 0.0021190643310546875, 0.0036363601684570312, 0.005153656005859375, 0.006670951843261719, 0.008188247680664062, 0.009705543518066406, 0.01122283935546875, 0.012740135192871094, 0.014257431030273438, 0.01577472686767578, 0.017292022705078125, 0.01880931854248047, 0.020326614379882812, 0.021843910217285156, 0.0233612060546875, 0.024878501892089844, 0.026395797729492188, 0.02791309356689453, 0.029430389404296875, 0.03094768524169922, 0.03246498107910156, 0.033982276916503906, 0.03549957275390625, 0.037016868591308594, 0.03853416442871094, 0.04005146026611328, 0.041568756103515625, 0.04308605194091797, 0.04460334777832031, 0.046120643615722656, 0.047637939453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 10.0, 9.0, 11.0, 10.0, 16.0, 12.0, 22.0, 41.0, 33.0, 61.0, 80.0, 92.0, 106.0, 87.0, 82.0, 78.0, 53.0, 46.0, 44.0, 26.0, 15.0, 10.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.823902130126953e-05, -1.7630867660045624e-05, -1.7022714018821716e-05, -1.641456037759781e-05, -1.58064067363739e-05, -1.5198253095149994e-05, -1.4590099453926086e-05, -1.3981945812702179e-05, -1.3373792171478271e-05, -1.2765638530254364e-05, -1.2157484889030457e-05, -1.1549331247806549e-05, -1.0941177606582642e-05, -1.0333023965358734e-05, -9.724870324134827e-06, -9.11671668291092e-06, -8.508563041687012e-06, -7.900409400463104e-06, -7.292255759239197e-06, -6.684102118015289e-06, -6.075948476791382e-06, -5.467794835567474e-06, -4.859641194343567e-06, -4.2514875531196594e-06, -3.643333911895752e-06, -3.0351802706718445e-06, -2.427026629447937e-06, -1.8188729882240295e-06, -1.210719347000122e-06, -6.025657057762146e-07, 5.587935447692871e-09, 6.137415766716003e-07, 1.2218952178955078e-06, 1.8300488591194153e-06, 2.4382025003433228e-06, 3.0463561415672302e-06, 3.6545097827911377e-06, 4.262663424015045e-06, 4.870817065238953e-06, 5.47897070646286e-06, 6.087124347686768e-06, 6.695277988910675e-06, 7.3034316301345825e-06, 7.91158527135849e-06, 8.519738912582397e-06, 9.127892553806305e-06, 9.736046195030212e-06, 1.034419983625412e-05, 1.0952353477478027e-05, 1.1560507118701935e-05, 1.2168660759925842e-05, 1.277681440114975e-05, 1.3384968042373657e-05, 1.3993121683597565e-05, 1.4601275324821472e-05, 1.520942896604538e-05, 1.5817582607269287e-05, 1.6425736248493195e-05, 1.7033889889717102e-05, 1.764204353094101e-05, 1.8250197172164917e-05, 1.8858350813388824e-05, 1.9466504454612732e-05, 2.007465809583664e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 13.0, 8.0, 17.0, 26.0, 32.0, 57.0, 75.0, 124.0, 203.0, 353.0, 598.0, 1230.0, 2256.0, 4457.0, 8705.0, 16886.0, 35025.0, 78431.0, 179793.0, 292891.0, 229586.0, 106014.0, 46432.0, 22220.0, 11199.0, 5583.0, 2836.0, 1494.0, 827.0, 472.0, 259.0, 152.0, 89.0, 49.0, 42.0, 25.0, 17.0, 19.0, 10.0, 7.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04248046875, -0.041219234466552734, -0.03995800018310547, -0.0386967658996582, -0.03743553161621094, -0.03617429733276367, -0.034913063049316406, -0.03365182876586914, -0.032390594482421875, -0.03112936019897461, -0.029868125915527344, -0.028606891632080078, -0.027345657348632812, -0.026084423065185547, -0.02482318878173828, -0.023561954498291016, -0.02230072021484375, -0.021039485931396484, -0.01977825164794922, -0.018517017364501953, -0.017255783081054688, -0.015994548797607422, -0.014733314514160156, -0.01347208023071289, -0.012210845947265625, -0.01094961166381836, -0.009688377380371094, -0.008427143096923828, -0.0071659088134765625, -0.005904674530029297, -0.004643440246582031, -0.0033822059631347656, -0.0021209716796875, -0.0008597373962402344, 0.00040149688720703125, 0.0016627311706542969, 0.0029239654541015625, 0.004185199737548828, 0.005446434020996094, 0.006707668304443359, 0.007968902587890625, 0.00923013687133789, 0.010491371154785156, 0.011752605438232422, 0.013013839721679688, 0.014275074005126953, 0.015536308288574219, 0.016797542572021484, 0.01805877685546875, 0.019320011138916016, 0.02058124542236328, 0.021842479705810547, 0.023103713989257812, 0.024364948272705078, 0.025626182556152344, 0.02688741683959961, 0.028148651123046875, 0.02940988540649414, 0.030671119689941406, 0.03193235397338867, 0.03319358825683594, 0.0344548225402832, 0.03571605682373047, 0.036977291107177734, 0.038238525390625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 9.0, 7.0, 12.0, 14.0, 22.0, 31.0, 32.0, 44.0, 44.0, 61.0, 69.0, 79.0, 79.0, 76.0, 69.0, 67.0, 57.0, 35.0, 32.0, 32.0, 17.0, 20.0, 11.0, 10.0, 7.0, 10.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0633544921875, -0.061719417572021484, -0.06008434295654297, -0.05844926834106445, -0.05681419372558594, -0.05517911911010742, -0.053544044494628906, -0.05190896987915039, -0.050273895263671875, -0.04863882064819336, -0.047003746032714844, -0.04536867141723633, -0.04373359680175781, -0.0420985221862793, -0.04046344757080078, -0.038828372955322266, -0.03719329833984375, -0.035558223724365234, -0.03392314910888672, -0.0322880744934082, -0.030652999877929688, -0.029017925262451172, -0.027382850646972656, -0.02574777603149414, -0.024112701416015625, -0.02247762680053711, -0.020842552185058594, -0.019207477569580078, -0.017572402954101562, -0.015937328338623047, -0.014302253723144531, -0.012667179107666016, -0.0110321044921875, -0.009397029876708984, -0.007761955261230469, -0.006126880645751953, -0.0044918060302734375, -0.002856731414794922, -0.0012216567993164062, 0.0004134178161621094, 0.002048492431640625, 0.0036835670471191406, 0.005318641662597656, 0.006953716278076172, 0.008588790893554688, 0.010223865509033203, 0.011858940124511719, 0.013494014739990234, 0.01512908935546875, 0.016764163970947266, 0.01839923858642578, 0.020034313201904297, 0.021669387817382812, 0.023304462432861328, 0.024939537048339844, 0.02657461166381836, 0.028209686279296875, 0.02984476089477539, 0.031479835510253906, 0.03311491012573242, 0.03474998474121094, 0.03638505935668945, 0.03802013397216797, 0.039655208587646484, 0.041290283203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 14.0, 16.0, 42.0, 77.0, 137.0, 193.0, 197.0, 166.0, 76.0, 35.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4243934154510498, -1.3868799209594727, -1.349366545677185, -1.311853051185608, -1.2743396759033203, -1.2368261814117432, -1.199312686920166, -1.1617991924285889, -1.1242858171463013, -1.0867723226547241, -1.0492589473724365, -1.0117454528808594, -0.974232017993927, -0.9367185831069946, -0.8992050886154175, -0.8616916537284851, -0.8241782188415527, -0.7866647839546204, -0.749151349067688, -0.7116378545761108, -0.6741244196891785, -0.6366109848022461, -0.599097490310669, -0.5615840554237366, -0.5240706205368042, -0.4865571856498718, -0.44904372096061707, -0.4115302562713623, -0.37401682138442993, -0.33650338649749756, -0.2989899218082428, -0.26147645711898804, -0.22396314144134521, -0.18644969165325165, -0.14893624186515808, -0.11142279207706451, -0.07390934228897095, -0.03639589250087738, 0.0011175572872161865, 0.03863102197647095, 0.07614445686340332, 0.11365790665149689, 0.15117135643959045, 0.18868480622768402, 0.2261982560157776, 0.26371169090270996, 0.3012251555919647, 0.3387386202812195, 0.37625205516815186, 0.41376549005508423, 0.451278954744339, 0.48879241943359375, 0.5263058543205261, 0.5638192892074585, 0.6013327836990356, 0.638846218585968, 0.6763596534729004, 0.7138730883598328, 0.7513865232467651, 0.7889000177383423, 0.8264134526252747, 0.863926887512207, 0.9014403820037842, 0.9389538168907166, 0.9764672517776489]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 8.0, 8.0, 15.0, 12.0, 29.0, 22.0, 29.0, 14.0, 30.0, 24.0, 23.0, 40.0, 37.0, 42.0, 33.0, 46.0, 46.0, 39.0, 41.0, 31.0, 35.0, 44.0, 38.0, 37.0, 27.0, 34.0, 19.0, 27.0, 22.0, 27.0, 20.0, 11.0, 5.0, 10.0, 17.0, 8.0, 5.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.4886553883552551, -0.4730220139026642, -0.45738863945007324, -0.4417552351951599, -0.42612186074256897, -0.410488486289978, -0.3948551118373871, -0.37922173738479614, -0.3635883331298828, -0.34795495867729187, -0.3323215842247009, -0.3166881799697876, -0.30105480551719666, -0.2854214310646057, -0.26978805661201477, -0.25415468215942383, -0.23852130770683289, -0.22288793325424194, -0.2072545439004898, -0.19162116944789886, -0.17598778009414673, -0.1603544056415558, -0.14472103118896484, -0.1290876567363739, -0.11345426738262177, -0.09782088547945023, -0.08218750357627869, -0.06655412912368774, -0.050920747220516205, -0.035287365317344666, -0.019653990864753723, -0.004020608961582184, 0.011612772941589355, 0.027246152982115746, 0.042879533022642136, 0.058512911200523376, 0.07414629310369492, 0.08977967500686646, 0.1054130494594574, 0.12104643136262894, 0.13667981326580048, 0.15231318771839142, 0.16794657707214355, 0.1835799515247345, 0.19921332597732544, 0.21484671533107758, 0.23048008978366852, 0.24611347913742065, 0.2617468535900116, 0.27738022804260254, 0.2930136024951935, 0.3086469769477844, 0.32428038120269775, 0.3399137556552887, 0.35554713010787964, 0.3711805045604706, 0.3868138790130615, 0.40244725346565247, 0.4180806279182434, 0.43371403217315674, 0.4493474066257477, 0.4649807810783386, 0.48061415553092957, 0.4962475299835205, 0.5118809342384338]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 20.0, 13.0, 25.0, 42.0, 117.0, 217.0, 479.0, 977.0, 2388.0, 6276.0, 18899.0, 64388.0, 233756.0, 734585.0, 1384374.0, 1117316.0, 449770.0, 129086.0, 34489.0, 10552.0, 3704.0, 1515.0, 675.0, 325.0, 137.0, 64.0, 35.0, 28.0, 11.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062255859375, -0.059393882751464844, -0.05653190612792969, -0.05366992950439453, -0.050807952880859375, -0.04794597625732422, -0.04508399963378906, -0.042222023010253906, -0.03936004638671875, -0.036498069763183594, -0.03363609313964844, -0.03077411651611328, -0.027912139892578125, -0.02505016326904297, -0.022188186645507812, -0.019326210021972656, -0.0164642333984375, -0.013602256774902344, -0.010740280151367188, -0.007878303527832031, -0.005016326904296875, -0.0021543502807617188, 0.0007076263427734375, 0.0035696029663085938, 0.00643157958984375, 0.009293556213378906, 0.012155532836914062, 0.015017509460449219, 0.017879486083984375, 0.02074146270751953, 0.023603439331054688, 0.026465415954589844, 0.029327392578125, 0.032189369201660156, 0.03505134582519531, 0.03791332244873047, 0.040775299072265625, 0.04363727569580078, 0.04649925231933594, 0.049361228942871094, 0.05222320556640625, 0.055085182189941406, 0.05794715881347656, 0.06080913543701172, 0.06367111206054688, 0.06653308868408203, 0.06939506530761719, 0.07225704193115234, 0.0751190185546875, 0.07798099517822266, 0.08084297180175781, 0.08370494842529297, 0.08656692504882812, 0.08942890167236328, 0.09229087829589844, 0.0951528549194336, 0.09801483154296875, 0.1008768081665039, 0.10373878479003906, 0.10660076141357422, 0.10946273803710938, 0.11232471466064453, 0.11518669128417969, 0.11804866790771484, 0.12091064453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 10.0, 8.0, 11.0, 20.0, 21.0, 17.0, 15.0, 16.0, 25.0, 30.0, 36.0, 29.0, 35.0, 35.0, 39.0, 35.0, 54.0, 36.0, 45.0, 47.0, 37.0, 44.0, 32.0, 32.0, 40.0, 37.0, 23.0, 27.0, 23.0, 16.0, 28.0, 20.0, 11.0, 5.0, 17.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.0741567611694336, -0.07171440124511719, -0.06927204132080078, -0.06682968139648438, -0.06438732147216797, -0.06194496154785156, -0.059502601623535156, -0.05706024169921875, -0.054617881774902344, -0.05217552185058594, -0.04973316192626953, -0.047290802001953125, -0.04484844207763672, -0.04240608215332031, -0.039963722229003906, -0.0375213623046875, -0.035079002380371094, -0.03263664245605469, -0.03019428253173828, -0.027751922607421875, -0.02530956268310547, -0.022867202758789062, -0.020424842834472656, -0.01798248291015625, -0.015540122985839844, -0.013097763061523438, -0.010655403137207031, -0.008213043212890625, -0.005770683288574219, -0.0033283233642578125, -0.0008859634399414062, 0.001556396484375, 0.003998756408691406, 0.0064411163330078125, 0.008883476257324219, 0.011325836181640625, 0.013768196105957031, 0.016210556030273438, 0.018652915954589844, 0.02109527587890625, 0.023537635803222656, 0.025979995727539062, 0.02842235565185547, 0.030864715576171875, 0.03330707550048828, 0.03574943542480469, 0.038191795349121094, 0.0406341552734375, 0.043076515197753906, 0.04551887512207031, 0.04796123504638672, 0.050403594970703125, 0.05284595489501953, 0.05528831481933594, 0.057730674743652344, 0.06017303466796875, 0.06261539459228516, 0.06505775451660156, 0.06750011444091797, 0.06994247436523438, 0.07238483428955078, 0.07482719421386719, 0.0772695541381836, 0.0797119140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 24.0, 33.0, 61.0, 93.0, 219.0, 429.0, 898.0, 2139.0, 5714.0, 16074.0, 52621.0, 203724.0, 972199.0, 2094644.0, 646256.0, 141131.0, 38251.0, 12105.0, 4315.0, 1767.0, 769.0, 350.0, 213.0, 97.0, 50.0, 39.0, 21.0, 13.0, 6.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1507568359375, -0.1469278335571289, -0.1430988311767578, -0.13926982879638672, -0.13544082641601562, -0.13161182403564453, -0.12778282165527344, -0.12395381927490234, -0.12012481689453125, -0.11629581451416016, -0.11246681213378906, -0.10863780975341797, -0.10480880737304688, -0.10097980499267578, -0.09715080261230469, -0.0933218002319336, -0.0894927978515625, -0.0856637954711914, -0.08183479309082031, -0.07800579071044922, -0.07417678833007812, -0.07034778594970703, -0.06651878356933594, -0.06268978118896484, -0.05886077880859375, -0.055031776428222656, -0.05120277404785156, -0.04737377166748047, -0.043544769287109375, -0.03971576690673828, -0.03588676452636719, -0.032057762145996094, -0.028228759765625, -0.024399757385253906, -0.020570755004882812, -0.01674175262451172, -0.012912750244140625, -0.009083747863769531, -0.0052547454833984375, -0.0014257431030273438, 0.00240325927734375, 0.006232261657714844, 0.010061264038085938, 0.013890266418457031, 0.017719268798828125, 0.02154827117919922, 0.025377273559570312, 0.029206275939941406, 0.0330352783203125, 0.036864280700683594, 0.04069328308105469, 0.04452228546142578, 0.048351287841796875, 0.05218029022216797, 0.05600929260253906, 0.059838294982910156, 0.06366729736328125, 0.06749629974365234, 0.07132530212402344, 0.07515430450439453, 0.07898330688476562, 0.08281230926513672, 0.08664131164550781, 0.0904703140258789, 0.09429931640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 15.0, 21.0, 26.0, 33.0, 39.0, 52.0, 76.0, 104.0, 127.0, 154.0, 228.0, 272.0, 330.0, 372.0, 396.0, 385.0, 318.0, 254.0, 210.0, 148.0, 101.0, 88.0, 68.0, 54.0, 42.0, 22.0, 30.0, 18.0, 19.0, 12.0, 7.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11474609375, -0.11117839813232422, -0.10761070251464844, -0.10404300689697266, -0.10047531127929688, -0.0969076156616211, -0.09333992004394531, -0.08977222442626953, -0.08620452880859375, -0.08263683319091797, -0.07906913757324219, -0.0755014419555664, -0.07193374633789062, -0.06836605072021484, -0.06479835510253906, -0.06123065948486328, -0.0576629638671875, -0.05409526824951172, -0.05052757263183594, -0.046959877014160156, -0.043392181396484375, -0.039824485778808594, -0.03625679016113281, -0.03268909454345703, -0.02912139892578125, -0.02555370330810547, -0.021986007690429688, -0.018418312072753906, -0.014850616455078125, -0.011282920837402344, -0.0077152252197265625, -0.004147529602050781, -0.000579833984375, 0.0029878616333007812, 0.0065555572509765625, 0.010123252868652344, 0.013690948486328125, 0.017258644104003906, 0.020826339721679688, 0.02439403533935547, 0.02796173095703125, 0.03152942657470703, 0.03509712219238281, 0.038664817810058594, 0.042232513427734375, 0.045800209045410156, 0.04936790466308594, 0.05293560028076172, 0.0565032958984375, 0.06007099151611328, 0.06363868713378906, 0.06720638275146484, 0.07077407836914062, 0.0743417739868164, 0.07790946960449219, 0.08147716522216797, 0.08504486083984375, 0.08861255645751953, 0.09218025207519531, 0.0957479476928711, 0.09931564331054688, 0.10288333892822266, 0.10645103454589844, 0.11001873016357422, 0.11358642578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 12.0, 16.0, 36.0, 73.0, 105.0, 159.0, 170.0, 148.0, 132.0, 65.0, 31.0, 20.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7154151201248169, -0.6804477572441101, -0.6454803943634033, -0.6105130314826965, -0.5755456686019897, -0.540578305721283, -0.5056109428405762, -0.4706435799598694, -0.4356762170791626, -0.4007088541984558, -0.365741491317749, -0.33077412843704224, -0.29580676555633545, -0.26083940267562866, -0.22587203979492188, -0.1909046769142151, -0.1559373140335083, -0.12096995115280151, -0.08600258827209473, -0.05103522539138794, -0.016067862510681152, 0.018899500370025635, 0.05386686325073242, 0.08883422613143921, 0.123801589012146, 0.15876895189285278, 0.19373631477355957, 0.22870367765426636, 0.26367104053497314, 0.29863840341567993, 0.3336057662963867, 0.3685731291770935, 0.40354037284851074, 0.43850773572921753, 0.4734750986099243, 0.5084424614906311, 0.5434098243713379, 0.5783771872520447, 0.6133445501327515, 0.6483119130134583, 0.683279275894165, 0.7182466387748718, 0.7532140016555786, 0.7881813645362854, 0.8231487274169922, 0.858116090297699, 0.8930834531784058, 0.9280508160591125, 0.9630181789398193, 0.9979855418205261, 1.032952904701233, 1.067920207977295, 1.1028876304626465, 1.137855052947998, 1.17282235622406, 1.207789659500122, 1.2427570819854736, 1.2777245044708252, 1.3126918077468872, 1.3476591110229492, 1.3826265335083008, 1.4175939559936523, 1.4525612592697144, 1.4875285625457764, 1.522495985031128]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 13.0, 13.0, 9.0, 10.0, 14.0, 16.0, 24.0, 31.0, 30.0, 40.0, 39.0, 35.0, 47.0, 36.0, 38.0, 33.0, 40.0, 46.0, 57.0, 53.0, 50.0, 37.0, 39.0, 45.0, 32.0, 23.0, 37.0, 28.0, 16.0, 18.0, 7.0, 13.0, 7.0, 6.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45728325843811035, -0.4416397213935852, -0.42599615454673767, -0.41035258769989014, -0.394709050655365, -0.37906551361083984, -0.3634219467639923, -0.3477783799171448, -0.33213484287261963, -0.3164913058280945, -0.30084773898124695, -0.2852041721343994, -0.26956063508987427, -0.2539170980453491, -0.2382735311985016, -0.22262997925281525, -0.2069864273071289, -0.19134287536144257, -0.17569932341575623, -0.16005577147006989, -0.14441221952438354, -0.1287686675786972, -0.11312511563301086, -0.09748156368732452, -0.08183801174163818, -0.06619445979595184, -0.0505509078502655, -0.03490735590457916, -0.019263803958892822, -0.003620252013206482, 0.012023299932479858, 0.0276668518781662, 0.04331040382385254, 0.05895395576953888, 0.07459750771522522, 0.09024105966091156, 0.1058846116065979, 0.12152816355228424, 0.13717171549797058, 0.15281526744365692, 0.16845881938934326, 0.1841023713350296, 0.19974592328071594, 0.21538947522640228, 0.23103302717208862, 0.24667657911777496, 0.2623201310634613, 0.27796369791030884, 0.293607234954834, 0.30925077199935913, 0.32489433884620667, 0.3405379056930542, 0.35618144273757935, 0.3718249797821045, 0.387468546628952, 0.40311211347579956, 0.4187556505203247, 0.43439918756484985, 0.4500427544116974, 0.4656863212585449, 0.48132985830307007, 0.4969733953475952, 0.5126169919967651, 0.5282605290412903, 0.5439040660858154]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 11.0, 14.0, 24.0, 36.0, 59.0, 85.0, 154.0, 197.0, 326.0, 599.0, 944.0, 1586.0, 2816.0, 5512.0, 12665.0, 38045.0, 126855.0, 318396.0, 332078.0, 139708.0, 41374.0, 14057.0, 5945.0, 3002.0, 1561.0, 931.0, 573.0, 371.0, 229.0, 126.0, 87.0, 55.0, 48.0, 36.0, 15.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13139724731445312, -0.12729644775390625, -0.12319564819335938, -0.1190948486328125, -0.11499404907226562, -0.11089324951171875, -0.10679244995117188, -0.102691650390625, -0.09859085083007812, -0.09449005126953125, -0.09038925170898438, -0.0862884521484375, -0.08218765258789062, -0.07808685302734375, -0.07398605346679688, -0.06988525390625, -0.06578445434570312, -0.06168365478515625, -0.057582855224609375, -0.0534820556640625, -0.049381256103515625, -0.04528045654296875, -0.041179656982421875, -0.037078857421875, -0.032978057861328125, -0.02887725830078125, -0.024776458740234375, -0.0206756591796875, -0.016574859619140625, -0.01247406005859375, -0.008373260498046875, -0.0042724609375, -0.000171661376953125, 0.00392913818359375, 0.008029937744140625, 0.0121307373046875, 0.016231536865234375, 0.02033233642578125, 0.024433135986328125, 0.028533935546875, 0.032634735107421875, 0.03673553466796875, 0.040836334228515625, 0.0449371337890625, 0.049037933349609375, 0.05313873291015625, 0.057239532470703125, 0.06134033203125, 0.06544113159179688, 0.06954193115234375, 0.07364273071289062, 0.0777435302734375, 0.08184432983398438, 0.08594512939453125, 0.09004592895507812, 0.094146728515625, 0.09824752807617188, 0.10234832763671875, 0.10644912719726562, 0.1105499267578125, 0.11465072631835938, 0.11875152587890625, 0.12285232543945312, 0.126953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 2.0, 5.0, 9.0, 10.0, 17.0, 14.0, 17.0, 12.0, 22.0, 30.0, 28.0, 31.0, 49.0, 33.0, 41.0, 44.0, 47.0, 43.0, 39.0, 56.0, 58.0, 45.0, 45.0, 36.0, 33.0, 34.0, 25.0, 23.0, 22.0, 23.0, 17.0, 12.0, 14.0, 12.0, 5.0, 5.0, 8.0, 5.0, 8.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.083251953125, -0.08035564422607422, -0.07745933532714844, -0.07456302642822266, -0.07166671752929688, -0.0687704086303711, -0.06587409973144531, -0.06297779083251953, -0.06008148193359375, -0.05718517303466797, -0.05428886413574219, -0.051392555236816406, -0.048496246337890625, -0.045599937438964844, -0.04270362854003906, -0.03980731964111328, -0.0369110107421875, -0.03401470184326172, -0.031118392944335938, -0.028222084045410156, -0.025325775146484375, -0.022429466247558594, -0.019533157348632812, -0.01663684844970703, -0.01374053955078125, -0.010844230651855469, -0.007947921752929688, -0.005051612854003906, -0.002155303955078125, 0.0007410049438476562, 0.0036373138427734375, 0.006533622741699219, 0.009429931640625, 0.012326240539550781, 0.015222549438476562, 0.018118858337402344, 0.021015167236328125, 0.023911476135253906, 0.026807785034179688, 0.02970409393310547, 0.03260040283203125, 0.03549671173095703, 0.03839302062988281, 0.041289329528808594, 0.044185638427734375, 0.047081947326660156, 0.04997825622558594, 0.05287456512451172, 0.0557708740234375, 0.05866718292236328, 0.06156349182128906, 0.06445980072021484, 0.06735610961914062, 0.0702524185180664, 0.07314872741699219, 0.07604503631591797, 0.07894134521484375, 0.08183765411376953, 0.08473396301269531, 0.0876302719116211, 0.09052658081054688, 0.09342288970947266, 0.09631919860839844, 0.09921550750732422, 0.10211181640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 10.0, 21.0, 23.0, 30.0, 53.0, 87.0, 132.0, 250.0, 430.0, 750.0, 1391.0, 2482.0, 4827.0, 9743.0, 21180.0, 51930.0, 139783.0, 288164.0, 290019.0, 141890.0, 53294.0, 21454.0, 9955.0, 4967.0, 2534.0, 1352.0, 728.0, 399.0, 246.0, 164.0, 79.0, 55.0, 40.0, 14.0, 15.0, 10.0, 12.0, 5.0, 6.0, 5.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1146240234375, -0.11104297637939453, -0.10746192932128906, -0.1038808822631836, -0.10029983520507812, -0.09671878814697266, -0.09313774108886719, -0.08955669403076172, -0.08597564697265625, -0.08239459991455078, -0.07881355285644531, -0.07523250579833984, -0.07165145874023438, -0.0680704116821289, -0.06448936462402344, -0.06090831756591797, -0.0573272705078125, -0.05374622344970703, -0.05016517639160156, -0.046584129333496094, -0.043003082275390625, -0.039422035217285156, -0.03584098815917969, -0.03225994110107422, -0.02867889404296875, -0.02509784698486328, -0.021516799926757812, -0.017935752868652344, -0.014354705810546875, -0.010773658752441406, -0.0071926116943359375, -0.0036115646362304688, -3.0517578125e-05, 0.0035505294799804688, 0.0071315765380859375, 0.010712623596191406, 0.014293670654296875, 0.017874717712402344, 0.021455764770507812, 0.02503681182861328, 0.02861785888671875, 0.03219890594482422, 0.03577995300292969, 0.039361000061035156, 0.042942047119140625, 0.046523094177246094, 0.05010414123535156, 0.05368518829345703, 0.0572662353515625, 0.06084728240966797, 0.06442832946777344, 0.0680093765258789, 0.07159042358398438, 0.07517147064208984, 0.07875251770019531, 0.08233356475830078, 0.08591461181640625, 0.08949565887451172, 0.09307670593261719, 0.09665775299072266, 0.10023880004882812, 0.1038198471069336, 0.10740089416503906, 0.11098194122314453, 0.11456298828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 2.0, 5.0, 7.0, 4.0, 13.0, 9.0, 13.0, 11.0, 13.0, 22.0, 25.0, 25.0, 29.0, 21.0, 36.0, 29.0, 40.0, 44.0, 46.0, 32.0, 37.0, 42.0, 39.0, 47.0, 35.0, 56.0, 36.0, 35.0, 39.0, 30.0, 26.0, 22.0, 26.0, 22.0, 12.0, 13.0, 11.0, 7.0, 10.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220947265625, -0.21349334716796875, -0.2060394287109375, -0.19858551025390625, -0.191131591796875, -0.18367767333984375, -0.1762237548828125, -0.16876983642578125, -0.16131591796875, -0.15386199951171875, -0.1464080810546875, -0.13895416259765625, -0.131500244140625, -0.12404632568359375, -0.1165924072265625, -0.10913848876953125, -0.1016845703125, -0.09423065185546875, -0.0867767333984375, -0.07932281494140625, -0.071868896484375, -0.06441497802734375, -0.0569610595703125, -0.04950714111328125, -0.04205322265625, -0.03459930419921875, -0.0271453857421875, -0.01969146728515625, -0.012237548828125, -0.00478363037109375, 0.0026702880859375, 0.01012420654296875, 0.017578125, 0.02503204345703125, 0.0324859619140625, 0.03993988037109375, 0.047393798828125, 0.05484771728515625, 0.0623016357421875, 0.06975555419921875, 0.07720947265625, 0.08466339111328125, 0.0921173095703125, 0.09957122802734375, 0.107025146484375, 0.11447906494140625, 0.1219329833984375, 0.12938690185546875, 0.1368408203125, 0.14429473876953125, 0.1517486572265625, 0.15920257568359375, 0.166656494140625, 0.17411041259765625, 0.1815643310546875, 0.18901824951171875, 0.19647216796875, 0.20392608642578125, 0.2113800048828125, 0.21883392333984375, 0.226287841796875, 0.23374176025390625, 0.2411956787109375, 0.24864959716796875, 0.256103515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 22.0, 27.0, 37.0, 72.0, 124.0, 200.0, 320.0, 498.0, 851.0, 1340.0, 2402.0, 4255.0, 7593.0, 14982.0, 32337.0, 80106.0, 199789.0, 324221.0, 219406.0, 89285.0, 35528.0, 16292.0, 8121.0, 4385.0, 2544.0, 1508.0, 861.0, 528.0, 343.0, 201.0, 134.0, 86.0, 56.0, 31.0, 20.0, 10.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0283660888671875, -0.027256250381469727, -0.026146411895751953, -0.02503657341003418, -0.023926734924316406, -0.022816896438598633, -0.02170705795288086, -0.020597219467163086, -0.019487380981445312, -0.01837754249572754, -0.017267704010009766, -0.016157865524291992, -0.015048027038574219, -0.013938188552856445, -0.012828350067138672, -0.011718511581420898, -0.010608673095703125, -0.009498834609985352, -0.008388996124267578, -0.007279157638549805, -0.006169319152832031, -0.005059480667114258, -0.003949642181396484, -0.002839803695678711, -0.0017299652099609375, -0.0006201267242431641, 0.0004897117614746094, 0.0015995502471923828, 0.0027093887329101562, 0.0038192272186279297, 0.004929065704345703, 0.0060389041900634766, 0.00714874267578125, 0.008258581161499023, 0.009368419647216797, 0.01047825813293457, 0.011588096618652344, 0.012697935104370117, 0.01380777359008789, 0.014917612075805664, 0.016027450561523438, 0.01713728904724121, 0.018247127532958984, 0.019356966018676758, 0.02046680450439453, 0.021576642990112305, 0.022686481475830078, 0.02379631996154785, 0.024906158447265625, 0.0260159969329834, 0.027125835418701172, 0.028235673904418945, 0.02934551239013672, 0.030455350875854492, 0.031565189361572266, 0.03267502784729004, 0.03378486633300781, 0.034894704818725586, 0.03600454330444336, 0.03711438179016113, 0.038224220275878906, 0.03933405876159668, 0.04044389724731445, 0.04155373573303223, 0.04266357421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 7.0, 19.0, 19.0, 23.0, 30.0, 43.0, 45.0, 61.0, 80.0, 85.0, 85.0, 72.0, 90.0, 77.0, 72.0, 41.0, 31.0, 29.0, 21.0, 22.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6570091247558594e-05, -1.6014091670513153e-05, -1.5458092093467712e-05, -1.4902092516422272e-05, -1.4346092939376831e-05, -1.379009336233139e-05, -1.323409378528595e-05, -1.2678094208240509e-05, -1.2122094631195068e-05, -1.1566095054149628e-05, -1.1010095477104187e-05, -1.0454095900058746e-05, -9.898096323013306e-06, -9.342096745967865e-06, -8.786097168922424e-06, -8.230097591876984e-06, -7.674098014831543e-06, -7.118098437786102e-06, -6.562098860740662e-06, -6.006099283695221e-06, -5.45009970664978e-06, -4.89410012960434e-06, -4.338100552558899e-06, -3.7821009755134583e-06, -3.2261013984680176e-06, -2.670101821422577e-06, -2.1141022443771362e-06, -1.5581026673316956e-06, -1.0021030902862549e-06, -4.461035132408142e-07, 1.0989606380462646e-07, 6.658956408500671e-07, 1.2218952178955078e-06, 1.7778947949409485e-06, 2.333894371986389e-06, 2.88989394903183e-06, 3.4458935260772705e-06, 4.001893103122711e-06, 4.557892680168152e-06, 5.1138922572135925e-06, 5.669891834259033e-06, 6.225891411304474e-06, 6.7818909883499146e-06, 7.337890565395355e-06, 7.893890142440796e-06, 8.449889719486237e-06, 9.005889296531677e-06, 9.561888873577118e-06, 1.0117888450622559e-05, 1.0673888027668e-05, 1.122988760471344e-05, 1.178588718175888e-05, 1.2341886758804321e-05, 1.2897886335849762e-05, 1.3453885912895203e-05, 1.4009885489940643e-05, 1.4565885066986084e-05, 1.5121884644031525e-05, 1.5677884221076965e-05, 1.6233883798122406e-05, 1.6789883375167847e-05, 1.7345882952213287e-05, 1.7901882529258728e-05, 1.845788210630417e-05, 1.901388168334961e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 10.0, 8.0, 6.0, 20.0, 29.0, 38.0, 66.0, 98.0, 155.0, 281.0, 477.0, 899.0, 1764.0, 3522.0, 7327.0, 15131.0, 32356.0, 72411.0, 158080.0, 264937.0, 245450.0, 133001.0, 60159.0, 26947.0, 12828.0, 6134.0, 3031.0, 1526.0, 775.0, 464.0, 234.0, 143.0, 75.0, 56.0, 44.0, 18.0, 20.0, 7.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.03582763671875, -0.03480052947998047, -0.03377342224121094, -0.032746315002441406, -0.031719207763671875, -0.030692100524902344, -0.029664993286132812, -0.02863788604736328, -0.02761077880859375, -0.02658367156982422, -0.025556564331054688, -0.024529457092285156, -0.023502349853515625, -0.022475242614746094, -0.021448135375976562, -0.02042102813720703, -0.0193939208984375, -0.01836681365966797, -0.017339706420898438, -0.016312599182128906, -0.015285491943359375, -0.014258384704589844, -0.013231277465820312, -0.012204170227050781, -0.01117706298828125, -0.010149955749511719, -0.009122848510742188, -0.008095741271972656, -0.007068634033203125, -0.006041526794433594, -0.0050144195556640625, -0.003987312316894531, -0.002960205078125, -0.0019330978393554688, -0.0009059906005859375, 0.00012111663818359375, 0.001148223876953125, 0.0021753311157226562, 0.0032024383544921875, 0.004229545593261719, 0.00525665283203125, 0.006283760070800781, 0.0073108673095703125, 0.008337974548339844, 0.009365081787109375, 0.010392189025878906, 0.011419296264648438, 0.012446403503417969, 0.0134735107421875, 0.014500617980957031, 0.015527725219726562, 0.016554832458496094, 0.017581939697265625, 0.018609046936035156, 0.019636154174804688, 0.02066326141357422, 0.02169036865234375, 0.02271747589111328, 0.023744583129882812, 0.024771690368652344, 0.025798797607421875, 0.026825904846191406, 0.027853012084960938, 0.02888011932373047, 0.0299072265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 6.0, 8.0, 4.0, 7.0, 8.0, 14.0, 11.0, 7.0, 17.0, 20.0, 21.0, 30.0, 35.0, 36.0, 38.0, 51.0, 62.0, 41.0, 65.0, 48.0, 58.0, 64.0, 50.0, 36.0, 40.0, 44.0, 26.0, 26.0, 26.0, 26.0, 14.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.03542137145996094, -0.034160614013671875, -0.03289985656738281, -0.03163909912109375, -0.030378341674804688, -0.029117584228515625, -0.027856826782226562, -0.0265960693359375, -0.025335311889648438, -0.024074554443359375, -0.022813796997070312, -0.02155303955078125, -0.020292282104492188, -0.019031524658203125, -0.017770767211914062, -0.016510009765625, -0.015249252319335938, -0.013988494873046875, -0.012727737426757812, -0.01146697998046875, -0.010206222534179688, -0.008945465087890625, -0.0076847076416015625, -0.0064239501953125, -0.0051631927490234375, -0.003902435302734375, -0.0026416778564453125, -0.00138092041015625, -0.0001201629638671875, 0.001140594482421875, 0.0024013519287109375, 0.003662109375, 0.0049228668212890625, 0.006183624267578125, 0.0074443817138671875, 0.00870513916015625, 0.009965896606445312, 0.011226654052734375, 0.012487411499023438, 0.0137481689453125, 0.015008926391601562, 0.016269683837890625, 0.017530441284179688, 0.01879119873046875, 0.020051956176757812, 0.021312713623046875, 0.022573471069335938, 0.023834228515625, 0.025094985961914062, 0.026355743408203125, 0.027616500854492188, 0.02887725830078125, 0.030138015747070312, 0.031398773193359375, 0.03265953063964844, 0.0339202880859375, 0.03518104553222656, 0.036441802978515625, 0.03770256042480469, 0.03896331787109375, 0.04022407531738281, 0.041484832763671875, 0.04274559020996094, 0.04400634765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 12.0, 15.0, 24.0, 62.0, 164.0, 226.0, 225.0, 143.0, 61.0, 34.0, 8.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1912773847579956, -1.150343656539917, -1.1094098091125488, -1.0684760808944702, -1.0275423526763916, -0.986608624458313, -0.9456748366355896, -0.9047410488128662, -0.8638073205947876, -0.822873592376709, -0.7819398045539856, -0.7410060167312622, -0.7000722885131836, -0.659138560295105, -0.6182047724723816, -0.5772709846496582, -0.5363372564315796, -0.4954034984111786, -0.4544697403907776, -0.4135359823703766, -0.3726022243499756, -0.3316684663295746, -0.2907347083091736, -0.24980095028877258, -0.20886719226837158, -0.16793343424797058, -0.12699967622756958, -0.08606591820716858, -0.04513216018676758, -0.004198402166366577, 0.036735355854034424, 0.07766911387443542, 0.11860299110412598, 0.15953674912452698, 0.20047050714492798, 0.24140426516532898, 0.28233802318573, 0.323271781206131, 0.364205539226532, 0.405139297246933, 0.446073055267334, 0.487006813287735, 0.527940571308136, 0.5688743591308594, 0.609808087348938, 0.6507418155670166, 0.69167560338974, 0.7326093912124634, 0.773543119430542, 0.8144768476486206, 0.855410635471344, 0.8963444232940674, 0.937278151512146, 0.9782118797302246, 1.0191457271575928, 1.0600794553756714, 1.10101318359375, 1.1419469118118286, 1.1828806400299072, 1.2238144874572754, 1.264748215675354, 1.3056819438934326, 1.3466157913208008, 1.3875495195388794, 1.428483247756958]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 11.0, 10.0, 7.0, 22.0, 13.0, 17.0, 24.0, 25.0, 38.0, 39.0, 35.0, 24.0, 47.0, 41.0, 50.0, 53.0, 50.0, 52.0, 45.0, 59.0, 49.0, 47.0, 45.0, 34.0, 21.0, 23.0, 32.0, 18.0, 13.0, 13.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6935819387435913, -0.6730813980102539, -0.6525807976722717, -0.6320801973342896, -0.6115796566009521, -0.5910791158676147, -0.5705785155296326, -0.5500779151916504, -0.529577374458313, -0.5090768337249756, -0.4885762333869934, -0.4680756628513336, -0.44757509231567383, -0.42707452178001404, -0.40657395124435425, -0.38607338070869446, -0.36557281017303467, -0.3450722396373749, -0.3245716691017151, -0.3040710985660553, -0.2835705280303955, -0.2630699574947357, -0.24256938695907593, -0.22206881642341614, -0.20156824588775635, -0.18106767535209656, -0.16056710481643677, -0.14006653428077698, -0.11956596374511719, -0.0990653932094574, -0.07856482267379761, -0.05806425213813782, -0.0375637412071228, -0.017063170671463013, 0.0034373998641967773, 0.023937970399856567, 0.04443854093551636, 0.06493911147117615, 0.08543968200683594, 0.10594025254249573, 0.12644082307815552, 0.1469413936138153, 0.1674419641494751, 0.1879425346851349, 0.20844310522079468, 0.22894367575645447, 0.24944424629211426, 0.26994481682777405, 0.29044538736343384, 0.31094595789909363, 0.3314465284347534, 0.3519470989704132, 0.372447669506073, 0.3929482400417328, 0.4134488105773926, 0.43394938111305237, 0.45444995164871216, 0.47495052218437195, 0.49545109272003174, 0.5159516334533691, 0.5364522337913513, 0.5569528341293335, 0.5774533748626709, 0.5979539155960083, 0.6184545159339905]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 17.0, 21.0, 37.0, 64.0, 83.0, 112.0, 180.0, 285.0, 498.0, 832.0, 1463.0, 2776.0, 5288.0, 10847.0, 23047.0, 53215.0, 127617.0, 305597.0, 634084.0, 984984.0, 953203.0, 593662.0, 285448.0, 120421.0, 49509.0, 21170.0, 9716.0, 4601.0, 2408.0, 1341.0, 690.0, 394.0, 235.0, 144.0, 89.0, 56.0, 48.0, 23.0, 14.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.07244873046875, -0.07043123245239258, -0.06841373443603516, -0.06639623641967773, -0.06437873840332031, -0.06236124038696289, -0.06034374237060547, -0.05832624435424805, -0.056308746337890625, -0.0542912483215332, -0.05227375030517578, -0.05025625228881836, -0.04823875427246094, -0.046221256256103516, -0.044203758239746094, -0.04218626022338867, -0.04016876220703125, -0.03815126419067383, -0.036133766174316406, -0.034116268157958984, -0.03209877014160156, -0.03008127212524414, -0.02806377410888672, -0.026046276092529297, -0.024028778076171875, -0.022011280059814453, -0.01999378204345703, -0.01797628402709961, -0.015958786010742188, -0.013941287994384766, -0.011923789978027344, -0.009906291961669922, -0.0078887939453125, -0.005871295928955078, -0.0038537979125976562, -0.0018362998962402344, 0.0001811981201171875, 0.0021986961364746094, 0.004216194152832031, 0.006233692169189453, 0.008251190185546875, 0.010268688201904297, 0.012286186218261719, 0.01430368423461914, 0.016321182250976562, 0.018338680267333984, 0.020356178283691406, 0.022373676300048828, 0.02439117431640625, 0.026408672332763672, 0.028426170349121094, 0.030443668365478516, 0.03246116638183594, 0.03447866439819336, 0.03649616241455078, 0.0385136604309082, 0.040531158447265625, 0.04254865646362305, 0.04456615447998047, 0.04658365249633789, 0.04860115051269531, 0.050618648529052734, 0.052636146545410156, 0.05465364456176758, 0.056671142578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 13.0, 8.0, 8.0, 13.0, 14.0, 19.0, 19.0, 17.0, 22.0, 29.0, 30.0, 36.0, 35.0, 39.0, 37.0, 39.0, 54.0, 47.0, 50.0, 47.0, 53.0, 44.0, 42.0, 37.0, 45.0, 31.0, 20.0, 21.0, 20.0, 24.0, 17.0, 12.0, 18.0, 10.0, 9.0, 1.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.084228515625, -0.08170890808105469, -0.07918930053710938, -0.07666969299316406, -0.07415008544921875, -0.07163047790527344, -0.06911087036132812, -0.06659126281738281, -0.0640716552734375, -0.06155204772949219, -0.059032440185546875, -0.05651283264160156, -0.05399322509765625, -0.05147361755371094, -0.048954010009765625, -0.04643440246582031, -0.043914794921875, -0.04139518737792969, -0.038875579833984375, -0.03635597229003906, -0.03383636474609375, -0.03131675720214844, -0.028797149658203125, -0.026277542114257812, -0.0237579345703125, -0.021238327026367188, -0.018718719482421875, -0.016199111938476562, -0.01367950439453125, -0.011159896850585938, -0.008640289306640625, -0.0061206817626953125, -0.00360107421875, -0.0010814666748046875, 0.001438140869140625, 0.0039577484130859375, 0.00647735595703125, 0.008996963500976562, 0.011516571044921875, 0.014036178588867188, 0.0165557861328125, 0.019075393676757812, 0.021595001220703125, 0.024114608764648438, 0.02663421630859375, 0.029153823852539062, 0.031673431396484375, 0.03419303894042969, 0.036712646484375, 0.03923225402832031, 0.041751861572265625, 0.04427146911621094, 0.04679107666015625, 0.04931068420410156, 0.051830291748046875, 0.05434989929199219, 0.0568695068359375, 0.05938911437988281, 0.061908721923828125, 0.06442832946777344, 0.06694793701171875, 0.06946754455566406, 0.07198715209960938, 0.07450675964355469, 0.0770263671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 12.0, 18.0, 38.0, 66.0, 131.0, 209.0, 476.0, 1137.0, 3225.0, 11349.0, 53841.0, 432900.0, 2896172.0, 697317.0, 76164.0, 14768.0, 3920.0, 1426.0, 584.0, 237.0, 113.0, 83.0, 43.0, 20.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.19623184204101562, -0.19055938720703125, -0.18488693237304688, -0.1792144775390625, -0.17354202270507812, -0.16786956787109375, -0.16219711303710938, -0.156524658203125, -0.15085220336914062, -0.14517974853515625, -0.13950729370117188, -0.1338348388671875, -0.12816238403320312, -0.12248992919921875, -0.11681747436523438, -0.11114501953125, -0.10547256469726562, -0.09980010986328125, -0.09412765502929688, -0.0884552001953125, -0.08278274536132812, -0.07711029052734375, -0.07143783569335938, -0.065765380859375, -0.060092926025390625, -0.05442047119140625, -0.048748016357421875, -0.0430755615234375, -0.037403106689453125, -0.03173065185546875, -0.026058197021484375, -0.0203857421875, -0.014713287353515625, -0.00904083251953125, -0.003368377685546875, 0.0023040771484375, 0.007976531982421875, 0.01364898681640625, 0.019321441650390625, 0.024993896484375, 0.030666351318359375, 0.03633880615234375, 0.042011260986328125, 0.0476837158203125, 0.053356170654296875, 0.05902862548828125, 0.06470108032226562, 0.07037353515625, 0.07604598999023438, 0.08171844482421875, 0.08739089965820312, 0.0930633544921875, 0.09873580932617188, 0.10440826416015625, 0.11008071899414062, 0.115753173828125, 0.12142562866210938, 0.12709808349609375, 0.13277053833007812, 0.1384429931640625, 0.14411544799804688, 0.14978790283203125, 0.15546035766601562, 0.1611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 13.0, 10.0, 32.0, 37.0, 58.0, 87.0, 148.0, 228.0, 339.0, 514.0, 646.0, 622.0, 453.0, 287.0, 197.0, 117.0, 94.0, 55.0, 30.0, 32.0, 22.0, 11.0, 8.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.1806507110595703, -0.17514419555664062, -0.16963768005371094, -0.16413116455078125, -0.15862464904785156, -0.15311813354492188, -0.1476116180419922, -0.1421051025390625, -0.1365985870361328, -0.13109207153320312, -0.12558555603027344, -0.12007904052734375, -0.11457252502441406, -0.10906600952148438, -0.10355949401855469, -0.098052978515625, -0.09254646301269531, -0.08703994750976562, -0.08153343200683594, -0.07602691650390625, -0.07052040100097656, -0.06501388549804688, -0.05950736999511719, -0.0540008544921875, -0.04849433898925781, -0.042987823486328125, -0.03748130798339844, -0.03197479248046875, -0.026468276977539062, -0.020961761474609375, -0.015455245971679688, -0.00994873046875, -0.0044422149658203125, 0.001064300537109375, 0.0065708160400390625, 0.01207733154296875, 0.017583847045898438, 0.023090362548828125, 0.028596878051757812, 0.0341033935546875, 0.03960990905761719, 0.045116424560546875, 0.05062294006347656, 0.05612945556640625, 0.06163597106933594, 0.06714248657226562, 0.07264900207519531, 0.078155517578125, 0.08366203308105469, 0.08916854858398438, 0.09467506408691406, 0.10018157958984375, 0.10568809509277344, 0.11119461059570312, 0.11670112609863281, 0.1222076416015625, 0.1277141571044922, 0.13322067260742188, 0.13872718811035156, 0.14423370361328125, 0.14974021911621094, 0.15524673461914062, 0.1607532501220703, 0.166259765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 17.0, 28.0, 49.0, 110.0, 157.0, 178.0, 172.0, 115.0, 72.0, 45.0, 20.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0852274894714355, -1.0457690954208374, -1.0063108205795288, -0.9668524265289307, -0.9273940920829773, -0.8879357576370239, -0.8484773635864258, -0.8090190291404724, -0.769560694694519, -0.7301023602485657, -0.6906439661979675, -0.6511856317520142, -0.6117272973060608, -0.5722689628601074, -0.5328105688095093, -0.4933522343635559, -0.45389384031295776, -0.414435476064682, -0.37497714161872864, -0.3355187773704529, -0.2960604429244995, -0.25660207867622375, -0.217143714427948, -0.17768537998199463, -0.13822701573371887, -0.09876866638660431, -0.05931030958890915, -0.01985195279121399, 0.019606396555900574, 0.05906474590301514, 0.0985231101512909, 0.13798144459724426, 0.17743980884552002, 0.21689815819263458, 0.25635650753974915, 0.2958148717880249, 0.33527320623397827, 0.37473157048225403, 0.4141899347305298, 0.45364826917648315, 0.4931066334247589, 0.5325649976730347, 0.572023332118988, 0.6114816665649414, 0.6509400606155396, 0.6903983950614929, 0.7298567295074463, 0.7693151235580444, 0.8087734580039978, 0.8482317924499512, 0.8876901865005493, 0.9271485209465027, 0.966606855392456, 1.0060652494430542, 1.0455236434936523, 1.084981918334961, 1.124440312385559, 1.1638987064361572, 1.2033569812774658, 1.242815375328064, 1.282273769378662, 1.3217320442199707, 1.3611904382705688, 1.400648832321167, 1.4401071071624756]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 18.0, 15.0, 36.0, 28.0, 31.0, 29.0, 25.0, 37.0, 45.0, 36.0, 40.0, 38.0, 32.0, 44.0, 47.0, 45.0, 40.0, 48.0, 46.0, 40.0, 29.0, 31.0, 29.0, 22.0, 23.0, 26.0, 14.0, 17.0, 11.0, 12.0, 6.0, 3.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.48263466358184814, -0.4694255590438843, -0.4562164545059204, -0.44300737977027893, -0.42979827523231506, -0.4165891706943512, -0.4033800959587097, -0.39017099142074585, -0.376961886882782, -0.3637527823448181, -0.35054367780685425, -0.33733460307121277, -0.3241254985332489, -0.31091639399528503, -0.29770731925964355, -0.2844982147216797, -0.2712891101837158, -0.25808000564575195, -0.24487091600894928, -0.2316618263721466, -0.21845272183418274, -0.20524361729621887, -0.1920345276594162, -0.17882543802261353, -0.16561633348464966, -0.1524072289466858, -0.13919813930988312, -0.12598904967308044, -0.11277994513511658, -0.0995708480477333, -0.08636175096035004, -0.07315265387296677, -0.059943556785583496, -0.046734459698200226, -0.033525362610816956, -0.020316265523433685, -0.007107168436050415, 0.006101928651332855, 0.019311025738716125, 0.032520122826099396, 0.045729219913482666, 0.058938317000865936, 0.0721474140882492, 0.08535651117563248, 0.09856560826301575, 0.11177470535039902, 0.12498380243778229, 0.13819289207458496, 0.15140199661254883, 0.1646111011505127, 0.17782019078731537, 0.19102928042411804, 0.2042383849620819, 0.21744748950004578, 0.23065657913684845, 0.24386566877365112, 0.257074773311615, 0.27028387784957886, 0.2834929823875427, 0.2967020571231842, 0.30991116166114807, 0.32312026619911194, 0.3363293409347534, 0.3495384454727173, 0.36274755001068115]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 9.0, 14.0, 19.0, 30.0, 41.0, 53.0, 79.0, 95.0, 152.0, 217.0, 368.0, 609.0, 924.0, 1695.0, 2878.0, 5045.0, 9119.0, 16546.0, 30240.0, 55005.0, 94044.0, 145743.0, 183626.0, 178149.0, 133529.0, 83279.0, 47349.0, 26341.0, 14495.0, 8101.0, 4350.0, 2578.0, 1459.0, 837.0, 559.0, 340.0, 200.0, 132.0, 90.0, 72.0, 42.0, 29.0, 16.0, 16.0, 11.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0654296875, -0.06337738037109375, -0.0613250732421875, -0.05927276611328125, -0.057220458984375, -0.05516815185546875, -0.0531158447265625, -0.05106353759765625, -0.04901123046875, -0.04695892333984375, -0.0449066162109375, -0.04285430908203125, -0.040802001953125, -0.03874969482421875, -0.0366973876953125, -0.03464508056640625, -0.0325927734375, -0.03054046630859375, -0.0284881591796875, -0.02643585205078125, -0.024383544921875, -0.02233123779296875, -0.0202789306640625, -0.01822662353515625, -0.01617431640625, -0.01412200927734375, -0.0120697021484375, -0.01001739501953125, -0.007965087890625, -0.00591278076171875, -0.0038604736328125, -0.00180816650390625, 0.000244140625, 0.00229644775390625, 0.0043487548828125, 0.00640106201171875, 0.008453369140625, 0.01050567626953125, 0.0125579833984375, 0.01461029052734375, 0.01666259765625, 0.01871490478515625, 0.0207672119140625, 0.02281951904296875, 0.024871826171875, 0.02692413330078125, 0.0289764404296875, 0.03102874755859375, 0.0330810546875, 0.03513336181640625, 0.0371856689453125, 0.03923797607421875, 0.041290283203125, 0.04334259033203125, 0.0453948974609375, 0.04744720458984375, 0.04949951171875, 0.05155181884765625, 0.0536041259765625, 0.05565643310546875, 0.057708740234375, 0.05976104736328125, 0.0618133544921875, 0.06386566162109375, 0.06591796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 2.0, 7.0, 10.0, 15.0, 24.0, 20.0, 18.0, 26.0, 22.0, 34.0, 28.0, 54.0, 49.0, 56.0, 38.0, 58.0, 53.0, 46.0, 45.0, 45.0, 47.0, 41.0, 51.0, 32.0, 31.0, 28.0, 17.0, 10.0, 17.0, 13.0, 10.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09053230285644531, -0.08737564086914062, -0.08421897888183594, -0.08106231689453125, -0.07790565490722656, -0.07474899291992188, -0.07159233093261719, -0.0684356689453125, -0.06527900695800781, -0.062122344970703125, -0.05896568298339844, -0.05580902099609375, -0.05265235900878906, -0.049495697021484375, -0.04633903503417969, -0.043182373046875, -0.04002571105957031, -0.036869049072265625, -0.03371238708496094, -0.03055572509765625, -0.027399063110351562, -0.024242401123046875, -0.021085739135742188, -0.0179290771484375, -0.014772415161132812, -0.011615753173828125, -0.008459091186523438, -0.00530242919921875, -0.0021457672119140625, 0.001010894775390625, 0.0041675567626953125, 0.00732421875, 0.010480880737304688, 0.013637542724609375, 0.016794204711914062, 0.01995086669921875, 0.023107528686523438, 0.026264190673828125, 0.029420852661132812, 0.0325775146484375, 0.03573417663574219, 0.038890838623046875, 0.04204750061035156, 0.04520416259765625, 0.04836082458496094, 0.051517486572265625, 0.05467414855957031, 0.057830810546875, 0.06098747253417969, 0.06414413452148438, 0.06730079650878906, 0.07045745849609375, 0.07361412048339844, 0.07677078247070312, 0.07992744445800781, 0.0830841064453125, 0.08624076843261719, 0.08939743041992188, 0.09255409240722656, 0.09571075439453125, 0.09886741638183594, 0.10202407836914062, 0.10518074035644531, 0.10833740234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 11.0, 21.0, 32.0, 22.0, 41.0, 49.0, 110.0, 188.0, 241.0, 424.0, 827.0, 1456.0, 2663.0, 4890.0, 9677.0, 18661.0, 37638.0, 72459.0, 133107.0, 207941.0, 236409.0, 149370.0, 84106.0, 42934.0, 21782.0, 10992.0, 5739.0, 3011.0, 1581.0, 896.0, 501.0, 304.0, 155.0, 108.0, 62.0, 53.0, 31.0, 20.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.0666341781616211, -0.06417655944824219, -0.06171894073486328, -0.059261322021484375, -0.05680370330810547, -0.05434608459472656, -0.051888465881347656, -0.04943084716796875, -0.046973228454589844, -0.04451560974121094, -0.04205799102783203, -0.039600372314453125, -0.03714275360107422, -0.03468513488769531, -0.032227516174316406, -0.0297698974609375, -0.027312278747558594, -0.024854660034179688, -0.02239704132080078, -0.019939422607421875, -0.01748180389404297, -0.015024185180664062, -0.012566566467285156, -0.01010894775390625, -0.007651329040527344, -0.0051937103271484375, -0.0027360916137695312, -0.000278472900390625, 0.0021791458129882812, 0.0046367645263671875, 0.007094383239746094, 0.009552001953125, 0.012009620666503906, 0.014467239379882812, 0.01692485809326172, 0.019382476806640625, 0.02184009552001953, 0.024297714233398438, 0.026755332946777344, 0.02921295166015625, 0.031670570373535156, 0.03412818908691406, 0.03658580780029297, 0.039043426513671875, 0.04150104522705078, 0.04395866394042969, 0.046416282653808594, 0.0488739013671875, 0.051331520080566406, 0.05378913879394531, 0.05624675750732422, 0.058704376220703125, 0.06116199493408203, 0.06361961364746094, 0.06607723236083984, 0.06853485107421875, 0.07099246978759766, 0.07345008850097656, 0.07590770721435547, 0.07836532592773438, 0.08082294464111328, 0.08328056335449219, 0.0857381820678711, 0.08819580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 10.0, 10.0, 9.0, 9.0, 18.0, 13.0, 29.0, 27.0, 28.0, 47.0, 32.0, 37.0, 46.0, 57.0, 51.0, 54.0, 60.0, 43.0, 44.0, 58.0, 45.0, 42.0, 43.0, 24.0, 26.0, 33.0, 23.0, 12.0, 15.0, 10.0, 15.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.328857421875, -0.32010650634765625, -0.3113555908203125, -0.30260467529296875, -0.293853759765625, -0.28510284423828125, -0.2763519287109375, -0.26760101318359375, -0.25885009765625, -0.25009918212890625, -0.2413482666015625, -0.23259735107421875, -0.223846435546875, -0.21509552001953125, -0.2063446044921875, -0.19759368896484375, -0.1888427734375, -0.18009185791015625, -0.1713409423828125, -0.16259002685546875, -0.153839111328125, -0.14508819580078125, -0.1363372802734375, -0.12758636474609375, -0.11883544921875, -0.11008453369140625, -0.1013336181640625, -0.09258270263671875, -0.083831787109375, -0.07508087158203125, -0.0663299560546875, -0.05757904052734375, -0.048828125, -0.04007720947265625, -0.0313262939453125, -0.02257537841796875, -0.013824462890625, -0.00507354736328125, 0.0036773681640625, 0.01242828369140625, 0.02117919921875, 0.02993011474609375, 0.0386810302734375, 0.04743194580078125, 0.056182861328125, 0.06493377685546875, 0.0736846923828125, 0.08243560791015625, 0.0911865234375, 0.09993743896484375, 0.1086883544921875, 0.11743927001953125, 0.126190185546875, 0.13494110107421875, 0.1436920166015625, 0.15244293212890625, 0.16119384765625, 0.16994476318359375, 0.1786956787109375, 0.18744659423828125, 0.196197509765625, 0.20494842529296875, 0.2136993408203125, 0.22245025634765625, 0.231201171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 9.0, 15.0, 19.0, 25.0, 49.0, 94.0, 140.0, 232.0, 319.0, 598.0, 974.0, 1792.0, 3437.0, 6500.0, 12872.0, 24868.0, 47668.0, 88968.0, 154008.0, 241748.0, 197339.0, 123474.0, 68167.0, 36026.0, 18622.0, 9652.0, 4907.0, 2576.0, 1445.0, 806.0, 444.0, 256.0, 184.0, 109.0, 73.0, 44.0, 29.0, 25.0, 13.0, 8.0, 10.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016353845596313477, -0.015785694122314453, -0.01521754264831543, -0.014649391174316406, -0.014081239700317383, -0.01351308822631836, -0.012944936752319336, -0.012376785278320312, -0.011808633804321289, -0.011240482330322266, -0.010672330856323242, -0.010104179382324219, -0.009536027908325195, -0.008967876434326172, -0.008399724960327148, -0.007831573486328125, -0.0072634220123291016, -0.006695270538330078, -0.006127119064331055, -0.005558967590332031, -0.004990816116333008, -0.004422664642333984, -0.003854513168334961, -0.0032863616943359375, -0.002718210220336914, -0.0021500587463378906, -0.0015819072723388672, -0.0010137557983398438, -0.0004456043243408203, 0.00012254714965820312, 0.0006906986236572266, 0.00125885009765625, 0.0018270015716552734, 0.002395153045654297, 0.0029633045196533203, 0.0035314559936523438, 0.004099607467651367, 0.004667758941650391, 0.005235910415649414, 0.0058040618896484375, 0.006372213363647461, 0.006940364837646484, 0.007508516311645508, 0.008076667785644531, 0.008644819259643555, 0.009212970733642578, 0.009781122207641602, 0.010349273681640625, 0.010917425155639648, 0.011485576629638672, 0.012053728103637695, 0.012621879577636719, 0.013190031051635742, 0.013758182525634766, 0.014326333999633789, 0.014894485473632812, 0.015462636947631836, 0.01603078842163086, 0.016598939895629883, 0.017167091369628906, 0.01773524284362793, 0.018303394317626953, 0.018871545791625977, 0.019439697265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 2.0, 8.0, 10.0, 6.0, 12.0, 12.0, 17.0, 16.0, 23.0, 19.0, 34.0, 32.0, 25.0, 27.0, 31.0, 46.0, 52.0, 64.0, 49.0, 49.0, 46.0, 45.0, 33.0, 43.0, 37.0, 33.0, 43.0, 26.0, 28.0, 14.0, 15.0, 18.0, 16.0, 11.0, 13.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.0728836059570312e-05, -1.043267548084259e-05, -1.0136514902114868e-05, -9.840354323387146e-06, -9.544193744659424e-06, -9.248033165931702e-06, -8.95187258720398e-06, -8.655712008476257e-06, -8.359551429748535e-06, -8.063390851020813e-06, -7.76723027229309e-06, -7.471069693565369e-06, -7.1749091148376465e-06, -6.878748536109924e-06, -6.582587957382202e-06, -6.28642737865448e-06, -5.990266799926758e-06, -5.694106221199036e-06, -5.3979456424713135e-06, -5.101785063743591e-06, -4.805624485015869e-06, -4.509463906288147e-06, -4.213303327560425e-06, -3.917142748832703e-06, -3.6209821701049805e-06, -3.3248215913772583e-06, -3.028661012649536e-06, -2.732500433921814e-06, -2.436339855194092e-06, -2.1401792764663696e-06, -1.8440186977386475e-06, -1.5478581190109253e-06, -1.2516975402832031e-06, -9.55536961555481e-07, -6.593763828277588e-07, -3.632158041000366e-07, -6.705522537231445e-08, 2.2910535335540771e-07, 5.252659320831299e-07, 8.21426510810852e-07, 1.1175870895385742e-06, 1.4137476682662964e-06, 1.7099082469940186e-06, 2.0060688257217407e-06, 2.302229404449463e-06, 2.598389983177185e-06, 2.8945505619049072e-06, 3.1907111406326294e-06, 3.4868717193603516e-06, 3.7830322980880737e-06, 4.079192876815796e-06, 4.375353455543518e-06, 4.67151403427124e-06, 4.967674612998962e-06, 5.2638351917266846e-06, 5.559995770454407e-06, 5.856156349182129e-06, 6.152316927909851e-06, 6.448477506637573e-06, 6.744638085365295e-06, 7.040798664093018e-06, 7.33695924282074e-06, 7.633119821548462e-06, 7.929280400276184e-06, 8.225440979003906e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 7.0, 9.0, 14.0, 10.0, 19.0, 41.0, 51.0, 85.0, 119.0, 239.0, 350.0, 558.0, 898.0, 1574.0, 2774.0, 4848.0, 8457.0, 15236.0, 28629.0, 51307.0, 90607.0, 145030.0, 214628.0, 183814.0, 126859.0, 76168.0, 43119.0, 23416.0, 12833.0, 7172.0, 4010.0, 2314.0, 1297.0, 732.0, 497.0, 283.0, 192.0, 107.0, 82.0, 50.0, 34.0, 22.0, 20.0, 9.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0172882080078125, -0.016727685928344727, -0.016167163848876953, -0.01560664176940918, -0.015046119689941406, -0.014485597610473633, -0.01392507553100586, -0.013364553451538086, -0.012804031372070312, -0.012243509292602539, -0.011682987213134766, -0.011122465133666992, -0.010561943054199219, -0.010001420974731445, -0.009440898895263672, -0.008880376815795898, -0.008319854736328125, -0.0077593326568603516, -0.007198810577392578, -0.006638288497924805, -0.006077766418457031, -0.005517244338989258, -0.004956722259521484, -0.004396200180053711, -0.0038356781005859375, -0.003275156021118164, -0.0027146339416503906, -0.002154111862182617, -0.0015935897827148438, -0.0010330677032470703, -0.0004725456237792969, 8.797645568847656e-05, 0.00064849853515625, 0.0012090206146240234, 0.0017695426940917969, 0.0023300647735595703, 0.0028905868530273438, 0.003451108932495117, 0.004011631011962891, 0.004572153091430664, 0.0051326751708984375, 0.005693197250366211, 0.006253719329833984, 0.006814241409301758, 0.007374763488769531, 0.007935285568237305, 0.008495807647705078, 0.009056329727172852, 0.009616851806640625, 0.010177373886108398, 0.010737895965576172, 0.011298418045043945, 0.011858940124511719, 0.012419462203979492, 0.012979984283447266, 0.013540506362915039, 0.014101028442382812, 0.014661550521850586, 0.01522207260131836, 0.015782594680786133, 0.016343116760253906, 0.01690363883972168, 0.017464160919189453, 0.018024682998657227, 0.018585205078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 1.0, 5.0, 7.0, 6.0, 12.0, 16.0, 18.0, 20.0, 21.0, 29.0, 35.0, 35.0, 45.0, 52.0, 38.0, 45.0, 57.0, 49.0, 50.0, 42.0, 44.0, 52.0, 39.0, 41.0, 29.0, 34.0, 30.0, 22.0, 20.0, 12.0, 13.0, 11.0, 16.0, 11.0, 5.0, 10.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0311737060546875, -0.030230045318603516, -0.02928638458251953, -0.028342723846435547, -0.027399063110351562, -0.026455402374267578, -0.025511741638183594, -0.02456808090209961, -0.023624420166015625, -0.02268075942993164, -0.021737098693847656, -0.020793437957763672, -0.019849777221679688, -0.018906116485595703, -0.01796245574951172, -0.017018795013427734, -0.01607513427734375, -0.015131473541259766, -0.014187812805175781, -0.013244152069091797, -0.012300491333007812, -0.011356830596923828, -0.010413169860839844, -0.00946950912475586, -0.008525848388671875, -0.007582187652587891, -0.006638526916503906, -0.005694866180419922, -0.0047512054443359375, -0.003807544708251953, -0.0028638839721679688, -0.0019202232360839844, -0.0009765625, -3.2901763916015625e-05, 0.0009107589721679688, 0.0018544197082519531, 0.0027980804443359375, 0.003741741180419922, 0.004685401916503906, 0.005629062652587891, 0.006572723388671875, 0.007516384124755859, 0.008460044860839844, 0.009403705596923828, 0.010347366333007812, 0.011291027069091797, 0.012234687805175781, 0.013178348541259766, 0.01412200927734375, 0.015065670013427734, 0.01600933074951172, 0.016952991485595703, 0.017896652221679688, 0.018840312957763672, 0.019783973693847656, 0.02072763442993164, 0.021671295166015625, 0.02261495590209961, 0.023558616638183594, 0.024502277374267578, 0.025445938110351562, 0.026389598846435547, 0.02733325958251953, 0.028276920318603516, 0.0292205810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 18.0, 20.0, 44.0, 72.0, 89.0, 116.0, 149.0, 156.0, 105.0, 93.0, 50.0, 35.0, 12.0, 9.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0282689332962036, -1.005516529083252, -0.9827641844749451, -0.9600118398666382, -0.9372594952583313, -0.9145071506500244, -0.8917547464370728, -0.8690024018287659, -0.846250057220459, -0.8234977126121521, -0.8007453083992004, -0.7779929637908936, -0.7552406191825867, -0.7324882745742798, -0.7097358703613281, -0.6869835257530212, -0.6642311811447144, -0.6414788365364075, -0.6187264323234558, -0.5959740877151489, -0.573221743106842, -0.5504693984985352, -0.5277169942855835, -0.5049646496772766, -0.48221224546432495, -0.4594598710536957, -0.4367075264453888, -0.4139551520347595, -0.39120280742645264, -0.36845043301582336, -0.3456980586051941, -0.3229457139968872, -0.30019333958625793, -0.27744096517562866, -0.2546886205673218, -0.2319362461566925, -0.20918390154838562, -0.18643152713775635, -0.16367916762828827, -0.1409268081188202, -0.11817444860935211, -0.09542208909988403, -0.07266972959041595, -0.04991736263036728, -0.0271650031208992, -0.004412643611431122, 0.018339723348617554, 0.04109208285808563, 0.06384444236755371, 0.08659680187702179, 0.10934916138648987, 0.13210153579711914, 0.15485388040542603, 0.1776062548160553, 0.20035861432552338, 0.22311097383499146, 0.24586333334445953, 0.2686156928539276, 0.2913680672645569, 0.31412041187286377, 0.33687278628349304, 0.3596251308917999, 0.3823775053024292, 0.4051298499107361, 0.42788222432136536]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 7.0, 15.0, 11.0, 24.0, 21.0, 20.0, 32.0, 28.0, 28.0, 33.0, 36.0, 37.0, 49.0, 47.0, 55.0, 52.0, 56.0, 46.0, 56.0, 28.0, 46.0, 36.0, 41.0, 43.0, 24.0, 31.0, 23.0, 11.0, 10.0, 14.0, 9.0, 4.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7194504141807556, -0.6988180875778198, -0.678185760974884, -0.6575534343719482, -0.6369211077690125, -0.6162887811660767, -0.5956564545631409, -0.5750241279602051, -0.5543918013572693, -0.5337594747543335, -0.5131271481513977, -0.4924948215484619, -0.4718624949455261, -0.45123016834259033, -0.43059784173965454, -0.40996551513671875, -0.38933318853378296, -0.36870086193084717, -0.3480685353279114, -0.3274362087249756, -0.3068038821220398, -0.286171555519104, -0.2655392289161682, -0.24490690231323242, -0.22427457571029663, -0.20364224910736084, -0.18300992250442505, -0.16237759590148926, -0.14174526929855347, -0.12111294269561768, -0.10048061609268188, -0.0798482894897461, -0.0592159628868103, -0.03858363628387451, -0.01795130968093872, 0.0026810169219970703, 0.02331334352493286, 0.04394567012786865, 0.06457799673080444, 0.08521032333374023, 0.10584264993667603, 0.12647497653961182, 0.1471073031425476, 0.1677396297454834, 0.1883719563484192, 0.20900428295135498, 0.22963660955429077, 0.25026893615722656, 0.27090126276016235, 0.29153358936309814, 0.31216591596603394, 0.3327982425689697, 0.3534305691719055, 0.3740628957748413, 0.3946952223777771, 0.4153275489807129, 0.4359598755836487, 0.4565922021865845, 0.47722452878952026, 0.49785685539245605, 0.5184891819953918, 0.5391215085983276, 0.5597538352012634, 0.5803861618041992, 0.601018488407135]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 17.0, 18.0, 21.0, 35.0, 56.0, 81.0, 137.0, 205.0, 378.0, 671.0, 1187.0, 2269.0, 4569.0, 10077.0, 24645.0, 62124.0, 155652.0, 350430.0, 635717.0, 853271.0, 844392.0, 623481.0, 356575.0, 161065.0, 63784.0, 24327.0, 9877.0, 4393.0, 2125.0, 1081.0, 596.0, 383.0, 240.0, 151.0, 93.0, 56.0, 30.0, 26.0, 18.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05841064453125, -0.056396484375, -0.05438232421875, -0.0523681640625, -0.05035400390625, -0.04833984375, -0.04632568359375, -0.0443115234375, -0.04229736328125, -0.040283203125, -0.03826904296875, -0.0362548828125, -0.03424072265625, -0.0322265625, -0.03021240234375, -0.0281982421875, -0.02618408203125, -0.024169921875, -0.02215576171875, -0.0201416015625, -0.01812744140625, -0.01611328125, -0.01409912109375, -0.0120849609375, -0.01007080078125, -0.008056640625, -0.00604248046875, -0.0040283203125, -0.00201416015625, 0.0, 0.00201416015625, 0.0040283203125, 0.00604248046875, 0.008056640625, 0.01007080078125, 0.0120849609375, 0.01409912109375, 0.01611328125, 0.01812744140625, 0.0201416015625, 0.02215576171875, 0.024169921875, 0.02618408203125, 0.0281982421875, 0.03021240234375, 0.0322265625, 0.03424072265625, 0.0362548828125, 0.03826904296875, 0.040283203125, 0.04229736328125, 0.0443115234375, 0.04632568359375, 0.04833984375, 0.05035400390625, 0.0523681640625, 0.05438232421875, 0.056396484375, 0.05841064453125, 0.0604248046875, 0.06243896484375, 0.064453125, 0.06646728515625, 0.0684814453125, 0.07049560546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 18.0, 15.0, 15.0, 29.0, 31.0, 27.0, 24.0, 25.0, 32.0, 34.0, 33.0, 38.0, 49.0, 40.0, 47.0, 39.0, 29.0, 41.0, 47.0, 33.0, 40.0, 54.0, 28.0, 38.0, 20.0, 26.0, 20.0, 18.0, 18.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.08013916015625, -0.07768726348876953, -0.07523536682128906, -0.0727834701538086, -0.07033157348632812, -0.06787967681884766, -0.06542778015136719, -0.06297588348388672, -0.06052398681640625, -0.05807209014892578, -0.05562019348144531, -0.053168296813964844, -0.050716400146484375, -0.048264503479003906, -0.04581260681152344, -0.04336071014404297, -0.0409088134765625, -0.03845691680908203, -0.03600502014160156, -0.033553123474121094, -0.031101226806640625, -0.028649330139160156, -0.026197433471679688, -0.02374553680419922, -0.02129364013671875, -0.01884174346923828, -0.016389846801757812, -0.013937950134277344, -0.011486053466796875, -0.009034156799316406, -0.0065822601318359375, -0.004130363464355469, -0.001678466796875, 0.0007734298706054688, 0.0032253265380859375, 0.005677223205566406, 0.008129119873046875, 0.010581016540527344, 0.013032913208007812, 0.015484809875488281, 0.01793670654296875, 0.02038860321044922, 0.022840499877929688, 0.025292396545410156, 0.027744293212890625, 0.030196189880371094, 0.03264808654785156, 0.03509998321533203, 0.0375518798828125, 0.04000377655029297, 0.04245567321777344, 0.044907569885253906, 0.047359466552734375, 0.049811363220214844, 0.05226325988769531, 0.05471515655517578, 0.05716705322265625, 0.05961894989013672, 0.06207084655761719, 0.06452274322509766, 0.06697463989257812, 0.0694265365600586, 0.07187843322753906, 0.07433032989501953, 0.0767822265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 17.0, 15.0, 28.0, 40.0, 43.0, 88.0, 98.0, 177.0, 230.0, 446.0, 735.0, 1470.0, 3264.0, 9176.0, 40608.0, 314330.0, 2697042.0, 1002407.0, 96816.0, 17536.0, 4994.0, 2026.0, 1006.0, 588.0, 372.0, 204.0, 157.0, 121.0, 62.0, 45.0, 40.0, 21.0, 22.0, 12.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14657020568847656, -0.14128494262695312, -0.1359996795654297, -0.13071441650390625, -0.1254291534423828, -0.12014389038085938, -0.11485862731933594, -0.1095733642578125, -0.10428810119628906, -0.09900283813476562, -0.09371757507324219, -0.08843231201171875, -0.08314704895019531, -0.07786178588867188, -0.07257652282714844, -0.067291259765625, -0.06200599670410156, -0.056720733642578125, -0.05143547058105469, -0.04615020751953125, -0.04086494445800781, -0.035579681396484375, -0.030294418334960938, -0.0250091552734375, -0.019723892211914062, -0.014438629150390625, -0.009153366088867188, -0.00386810302734375, 0.0014171600341796875, 0.006702423095703125, 0.011987686157226562, 0.01727294921875, 0.022558212280273438, 0.027843475341796875, 0.03312873840332031, 0.03841400146484375, 0.04369926452636719, 0.048984527587890625, 0.05426979064941406, 0.0595550537109375, 0.06484031677246094, 0.07012557983398438, 0.07541084289550781, 0.08069610595703125, 0.08598136901855469, 0.09126663208007812, 0.09655189514160156, 0.101837158203125, 0.10712242126464844, 0.11240768432617188, 0.11769294738769531, 0.12297821044921875, 0.1282634735107422, 0.13354873657226562, 0.13883399963378906, 0.1441192626953125, 0.14940452575683594, 0.15468978881835938, 0.1599750518798828, 0.16526031494140625, 0.1705455780029297, 0.17583084106445312, 0.18111610412597656, 0.1864013671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 5.0, 6.0, 9.0, 19.0, 18.0, 21.0, 33.0, 55.0, 77.0, 100.0, 138.0, 180.0, 251.0, 298.0, 352.0, 427.0, 416.0, 403.0, 321.0, 249.0, 189.0, 135.0, 108.0, 75.0, 48.0, 34.0, 29.0, 18.0, 10.0, 12.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17333984375, -0.16812515258789062, -0.16291046142578125, -0.15769577026367188, -0.1524810791015625, -0.14726638793945312, -0.14205169677734375, -0.13683700561523438, -0.131622314453125, -0.12640762329101562, -0.12119293212890625, -0.11597824096679688, -0.1107635498046875, -0.10554885864257812, -0.10033416748046875, -0.09511947631835938, -0.08990478515625, -0.08469009399414062, -0.07947540283203125, -0.07426071166992188, -0.0690460205078125, -0.06383132934570312, -0.05861663818359375, -0.053401947021484375, -0.048187255859375, -0.042972564697265625, -0.03775787353515625, -0.032543182373046875, -0.0273284912109375, -0.022113800048828125, -0.01689910888671875, -0.011684417724609375, -0.0064697265625, -0.001255035400390625, 0.00395965576171875, 0.009174346923828125, 0.0143890380859375, 0.019603729248046875, 0.02481842041015625, 0.030033111572265625, 0.035247802734375, 0.040462493896484375, 0.04567718505859375, 0.050891876220703125, 0.0561065673828125, 0.061321258544921875, 0.06653594970703125, 0.07175064086914062, 0.07696533203125, 0.08218002319335938, 0.08739471435546875, 0.09260940551757812, 0.0978240966796875, 0.10303878784179688, 0.10825347900390625, 0.11346817016601562, 0.118682861328125, 0.12389755249023438, 0.12911224365234375, 0.13432693481445312, 0.1395416259765625, 0.14475631713867188, 0.14997100830078125, 0.15518569946289062, 0.160400390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 9.0, 19.0, 15.0, 27.0, 50.0, 60.0, 74.0, 82.0, 102.0, 107.0, 88.0, 97.0, 73.0, 50.0, 42.0, 17.0, 16.0, 19.0, 15.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0907734632492065, -1.0485775470733643, -1.0063815116882324, -0.9641855359077454, -0.9219895601272583, -0.8797935843467712, -0.8375976085662842, -0.7954016327857971, -0.7532056570053101, -0.711009681224823, -0.6688137054443359, -0.6266177296638489, -0.5844217538833618, -0.5422257781028748, -0.5000298023223877, -0.45783382654190063, -0.4156378507614136, -0.3734418749809265, -0.33124589920043945, -0.2890499234199524, -0.24685394763946533, -0.20465797185897827, -0.1624619960784912, -0.12026602029800415, -0.07807004451751709, -0.03587406873703003, 0.006321907043457031, 0.04851788282394409, 0.09071385860443115, 0.1329098343849182, 0.17510581016540527, 0.21730178594589233, 0.25949788093566895, 0.301693856716156, 0.34388983249664307, 0.3860858082771301, 0.4282817840576172, 0.47047775983810425, 0.5126737356185913, 0.5548697113990784, 0.5970656871795654, 0.6392616629600525, 0.6814576387405396, 0.7236536145210266, 0.7658495903015137, 0.8080455660820007, 0.8502415418624878, 0.8924375176429749, 0.9346334934234619, 0.976829469203949, 1.019025444984436, 1.0612213611602783, 1.1034173965454102, 1.145613431930542, 1.1878093481063843, 1.2300052642822266, 1.2722012996673584, 1.3143973350524902, 1.3565932512283325, 1.3987891674041748, 1.4409852027893066, 1.4831812381744385, 1.5253771543502808, 1.567573070526123, 1.6097691059112549]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 9.0, 9.0, 22.0, 17.0, 28.0, 35.0, 34.0, 43.0, 55.0, 44.0, 55.0, 69.0, 52.0, 69.0, 54.0, 49.0, 57.0, 46.0, 50.0, 37.0, 29.0, 36.0, 27.0, 25.0, 12.0, 10.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0028741359710693, -0.9743561148643494, -0.9458381533622742, -0.9173201322555542, -0.8888021111488342, -0.8602840900421143, -0.8317661285400391, -0.8032481074333191, -0.7747300863265991, -0.7462120652198792, -0.717694103717804, -0.689176082611084, -0.660658061504364, -0.632140040397644, -0.6036220788955688, -0.5751040577888489, -0.5465860962867737, -0.5180680751800537, -0.48955008387565613, -0.46103209257125854, -0.4325140714645386, -0.403996080160141, -0.3754780888557434, -0.34696006774902344, -0.31844207644462585, -0.28992408514022827, -0.2614060640335083, -0.23288807272911072, -0.20437006652355194, -0.17585206031799316, -0.14733406901359558, -0.1188160628080368, -0.09029799699783325, -0.061779994517564774, -0.033261992037296295, -0.004743993282318115, 0.02377401292324066, 0.05229201912879944, 0.08081001043319702, 0.1093280166387558, 0.13784602284431458, 0.16636402904987335, 0.19488203525543213, 0.2234000265598297, 0.2519180178642273, 0.28043603897094727, 0.30895403027534485, 0.33747202157974243, 0.3659900426864624, 0.39450803399086, 0.42302605509757996, 0.45154404640197754, 0.4800620675086975, 0.5085800886154175, 0.5370980501174927, 0.5656160712242126, 0.5941340923309326, 0.6226521134376526, 0.6511700749397278, 0.6796880960464478, 0.7082061171531677, 0.7367241382598877, 0.7652420997619629, 0.7937601208686829, 0.8222780823707581]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 16.0, 22.0, 35.0, 36.0, 52.0, 106.0, 153.0, 229.0, 399.0, 717.0, 1345.0, 2747.0, 6250.0, 16368.0, 49779.0, 184742.0, 481328.0, 216186.0, 57029.0, 17919.0, 6792.0, 2984.0, 1412.0, 767.0, 453.0, 275.0, 145.0, 88.0, 62.0, 37.0, 25.0, 20.0, 13.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12373828887939453, -0.12015724182128906, -0.1165761947631836, -0.11299514770507812, -0.10941410064697266, -0.10583305358886719, -0.10225200653076172, -0.09867095947265625, -0.09508991241455078, -0.09150886535644531, -0.08792781829833984, -0.08434677124023438, -0.0807657241821289, -0.07718467712402344, -0.07360363006591797, -0.0700225830078125, -0.06644153594970703, -0.06286048889160156, -0.059279441833496094, -0.055698394775390625, -0.052117347717285156, -0.04853630065917969, -0.04495525360107422, -0.04137420654296875, -0.03779315948486328, -0.03421211242675781, -0.030631065368652344, -0.027050018310546875, -0.023468971252441406, -0.019887924194335938, -0.01630687713623047, -0.012725830078125, -0.009144783020019531, -0.0055637359619140625, -0.0019826889038085938, 0.001598358154296875, 0.005179405212402344, 0.008760452270507812, 0.012341499328613281, 0.01592254638671875, 0.01950359344482422, 0.023084640502929688, 0.026665687561035156, 0.030246734619140625, 0.033827781677246094, 0.03740882873535156, 0.04098987579345703, 0.0445709228515625, 0.04815196990966797, 0.05173301696777344, 0.055314064025878906, 0.058895111083984375, 0.062476158142089844, 0.06605720520019531, 0.06963825225830078, 0.07321929931640625, 0.07680034637451172, 0.08038139343261719, 0.08396244049072266, 0.08754348754882812, 0.0911245346069336, 0.09470558166503906, 0.09828662872314453, 0.10186767578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 2.0, 4.0, 10.0, 21.0, 13.0, 15.0, 22.0, 24.0, 30.0, 22.0, 31.0, 40.0, 41.0, 41.0, 38.0, 59.0, 62.0, 55.0, 47.0, 49.0, 47.0, 61.0, 44.0, 30.0, 43.0, 25.0, 19.0, 19.0, 17.0, 15.0, 15.0, 6.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12493896484375, -0.12124156951904297, -0.11754417419433594, -0.1138467788696289, -0.11014938354492188, -0.10645198822021484, -0.10275459289550781, -0.09905719757080078, -0.09535980224609375, -0.09166240692138672, -0.08796501159667969, -0.08426761627197266, -0.08057022094726562, -0.0768728256225586, -0.07317543029785156, -0.06947803497314453, -0.0657806396484375, -0.06208324432373047, -0.05838584899902344, -0.054688453674316406, -0.050991058349609375, -0.047293663024902344, -0.04359626770019531, -0.03989887237548828, -0.03620147705078125, -0.03250408172607422, -0.028806686401367188, -0.025109291076660156, -0.021411895751953125, -0.017714500427246094, -0.014017105102539062, -0.010319709777832031, -0.006622314453125, -0.0029249191284179688, 0.0007724761962890625, 0.004469871520996094, 0.008167266845703125, 0.011864662170410156, 0.015562057495117188, 0.01925945281982422, 0.02295684814453125, 0.02665424346923828, 0.030351638793945312, 0.034049034118652344, 0.037746429443359375, 0.041443824768066406, 0.04514122009277344, 0.04883861541748047, 0.0525360107421875, 0.05623340606689453, 0.05993080139160156, 0.0636281967163086, 0.06732559204101562, 0.07102298736572266, 0.07472038269042969, 0.07841777801513672, 0.08211517333984375, 0.08581256866455078, 0.08950996398925781, 0.09320735931396484, 0.09690475463867188, 0.1006021499633789, 0.10429954528808594, 0.10799694061279297, 0.1116943359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 5.0, 11.0, 24.0, 28.0, 54.0, 84.0, 127.0, 244.0, 425.0, 841.0, 1755.0, 4290.0, 12424.0, 41357.0, 171434.0, 558907.0, 189180.0, 44940.0, 13498.0, 4826.0, 2017.0, 969.0, 465.0, 259.0, 129.0, 86.0, 58.0, 38.0, 22.0, 18.0, 9.0, 11.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09112548828125, -0.08823585510253906, -0.08534622192382812, -0.08245658874511719, -0.07956695556640625, -0.07667732238769531, -0.07378768920898438, -0.07089805603027344, -0.0680084228515625, -0.06511878967285156, -0.062229156494140625, -0.05933952331542969, -0.05644989013671875, -0.05356025695800781, -0.050670623779296875, -0.04778099060058594, -0.044891357421875, -0.04200172424316406, -0.039112091064453125, -0.03622245788574219, -0.03333282470703125, -0.030443191528320312, -0.027553558349609375, -0.024663925170898438, -0.0217742919921875, -0.018884658813476562, -0.015995025634765625, -0.013105392456054688, -0.01021575927734375, -0.0073261260986328125, -0.004436492919921875, -0.0015468597412109375, 0.0013427734375, 0.0042324066162109375, 0.007122039794921875, 0.010011672973632812, 0.01290130615234375, 0.015790939331054688, 0.018680572509765625, 0.021570205688476562, 0.0244598388671875, 0.027349472045898438, 0.030239105224609375, 0.03312873840332031, 0.03601837158203125, 0.03890800476074219, 0.041797637939453125, 0.04468727111816406, 0.047576904296875, 0.05046653747558594, 0.053356170654296875, 0.05624580383300781, 0.05913543701171875, 0.06202507019042969, 0.06491470336914062, 0.06780433654785156, 0.0706939697265625, 0.07358360290527344, 0.07647323608398438, 0.07936286926269531, 0.08225250244140625, 0.08514213562011719, 0.08803176879882812, 0.09092140197753906, 0.09381103515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 5.0, 11.0, 8.0, 20.0, 18.0, 23.0, 28.0, 33.0, 44.0, 48.0, 53.0, 68.0, 72.0, 71.0, 85.0, 63.0, 64.0, 59.0, 39.0, 41.0, 24.0, 24.0, 29.0, 14.0, 12.0, 8.0, 7.0, 6.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.34521484375, -0.3358421325683594, -0.32646942138671875, -0.3170967102050781, -0.3077239990234375, -0.2983512878417969, -0.28897857666015625, -0.2796058654785156, -0.270233154296875, -0.2608604431152344, -0.25148773193359375, -0.24211502075195312, -0.2327423095703125, -0.22336959838867188, -0.21399688720703125, -0.20462417602539062, -0.19525146484375, -0.18587875366210938, -0.17650604248046875, -0.16713333129882812, -0.1577606201171875, -0.14838790893554688, -0.13901519775390625, -0.12964248657226562, -0.120269775390625, -0.11089706420898438, -0.10152435302734375, -0.09215164184570312, -0.0827789306640625, -0.07340621948242188, -0.06403350830078125, -0.054660797119140625, -0.0452880859375, -0.035915374755859375, -0.02654266357421875, -0.017169952392578125, -0.0077972412109375, 0.001575469970703125, 0.01094818115234375, 0.020320892333984375, 0.029693603515625, 0.039066314697265625, 0.04843902587890625, 0.057811737060546875, 0.0671844482421875, 0.07655715942382812, 0.08592987060546875, 0.09530258178710938, 0.10467529296875, 0.11404800415039062, 0.12342071533203125, 0.13279342651367188, 0.1421661376953125, 0.15153884887695312, 0.16091156005859375, 0.17028427124023438, 0.179656982421875, 0.18902969360351562, 0.19840240478515625, 0.20777511596679688, 0.2171478271484375, 0.22652053833007812, 0.23589324951171875, 0.24526596069335938, 0.254638671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 4.0, 11.0, 9.0, 12.0, 18.0, 24.0, 46.0, 45.0, 78.0, 162.0, 259.0, 510.0, 1133.0, 4464.0, 37822.0, 667974.0, 311798.0, 19216.0, 2955.0, 930.0, 390.0, 197.0, 153.0, 104.0, 52.0, 49.0, 35.0, 28.0, 19.0, 3.0, 10.0, 6.0, 3.0, 6.0, 5.0, 2.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03643798828125, -0.03525733947753906, -0.034076690673828125, -0.03289604187011719, -0.03171539306640625, -0.030534744262695312, -0.029354095458984375, -0.028173446655273438, -0.0269927978515625, -0.025812149047851562, -0.024631500244140625, -0.023450851440429688, -0.02227020263671875, -0.021089553833007812, -0.019908905029296875, -0.018728256225585938, -0.017547607421875, -0.016366958618164062, -0.015186309814453125, -0.014005661010742188, -0.01282501220703125, -0.011644363403320312, -0.010463714599609375, -0.009283065795898438, -0.0081024169921875, -0.0069217681884765625, -0.005741119384765625, -0.0045604705810546875, -0.00337982177734375, -0.0021991729736328125, -0.001018524169921875, 0.0001621246337890625, 0.0013427734375, 0.0025234222412109375, 0.003704071044921875, 0.0048847198486328125, 0.00606536865234375, 0.0072460174560546875, 0.008426666259765625, 0.009607315063476562, 0.0107879638671875, 0.011968612670898438, 0.013149261474609375, 0.014329910278320312, 0.01551055908203125, 0.016691207885742188, 0.017871856689453125, 0.019052505493164062, 0.020233154296875, 0.021413803100585938, 0.022594451904296875, 0.023775100708007812, 0.02495574951171875, 0.026136398315429688, 0.027317047119140625, 0.028497695922851562, 0.0296783447265625, 0.030858993530273438, 0.032039642333984375, 0.03322029113769531, 0.03440093994140625, 0.03558158874511719, 0.036762237548828125, 0.03794288635253906, 0.03912353515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 8.0, 6.0, 9.0, 7.0, 13.0, 19.0, 16.0, 17.0, 28.0, 33.0, 29.0, 27.0, 55.0, 55.0, 60.0, 52.0, 63.0, 79.0, 40.0, 50.0, 71.0, 44.0, 27.0, 36.0, 34.0, 20.0, 10.0, 13.0, 14.0, 11.0, 5.0, 4.0, 6.0, 2.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-7.092952728271484e-06, -6.870366632938385e-06, -6.647780537605286e-06, -6.425194442272186e-06, -6.202608346939087e-06, -5.9800222516059875e-06, -5.757436156272888e-06, -5.534850060939789e-06, -5.3122639656066895e-06, -5.08967787027359e-06, -4.867091774940491e-06, -4.644505679607391e-06, -4.421919584274292e-06, -4.199333488941193e-06, -3.976747393608093e-06, -3.754161298274994e-06, -3.5315752029418945e-06, -3.308989107608795e-06, -3.086403012275696e-06, -2.8638169169425964e-06, -2.641230821609497e-06, -2.4186447262763977e-06, -2.1960586309432983e-06, -1.973472535610199e-06, -1.7508864402770996e-06, -1.5283003449440002e-06, -1.3057142496109009e-06, -1.0831281542778015e-06, -8.605420589447021e-07, -6.379559636116028e-07, -4.153698682785034e-07, -1.9278377294540405e-07, 2.9802322387695312e-08, 2.523884177207947e-07, 4.7497451305389404e-07, 6.975606083869934e-07, 9.201467037200928e-07, 1.1427327990531921e-06, 1.3653188943862915e-06, 1.5879049897193909e-06, 1.8104910850524902e-06, 2.0330771803855896e-06, 2.255663275718689e-06, 2.4782493710517883e-06, 2.7008354663848877e-06, 2.923421561717987e-06, 3.1460076570510864e-06, 3.368593752384186e-06, 3.591179847717285e-06, 3.8137659430503845e-06, 4.036352038383484e-06, 4.258938133716583e-06, 4.481524229049683e-06, 4.704110324382782e-06, 4.926696419715881e-06, 5.149282515048981e-06, 5.37186861038208e-06, 5.5944547057151794e-06, 5.817040801048279e-06, 6.039626896381378e-06, 6.2622129917144775e-06, 6.484799087047577e-06, 6.707385182380676e-06, 6.929971277713776e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 21.0, 25.0, 33.0, 41.0, 83.0, 117.0, 156.0, 233.0, 429.0, 981.0, 2803.0, 11980.0, 73585.0, 589086.0, 316985.0, 40605.0, 7426.0, 1981.0, 792.0, 349.0, 240.0, 173.0, 113.0, 61.0, 57.0, 45.0, 26.0, 21.0, 22.0, 8.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03497314453125, -0.033997535705566406, -0.03302192687988281, -0.03204631805419922, -0.031070709228515625, -0.03009510040283203, -0.029119491577148438, -0.028143882751464844, -0.02716827392578125, -0.026192665100097656, -0.025217056274414062, -0.02424144744873047, -0.023265838623046875, -0.02229022979736328, -0.021314620971679688, -0.020339012145996094, -0.0193634033203125, -0.018387794494628906, -0.017412185668945312, -0.01643657684326172, -0.015460968017578125, -0.014485359191894531, -0.013509750366210938, -0.012534141540527344, -0.01155853271484375, -0.010582923889160156, -0.009607315063476562, -0.008631706237792969, -0.007656097412109375, -0.006680488586425781, -0.0057048797607421875, -0.004729270935058594, -0.003753662109375, -0.0027780532836914062, -0.0018024444580078125, -0.0008268356323242188, 0.000148773193359375, 0.0011243820190429688, 0.0020999908447265625, 0.0030755996704101562, 0.00405120849609375, 0.005026817321777344, 0.0060024261474609375, 0.006978034973144531, 0.007953643798828125, 0.008929252624511719, 0.009904861450195312, 0.010880470275878906, 0.0118560791015625, 0.012831687927246094, 0.013807296752929688, 0.014782905578613281, 0.015758514404296875, 0.01673412322998047, 0.017709732055664062, 0.018685340881347656, 0.01966094970703125, 0.020636558532714844, 0.021612167358398438, 0.02258777618408203, 0.023563385009765625, 0.02453899383544922, 0.025514602661132812, 0.026490211486816406, 0.0274658203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 18.0, 36.0, 63.0, 93.0, 139.0, 154.0, 167.0, 122.0, 76.0, 58.0, 21.0, 16.0, 13.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07470703125, -0.07283258438110352, -0.07095813751220703, -0.06908369064331055, -0.06720924377441406, -0.06533479690551758, -0.0634603500366211, -0.06158590316772461, -0.059711456298828125, -0.05783700942993164, -0.055962562561035156, -0.05408811569213867, -0.05221366882324219, -0.0503392219543457, -0.04846477508544922, -0.046590328216552734, -0.04471588134765625, -0.042841434478759766, -0.04096698760986328, -0.0390925407409668, -0.03721809387207031, -0.03534364700317383, -0.033469200134277344, -0.03159475326538086, -0.029720306396484375, -0.02784585952758789, -0.025971412658691406, -0.024096965789794922, -0.022222518920898438, -0.020348072052001953, -0.01847362518310547, -0.016599178314208984, -0.0147247314453125, -0.012850284576416016, -0.010975837707519531, -0.009101390838623047, -0.0072269439697265625, -0.005352497100830078, -0.0034780502319335938, -0.0016036033630371094, 0.000270843505859375, 0.0021452903747558594, 0.004019737243652344, 0.005894184112548828, 0.0077686309814453125, 0.009643077850341797, 0.011517524719238281, 0.013391971588134766, 0.01526641845703125, 0.017140865325927734, 0.01901531219482422, 0.020889759063720703, 0.022764205932617188, 0.024638652801513672, 0.026513099670410156, 0.02838754653930664, 0.030261993408203125, 0.03213644027709961, 0.034010887145996094, 0.03588533401489258, 0.03775978088378906, 0.03963422775268555, 0.04150867462158203, 0.043383121490478516, 0.045257568359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 1.0, 5.0, 6.0, 8.0, 11.0, 19.0, 23.0, 29.0, 53.0, 83.0, 107.0, 160.0, 163.0, 110.0, 81.0, 39.0, 28.0, 25.0, 13.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8822153210639954, -0.8621003031730652, -0.8419852256774902, -0.8218702077865601, -0.8017551898956299, -0.7816401720046997, -0.7615251541137695, -0.7414100766181946, -0.7212950587272644, -0.7011800408363342, -0.6810649633407593, -0.6609499454498291, -0.6408349275588989, -0.6207199096679688, -0.6006048917770386, -0.5804898142814636, -0.5603747963905334, -0.5402597784996033, -0.5201447010040283, -0.5000296831130981, -0.47991466522216797, -0.4597996473312378, -0.43968459963798523, -0.41956955194473267, -0.3994545340538025, -0.3793395161628723, -0.35922446846961975, -0.3391094207763672, -0.318994402885437, -0.29887938499450684, -0.2787643373012543, -0.2586492896080017, -0.23853430151939392, -0.21841926872730255, -0.19830423593521118, -0.1781892031431198, -0.15807417035102844, -0.13795913755893707, -0.1178441047668457, -0.09772907197475433, -0.07761403918266296, -0.057499006390571594, -0.037383973598480225, -0.017268940806388855, 0.0028460919857025146, 0.022961124777793884, 0.043076157569885254, 0.06319119036197662, 0.083306223154068, 0.10342125594615936, 0.12353628873825073, 0.1436513215303421, 0.16376635432243347, 0.18388138711452484, 0.2039964199066162, 0.22411145269870758, 0.24422648549079895, 0.2643415331840515, 0.2844565510749817, 0.30457156896591187, 0.32468661665916443, 0.344801664352417, 0.36491668224334717, 0.38503170013427734, 0.4051467478275299]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 20.0, 25.0, 45.0, 49.0, 62.0, 74.0, 92.0, 159.0, 134.0, 76.0, 68.0, 65.0, 35.0, 37.0, 20.0, 17.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-1.9915807247161865, -1.9508219957351685, -1.91006338596344, -1.8693046569824219, -1.8285460472106934, -1.7877873182296753, -1.7470287084579468, -1.7062699794769287, -1.6655113697052002, -1.6247526407241821, -1.5839940309524536, -1.5432353019714355, -1.502476692199707, -1.461717963218689, -1.4209593534469604, -1.3802006244659424, -1.3394418954849243, -1.2986831665039062, -1.2579245567321777, -1.2171658277511597, -1.1764072179794312, -1.135648488998413, -1.0948898792266846, -1.0541311502456665, -1.0133724212646484, -0.9726137518882751, -0.9318550825119019, -0.8910964131355286, -0.8503377437591553, -0.8095790147781372, -0.7688203454017639, -0.7280616760253906, -0.6873030066490173, -0.646544337272644, -0.6057856678962708, -0.5650269985198975, -0.5242682695388794, -0.4835096299648285, -0.4427509307861328, -0.4019922614097595, -0.36123359203338623, -0.32047492265701294, -0.27971625328063965, -0.23895755410194397, -0.19819888472557068, -0.1574402153491974, -0.1166815310716629, -0.07592284679412842, -0.03516417741775513, 0.005594499409198761, 0.04635317623615265, 0.08711185306310654, 0.12787052989006042, 0.16862919926643372, 0.2093878835439682, 0.2501465678215027, 0.290905237197876, 0.33166390657424927, 0.37242257595062256, 0.41318127512931824, 0.45393994450569153, 0.4946986138820648, 0.5354573130607605, 0.5762159824371338, 0.6169746518135071]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 14.0, 9.0, 23.0, 28.0, 36.0, 48.0, 71.0, 371.0, 158.0, 57.0, 59.0, 33.0, 23.0, 10.0, 17.0, 13.0, 10.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3144245147705078, -0.3070716857910156, -0.29971885681152344, -0.29236602783203125, -0.28501319885253906, -0.2776603698730469, -0.2703075408935547, -0.2629547119140625, -0.2556018829345703, -0.24824905395507812, -0.24089622497558594, -0.23354339599609375, -0.22619056701660156, -0.21883773803710938, -0.2114849090576172, -0.204132080078125, -0.1967792510986328, -0.18942642211914062, -0.18207359313964844, -0.17472076416015625, -0.16736793518066406, -0.16001510620117188, -0.1526622772216797, -0.1453094482421875, -0.1379566192626953, -0.13060379028320312, -0.12325096130371094, -0.11589813232421875, -0.10854530334472656, -0.10119247436523438, -0.09383964538574219, -0.08648681640625, -0.07913398742675781, -0.07178115844726562, -0.06442832946777344, -0.05707550048828125, -0.04972267150878906, -0.042369842529296875, -0.03501701354980469, -0.0276641845703125, -0.020311355590820312, -0.012958526611328125, -0.0056056976318359375, 0.00174713134765625, 0.009099960327148438, 0.016452789306640625, 0.023805618286132812, 0.031158447265625, 0.03851127624511719, 0.045864105224609375, 0.05321693420410156, 0.06056976318359375, 0.06792259216308594, 0.07527542114257812, 0.08262825012207031, 0.0899810791015625, 0.09733390808105469, 0.10468673706054688, 0.11203956604003906, 0.11939239501953125, 0.12674522399902344, 0.13409805297851562, 0.1414508819580078, 0.1488037109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 9.0, 11.0, 15.0, 18.0, 17.0, 39.0, 44.0, 67.0, 107.0, 142.0, 229.0, 404.0, 884.0, 2164.0, 6294.0, 28903.0, 8287369.0, 49596.0, 7760.0, 2496.0, 940.0, 405.0, 238.0, 146.0, 101.0, 49.0, 39.0, 27.0, 12.0, 11.0, 12.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46612322330474854, -0.45372939109802246, -0.441335529088974, -0.4289416968822479, -0.41654783487319946, -0.4041540026664734, -0.3917601406574249, -0.37936630845069885, -0.3669724464416504, -0.3545786142349243, -0.34218475222587585, -0.3297909200191498, -0.3173970580101013, -0.30500322580337524, -0.2926093637943268, -0.2802155315876007, -0.26782166957855225, -0.25542783737182617, -0.2430339753627777, -0.23064012825489044, -0.21824628114700317, -0.2058524340391159, -0.19345858693122864, -0.18106475472450256, -0.1686709225177765, -0.15627707540988922, -0.14388322830200195, -0.13148938119411469, -0.11909553408622742, -0.10670168697834015, -0.09430784732103348, -0.08191400021314621, -0.06952014565467834, -0.05712629854679108, -0.04473245143890381, -0.03233860805630684, -0.01994476094841957, -0.007550913840532303, 0.004842929542064667, 0.017236776649951935, 0.029630623757839203, 0.04202447086572647, 0.05441831797361374, 0.06681215763092041, 0.07920600473880768, 0.09159985184669495, 0.10399369895458221, 0.11638754606246948, 0.12878139317035675, 0.14117524027824402, 0.1535690873861313, 0.16596293449401855, 0.17835678160190582, 0.1907506287097931, 0.20314446091651917, 0.21553832292556763, 0.2279321551322937, 0.24032600224018097, 0.25271984934806824, 0.2651136815547943, 0.2775075435638428, 0.28990137577056885, 0.3022952377796173, 0.3146890699863434, 0.32708293199539185]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5263785719871521, -0.5044112205505371, -0.4824438691139221, -0.4604765474796295, -0.4385091960430145, -0.41654184460639954, -0.39457452297210693, -0.37260717153549194, -0.35063982009887695, -0.32867246866226196, -0.306705117225647, -0.28473779559135437, -0.2627704441547394, -0.2408030927181244, -0.2188357561826706, -0.1968684196472168, -0.1749010682106018, -0.15293371677398682, -0.13096638023853302, -0.10899903625249863, -0.08703169226646423, -0.06506434828042984, -0.04309700429439545, -0.02112966775894165, 0.0008376836776733398, 0.022805027663707733, 0.044772371649742126, 0.06673971563577652, 0.08870705962181091, 0.1106744036078453, 0.1326417475938797, 0.1546090841293335, 0.1765763759613037, 0.1985437273979187, 0.2205110639333725, 0.2424784004688263, 0.2644457519054413, 0.2864131033420563, 0.3083804249763489, 0.33034777641296387, 0.35231512784957886, 0.37428247928619385, 0.39624983072280884, 0.41821715235710144, 0.44018450379371643, 0.4621518552303314, 0.484119176864624, 0.506086528301239, 0.528053879737854, 0.550021231174469, 0.571988582611084, 0.593955934047699, 0.615923285484314, 0.6378905773162842, 0.6598579287528992, 0.6818252801895142, 0.7037926316261292, 0.7257599830627441, 0.7477273344993591, 0.7696946859359741, 0.7916619777679443, 0.8136293292045593, 0.8355966806411743, 0.8575640320777893, 0.8795313835144043]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 13.0, 6.0, 26.0, 27.0, 33.0, 44.0, 48.0, 60.0, 62.0, 76.0, 88.0, 85.0, 68.0, 74.0, 48.0, 55.0, 62.0, 22.0, 35.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1063232421875, -0.10365676879882812, -0.10099029541015625, -0.09832382202148438, -0.0956573486328125, -0.09299087524414062, -0.09032440185546875, -0.08765792846679688, -0.084991455078125, -0.08232498168945312, -0.07965850830078125, -0.07699203491210938, -0.0743255615234375, -0.07165908813476562, -0.06899261474609375, -0.06632614135742188, -0.06365966796875, -0.060993194580078125, -0.05832672119140625, -0.055660247802734375, -0.0529937744140625, -0.050327301025390625, -0.04766082763671875, -0.044994354248046875, -0.042327880859375, -0.039661407470703125, -0.03699493408203125, -0.034328460693359375, -0.0316619873046875, -0.028995513916015625, -0.02632904052734375, -0.023662567138671875, -0.02099609375, -0.018329620361328125, -0.01566314697265625, -0.012996673583984375, -0.0103302001953125, -0.007663726806640625, -0.00499725341796875, -0.002330780029296875, 0.000335693359375, 0.003002166748046875, 0.00566864013671875, 0.008335113525390625, 0.0110015869140625, 0.013668060302734375, 0.01633453369140625, 0.019001007080078125, 0.02166748046875, 0.024333953857421875, 0.02700042724609375, 0.029666900634765625, 0.0323333740234375, 0.034999847412109375, 0.03766632080078125, 0.040332794189453125, 0.042999267578125, 0.045665740966796875, 0.04833221435546875, 0.050998687744140625, 0.0536651611328125, 0.056331634521484375, 0.05899810791015625, 0.061664581298828125, 0.0643310546875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 19.0, 8.0, 19.0, 16.0, 36.0, 44.0, 57.0, 81.0, 133.0, 237.0, 380.0, 715.0, 1444.0, 2792.0, 5808.0, 12963.0, 34562.0, 129702.0, 227963.0, 67847.0, 21796.0, 9016.0, 4078.0, 2018.0, 1086.0, 551.0, 318.0, 182.0, 115.0, 82.0, 53.0, 30.0, 27.0, 22.0, 12.0, 16.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.181671142578125, -1.14263916015625, -1.103607177734375, -1.0645751953125, -1.025543212890625, -0.98651123046875, -0.947479248046875, -0.908447265625, -0.869415283203125, -0.83038330078125, -0.791351318359375, -0.7523193359375, -0.713287353515625, -0.67425537109375, -0.635223388671875, -0.59619140625, -0.557159423828125, -0.51812744140625, -0.479095458984375, -0.4400634765625, -0.401031494140625, -0.36199951171875, -0.322967529296875, -0.283935546875, -0.244903564453125, -0.20587158203125, -0.166839599609375, -0.1278076171875, -0.088775634765625, -0.04974365234375, -0.010711669921875, 0.0283203125, 0.067352294921875, 0.10638427734375, 0.145416259765625, 0.1844482421875, 0.223480224609375, 0.26251220703125, 0.301544189453125, 0.340576171875, 0.379608154296875, 0.41864013671875, 0.457672119140625, 0.4967041015625, 0.535736083984375, 0.57476806640625, 0.613800048828125, 0.65283203125, 0.691864013671875, 0.73089599609375, 0.769927978515625, 0.8089599609375, 0.847991943359375, 0.88702392578125, 0.926055908203125, 0.965087890625, 1.004119873046875, 1.04315185546875, 1.082183837890625, 1.1212158203125, 1.160247802734375, 1.19927978515625, 1.238311767578125, 1.27734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 9.0, 26.0, 18.0, 17.0, 29.0, 27.0, 33.0, 37.0, 32.0, 44.0, 46.0, 40.0, 55.0, 53.0, 56.0, 57.0, 53.0, 46.0, 48.0, 43.0, 36.0, 30.0, 24.0, 19.0, 14.0, 16.0, 10.0, 6.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0997314453125, -0.0966501235961914, -0.09356880187988281, -0.09048748016357422, -0.08740615844726562, -0.08432483673095703, -0.08124351501464844, -0.07816219329833984, -0.07508087158203125, -0.07199954986572266, -0.06891822814941406, -0.06583690643310547, -0.06275558471679688, -0.05967426300048828, -0.05659294128417969, -0.053511619567871094, -0.0504302978515625, -0.047348976135253906, -0.04426765441894531, -0.04118633270263672, -0.038105010986328125, -0.03502368927001953, -0.03194236755371094, -0.028861045837402344, -0.02577972412109375, -0.022698402404785156, -0.019617080688476562, -0.01653575897216797, -0.013454437255859375, -0.010373115539550781, -0.0072917938232421875, -0.004210472106933594, -0.001129150390625, 0.0019521713256835938, 0.0050334930419921875, 0.008114814758300781, 0.011196136474609375, 0.014277458190917969, 0.017358779907226562, 0.020440101623535156, 0.02352142333984375, 0.026602745056152344, 0.029684066772460938, 0.03276538848876953, 0.035846710205078125, 0.03892803192138672, 0.04200935363769531, 0.045090675354003906, 0.0481719970703125, 0.051253318786621094, 0.05433464050292969, 0.05741596221923828, 0.060497283935546875, 0.06357860565185547, 0.06665992736816406, 0.06974124908447266, 0.07282257080078125, 0.07590389251708984, 0.07898521423339844, 0.08206653594970703, 0.08514785766601562, 0.08822917938232422, 0.09131050109863281, 0.0943918228149414, 0.09747314453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 9.0, 11.0, 14.0, 32.0, 42.0, 55.0, 77.0, 66.0, 48.0, 32.0, 32.0, 16.0, 11.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3021215796470642, -0.29052022099494934, -0.2789188623428345, -0.2673175036907196, -0.25571614503860474, -0.24411478638648987, -0.232513427734375, -0.22091206908226013, -0.20931071043014526, -0.1977093517780304, -0.18610799312591553, -0.17450663447380066, -0.1629052758216858, -0.15130391716957092, -0.13970255851745605, -0.1281011998653412, -0.11649984121322632, -0.10489848256111145, -0.09329712390899658, -0.08169576525688171, -0.07009440660476685, -0.05849304795265198, -0.04689168930053711, -0.03529033064842224, -0.023688971996307373, -0.012087613344192505, -0.0004862546920776367, 0.011115103960037231, 0.0227164626121521, 0.03431782126426697, 0.045919179916381836, 0.057520538568496704, 0.06912189722061157, 0.08072325587272644, 0.09232461452484131, 0.10392597317695618, 0.11552733182907104, 0.1271286904811859, 0.13873004913330078, 0.15033140778541565, 0.16193276643753052, 0.17353412508964539, 0.18513548374176025, 0.19673684239387512, 0.20833820104599, 0.21993955969810486, 0.23154091835021973, 0.2431422770023346, 0.25474363565444946, 0.26634499430656433, 0.2779463529586792, 0.28954771161079407, 0.30114907026290894, 0.3127504289150238, 0.32435178756713867, 0.33595314621925354, 0.3475545048713684, 0.3591558635234833, 0.37075722217559814, 0.382358580827713, 0.3939599394798279, 0.40556129813194275, 0.4171626567840576, 0.4287640154361725, 0.44036537408828735]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 8.0, 8.0, 6.0, 2.0, 4.0, 7.0, 14.0, 16.0, 60.0, 107.0, 83.0, 35.0, 17.0, 9.0, 14.0, 9.0, 9.0, 8.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3772903084754944, -0.3655451238155365, -0.3537999391555786, -0.3420547544956207, -0.33030956983566284, -0.31856435537338257, -0.30681920051574707, -0.2950739860534668, -0.2833288013935089, -0.271583616733551, -0.25983843207359314, -0.24809324741363525, -0.23634804785251617, -0.2246028631925583, -0.2128576785326004, -0.20111247897148132, -0.18936730921268463, -0.17762212455272675, -0.16587693989276886, -0.15413174033164978, -0.1423865556716919, -0.130641371011734, -0.11889618635177612, -0.10715099424123764, -0.09540580958127975, -0.08366062492132187, -0.07191543281078339, -0.0601702481508255, -0.048425059765577316, -0.03667987138032913, -0.024934686720371246, -0.013189494609832764, -0.001444309949874878, 0.010300877504050732, 0.02204606495797634, 0.033791251480579376, 0.04553643986582756, 0.057281628251075745, 0.06902681291103363, 0.08077200502157211, 0.09251718968153, 0.10426237434148788, 0.11600756645202637, 0.12775275111198425, 0.13949793577194214, 0.15124312043190002, 0.1629883050918579, 0.174733504652977, 0.18647868931293488, 0.19822387397289276, 0.20996905863285065, 0.22171425819396973, 0.2334594428539276, 0.2452046275138855, 0.2569498121738434, 0.26869499683380127, 0.28044018149375916, 0.29218536615371704, 0.3039305508136749, 0.3156757354736328, 0.3274209201335907, 0.3391661047935486, 0.35091131925582886, 0.36265650391578674, 0.37440168857574463]}, "eval/loss": 2.2451658248901367, "eval/bleu": 2.3052062590891975e-13, "eval/runtime": 2533.9805, "eval/samples_per_second": 5.825, "eval/steps_per_second": 0.728} \ No newline at end of file