diff --git "a/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" --- "a/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" +++ "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0134, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 10.0, "train/global_step": 2230, "_runtime": 51756, "_timestamp": 1648366446, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 30.0, 111.0, 200.0, 305.0, 216.0, 87.0, 40.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3592593669891357, -2.3074288368225098, -2.255598545074463, -2.203768014907837, -2.151937484741211, -2.100106954574585, -2.048276662826538, -1.996446132659912, -1.9446156024932861, -1.8927851915359497, -1.8409546613693237, -1.7891242504119873, -1.7372937202453613, -1.685463309288025, -1.633632779121399, -1.5818023681640625, -1.5299718379974365, -1.4781414270401, -1.4263108968734741, -1.3744804859161377, -1.3226499557495117, -1.2708195447921753, -1.2189890146255493, -1.167158603668213, -1.1153281927108765, -1.06349778175354, -1.011667251586914, -0.9598367810249329, -0.9080063104629517, -0.8561758995056152, -0.8043453693389893, -0.7525149583816528, -0.7006843686103821, -0.6488538980484009, -0.5970234274864197, -0.5451929569244385, -0.4933624863624573, -0.44153204560279846, -0.38970157504081726, -0.33787110447883606, -0.28604063391685486, -0.23421016335487366, -0.18237969279289246, -0.13054923713207245, -0.07871876657009125, -0.02688831090927124, 0.02494215965270996, 0.07677263021469116, 0.12860310077667236, 0.18043357133865356, 0.23226404190063477, 0.28409451246261597, 0.33592498302459717, 0.387755423784256, 0.4395858943462372, 0.4914163649082184, 0.543246865272522, 0.5950773358345032, 0.6469078063964844, 0.6987382769584656, 0.7505687475204468, 0.8023991584777832, 0.8542296886444092, 0.9060600996017456, 0.9578905701637268]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 19.0, 22.0, 24.0, 39.0, 22.0, 38.0, 43.0, 41.0, 48.0, 48.0, 49.0, 51.0, 56.0, 44.0, 49.0, 42.0, 36.0, 39.0, 35.0, 28.0, 34.0, 18.0, 24.0, 25.0, 18.0, 17.0, 13.0, 6.0, 10.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4530882239341736, -0.4375229775905609, -0.42195773124694824, -0.40639248490333557, -0.3908272385597229, -0.37526199221611023, -0.35969674587249756, -0.3441315293312073, -0.3285662531852722, -0.31300100684165955, -0.2974357604980469, -0.2818705141544342, -0.26630526781082153, -0.25074002146720886, -0.23517479002475739, -0.21960954368114471, -0.20404431223869324, -0.18847906589508057, -0.1729138195514679, -0.15734857320785522, -0.14178332686424255, -0.12621808052062988, -0.1106528490781784, -0.09508760273456573, -0.07952235639095306, -0.0639571100473404, -0.04839186742901802, -0.03282662481069565, -0.017261378467082977, -0.0016961321234703064, 0.013869106769561768, 0.02943435311317444, 0.04499959945678711, 0.06056484580039978, 0.07613009214401245, 0.09169533103704453, 0.1072605773806572, 0.12282582372426987, 0.13839106261730194, 0.1539563089609146, 0.16952155530452728, 0.18508680164813995, 0.20065204799175262, 0.2162172794342041, 0.23178252577781677, 0.24734777212142944, 0.2629130184650421, 0.2784782648086548, 0.29404351115226746, 0.3096087574958801, 0.3251740038394928, 0.34073925018310547, 0.35630449652671814, 0.3718697428703308, 0.3874349594116211, 0.40300023555755615, 0.41856545209884644, 0.4341306984424591, 0.4496959447860718, 0.46526119112968445, 0.4808264374732971, 0.4963916838169098, 0.5119569301605225, 0.5275221467018127, 0.5430874228477478]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 14.0, 13.0, 14.0, 21.0, 30.0, 36.0, 48.0, 62.0, 98.0, 147.0, 212.0, 322.0, 507.0, 747.0, 1173.0, 1811.0, 3182.0, 6017.0, 12088.0, 30614.0, 128466.0, 602238.0, 2024053.0, 1052782.0, 239315.0, 55238.0, 17617.0, 7380.0, 3974.0, 2237.0, 1354.0, 854.0, 546.0, 349.0, 221.0, 154.0, 102.0, 71.0, 47.0, 35.0, 37.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.86083984375, -0.835296630859375, -0.80975341796875, -0.784210205078125, -0.7586669921875, -0.733123779296875, -0.70758056640625, -0.682037353515625, -0.656494140625, -0.630950927734375, -0.60540771484375, -0.579864501953125, -0.5543212890625, -0.528778076171875, -0.50323486328125, -0.477691650390625, -0.4521484375, -0.426605224609375, -0.40106201171875, -0.375518798828125, -0.3499755859375, -0.324432373046875, -0.29888916015625, -0.273345947265625, -0.247802734375, -0.222259521484375, -0.19671630859375, -0.171173095703125, -0.1456298828125, -0.120086669921875, -0.09454345703125, -0.069000244140625, -0.04345703125, -0.017913818359375, 0.00762939453125, 0.033172607421875, 0.0587158203125, 0.084259033203125, 0.10980224609375, 0.135345458984375, 0.160888671875, 0.186431884765625, 0.21197509765625, 0.237518310546875, 0.2630615234375, 0.288604736328125, 0.31414794921875, 0.339691162109375, 0.365234375, 0.390777587890625, 0.41632080078125, 0.441864013671875, 0.4674072265625, 0.492950439453125, 0.51849365234375, 0.544036865234375, 0.569580078125, 0.595123291015625, 0.62066650390625, 0.646209716796875, 0.6717529296875, 0.697296142578125, 0.72283935546875, 0.748382568359375, 0.77392578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 2.0, 5.0, 15.0, 16.0, 10.0, 27.0, 24.0, 27.0, 25.0, 40.0, 51.0, 38.0, 33.0, 52.0, 66.0, 52.0, 44.0, 41.0, 41.0, 56.0, 35.0, 50.0, 41.0, 25.0, 27.0, 22.0, 25.0, 16.0, 19.0, 12.0, 14.0, 16.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69384765625, -0.668426513671875, -0.64300537109375, -0.617584228515625, -0.5921630859375, -0.566741943359375, -0.54132080078125, -0.515899658203125, -0.490478515625, -0.465057373046875, -0.43963623046875, -0.414215087890625, -0.3887939453125, -0.363372802734375, -0.33795166015625, -0.312530517578125, -0.287109375, -0.261688232421875, -0.23626708984375, -0.210845947265625, -0.1854248046875, -0.160003662109375, -0.13458251953125, -0.109161376953125, -0.083740234375, -0.058319091796875, -0.03289794921875, -0.007476806640625, 0.0179443359375, 0.043365478515625, 0.06878662109375, 0.094207763671875, 0.11962890625, 0.145050048828125, 0.17047119140625, 0.195892333984375, 0.2213134765625, 0.246734619140625, 0.27215576171875, 0.297576904296875, 0.322998046875, 0.348419189453125, 0.37384033203125, 0.399261474609375, 0.4246826171875, 0.450103759765625, 0.47552490234375, 0.500946044921875, 0.5263671875, 0.551788330078125, 0.57720947265625, 0.602630615234375, 0.6280517578125, 0.653472900390625, 0.67889404296875, 0.704315185546875, 0.729736328125, 0.755157470703125, 0.78057861328125, 0.805999755859375, 0.8314208984375, 0.856842041015625, 0.88226318359375, 0.907684326171875, 0.93310546875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 19.0, 37.0, 79.0, 590.0, 4178993.0, 14102.0, 338.0, 69.0, 27.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.251220703125, -16.42431640625, -15.597412109375, -14.7705078125, -13.943603515625, -13.11669921875, -12.289794921875, -11.462890625, -10.635986328125, -9.80908203125, -8.982177734375, -8.1552734375, -7.328369140625, -6.50146484375, -5.674560546875, -4.84765625, -4.020751953125, -3.19384765625, -2.366943359375, -1.5400390625, -0.713134765625, 0.11376953125, 0.940673828125, 1.767578125, 2.594482421875, 3.42138671875, 4.248291015625, 5.0751953125, 5.902099609375, 6.72900390625, 7.555908203125, 8.3828125, 9.209716796875, 10.03662109375, 10.863525390625, 11.6904296875, 12.517333984375, 13.34423828125, 14.171142578125, 14.998046875, 15.824951171875, 16.65185546875, 17.478759765625, 18.3056640625, 19.132568359375, 19.95947265625, 20.786376953125, 21.61328125, 22.440185546875, 23.26708984375, 24.093994140625, 24.9208984375, 25.747802734375, 26.57470703125, 27.401611328125, 28.228515625, 29.055419921875, 29.88232421875, 30.709228515625, 31.5361328125, 32.363037109375, 33.18994140625, 34.016845703125, 34.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 29.0, 38.0, 139.0, 570.0, 2697.0, 421.0, 114.0, 35.0, 13.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9287796020507812, -0.8922271728515625, -0.8556747436523438, -0.819122314453125, -0.7825698852539062, -0.7460174560546875, -0.7094650268554688, -0.67291259765625, -0.6363601684570312, -0.5998077392578125, -0.5632553100585938, -0.526702880859375, -0.49015045166015625, -0.4535980224609375, -0.41704559326171875, -0.3804931640625, -0.34394073486328125, -0.3073883056640625, -0.27083587646484375, -0.234283447265625, -0.19773101806640625, -0.1611785888671875, -0.12462615966796875, -0.08807373046875, -0.05152130126953125, -0.0149688720703125, 0.02158355712890625, 0.058135986328125, 0.09468841552734375, 0.1312408447265625, 0.16779327392578125, 0.204345703125, 0.24089813232421875, 0.2774505615234375, 0.31400299072265625, 0.350555419921875, 0.38710784912109375, 0.4236602783203125, 0.46021270751953125, 0.49676513671875, 0.5333175659179688, 0.5698699951171875, 0.6064224243164062, 0.642974853515625, 0.6795272827148438, 0.7160797119140625, 0.7526321411132812, 0.7891845703125, 0.8257369995117188, 0.8622894287109375, 0.8988418579101562, 0.935394287109375, 0.9719467163085938, 1.0084991455078125, 1.0450515747070312, 1.08160400390625, 1.1181564331054688, 1.1547088623046875, 1.1912612915039062, 1.227813720703125, 1.2643661499023438, 1.3009185791015625, 1.3374710083007812, 1.3740234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 11.0, 13.0, 15.0, 18.0, 31.0, 30.0, 35.0, 51.0, 69.0, 69.0, 78.0, 91.0, 106.0, 73.0, 57.0, 56.0, 46.0, 29.0, 34.0, 18.0, 14.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1353092193603516, -1.1050784587860107, -1.0748478174209595, -1.0446170568466187, -1.0143862962722778, -0.9841555953025818, -0.9539248943328857, -0.9236941337585449, -0.8934634327888489, -0.8632327318191528, -0.833001971244812, -0.802771270275116, -0.7725405693054199, -0.7423098087310791, -0.7120791077613831, -0.681848406791687, -0.6516176462173462, -0.6213869452476501, -0.5911561846733093, -0.5609254837036133, -0.5306947231292725, -0.5004640221595764, -0.47023332118988037, -0.44000259041786194, -0.4097718596458435, -0.3795411288738251, -0.34931039810180664, -0.3190796971321106, -0.28884896636009216, -0.25861823558807373, -0.2283875197172165, -0.19815680384635925, -0.16792601346969604, -0.1376952826976776, -0.10746456682682037, -0.07723384350538254, -0.0470031201839447, -0.01677238941192627, 0.01345832645893097, 0.04368904232978821, 0.07391977310180664, 0.10415049642324448, 0.1343812197446823, 0.16461193561553955, 0.19484266638755798, 0.22507339715957642, 0.25530409812927246, 0.2855348289012909, 0.3157655596733093, 0.34599629044532776, 0.3762270212173462, 0.40645772218704224, 0.43668845295906067, 0.4669191837310791, 0.49714988470077515, 0.5273805856704712, 0.557611346244812, 0.5878420472145081, 0.6180728077888489, 0.6483035087585449, 0.6785342693328857, 0.7087649703025818, 0.7389956712722778, 0.7692264318466187, 0.7994571328163147]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 8.0, 10.0, 8.0, 11.0, 26.0, 22.0, 29.0, 32.0, 23.0, 43.0, 37.0, 45.0, 41.0, 28.0, 50.0, 45.0, 46.0, 40.0, 44.0, 47.0, 35.0, 44.0, 53.0, 28.0, 36.0, 24.0, 25.0, 21.0, 9.0, 17.0, 11.0, 20.0, 9.0, 7.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6483617424964905, -0.6281723380088806, -0.607982873916626, -0.5877934694290161, -0.5676040053367615, -0.5474146008491516, -0.527225136756897, -0.5070357322692871, -0.48684626817703247, -0.4666568338871002, -0.44646739959716797, -0.4262779653072357, -0.40608853101730347, -0.3858990967273712, -0.36570966243743896, -0.3455202579498291, -0.32533082365989685, -0.3051413893699646, -0.28495195508003235, -0.2647625207901001, -0.24457308650016785, -0.2243836522102356, -0.20419423282146454, -0.1840047985315323, -0.16381536424160004, -0.14362592995166779, -0.12343649566173553, -0.10324706882238388, -0.08305763453245163, -0.06286820024251938, -0.042678773403167725, -0.022489339113235474, -0.0022999048233032227, 0.01788952760398388, 0.03807896003127098, 0.05826839059591293, 0.07845782488584518, 0.09864725917577744, 0.11883668601512909, 0.13902612030506134, 0.1592155545949936, 0.17940498888492584, 0.1995944231748581, 0.21978384256362915, 0.2399732768535614, 0.26016271114349365, 0.2803521454334259, 0.30054157972335815, 0.3207310140132904, 0.34092044830322266, 0.3611098825931549, 0.38129931688308716, 0.4014887511730194, 0.42167818546295166, 0.4418675899505615, 0.46205705404281616, 0.482246458530426, 0.5024358630180359, 0.5226253271102905, 0.5428147315979004, 0.563004195690155, 0.5831936001777649, 0.6033830642700195, 0.6235724687576294, 0.643761932849884]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 1.0, 7.0, 12.0, 21.0, 28.0, 34.0, 58.0, 73.0, 147.0, 208.0, 310.0, 539.0, 842.0, 1393.0, 2397.0, 4277.0, 7140.0, 12779.0, 23155.0, 42211.0, 77846.0, 141425.0, 236640.0, 218332.0, 125422.0, 68411.0, 37037.0, 20560.0, 11411.0, 6471.0, 3693.0, 2276.0, 1323.0, 760.0, 479.0, 308.0, 183.0, 101.0, 86.0, 43.0, 35.0, 21.0, 19.0, 14.0, 15.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.22359848022460938, -0.21636199951171875, -0.20912551879882812, -0.2018890380859375, -0.19465255737304688, -0.18741607666015625, -0.18017959594726562, -0.172943115234375, -0.16570663452148438, -0.15847015380859375, -0.15123367309570312, -0.1439971923828125, -0.13676071166992188, -0.12952423095703125, -0.12228775024414062, -0.11505126953125, -0.10781478881835938, -0.10057830810546875, -0.09334182739257812, -0.0861053466796875, -0.07886886596679688, -0.07163238525390625, -0.06439590454101562, -0.057159423828125, -0.049922943115234375, -0.04268646240234375, -0.035449981689453125, -0.0282135009765625, -0.020977020263671875, -0.01374053955078125, -0.006504058837890625, 0.000732421875, 0.007968902587890625, 0.01520538330078125, 0.022441864013671875, 0.0296783447265625, 0.036914825439453125, 0.04415130615234375, 0.051387786865234375, 0.058624267578125, 0.06586074829101562, 0.07309722900390625, 0.08033370971679688, 0.0875701904296875, 0.09480667114257812, 0.10204315185546875, 0.10927963256835938, 0.11651611328125, 0.12375259399414062, 0.13098907470703125, 0.13822555541992188, 0.1454620361328125, 0.15269851684570312, 0.15993499755859375, 0.16717147827148438, 0.174407958984375, 0.18164443969726562, 0.18888092041015625, 0.19611740112304688, 0.2033538818359375, 0.21059036254882812, 0.21782684326171875, 0.22506332397460938, 0.2322998046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 32.0, 21.0, 24.0, 29.0, 40.0, 30.0, 44.0, 37.0, 49.0, 35.0, 50.0, 51.0, 61.0, 40.0, 49.0, 45.0, 45.0, 35.0, 30.0, 40.0, 32.0, 22.0, 25.0, 19.0, 9.0, 11.0, 13.0, 11.0, 9.0, 6.0, 9.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.4424400329589844, -0.42833709716796875, -0.4142341613769531, -0.4001312255859375, -0.3860282897949219, -0.37192535400390625, -0.3578224182128906, -0.343719482421875, -0.3296165466308594, -0.31551361083984375, -0.3014106750488281, -0.2873077392578125, -0.2732048034667969, -0.25910186767578125, -0.24499893188476562, -0.23089599609375, -0.21679306030273438, -0.20269012451171875, -0.18858718872070312, -0.1744842529296875, -0.16038131713867188, -0.14627838134765625, -0.13217544555664062, -0.118072509765625, -0.10396957397460938, -0.08986663818359375, -0.07576370239257812, -0.0616607666015625, -0.047557830810546875, -0.03345489501953125, -0.019351959228515625, -0.0052490234375, 0.008853912353515625, 0.02295684814453125, 0.037059783935546875, 0.0511627197265625, 0.06526565551757812, 0.07936859130859375, 0.09347152709960938, 0.107574462890625, 0.12167739868164062, 0.13578033447265625, 0.14988327026367188, 0.1639862060546875, 0.17808914184570312, 0.19219207763671875, 0.20629501342773438, 0.22039794921875, 0.23450088500976562, 0.24860382080078125, 0.2627067565917969, 0.2768096923828125, 0.2909126281738281, 0.30501556396484375, 0.3191184997558594, 0.333221435546875, 0.3473243713378906, 0.36142730712890625, 0.3755302429199219, 0.3896331787109375, 0.4037361145019531, 0.41783905029296875, 0.4319419860839844, 0.446044921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 16.0, 13.0, 30.0, 28.0, 52.0, 66.0, 109.0, 234.0, 364.0, 769.0, 1422.0, 3143.0, 8148.0, 23704.0, 77312.0, 283738.0, 445985.0, 140916.0, 40421.0, 13068.0, 4750.0, 2090.0, 991.0, 468.0, 267.0, 173.0, 94.0, 56.0, 43.0, 23.0, 16.0, 12.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37480926513671875, -0.3624114990234375, -0.35001373291015625, -0.337615966796875, -0.32521820068359375, -0.3128204345703125, -0.30042266845703125, -0.28802490234375, -0.27562713623046875, -0.2632293701171875, -0.25083160400390625, -0.238433837890625, -0.22603607177734375, -0.2136383056640625, -0.20124053955078125, -0.1888427734375, -0.17644500732421875, -0.1640472412109375, -0.15164947509765625, -0.139251708984375, -0.12685394287109375, -0.1144561767578125, -0.10205841064453125, -0.08966064453125, -0.07726287841796875, -0.0648651123046875, -0.05246734619140625, -0.040069580078125, -0.02767181396484375, -0.0152740478515625, -0.00287628173828125, 0.009521484375, 0.02191925048828125, 0.0343170166015625, 0.04671478271484375, 0.059112548828125, 0.07151031494140625, 0.0839080810546875, 0.09630584716796875, 0.10870361328125, 0.12110137939453125, 0.1334991455078125, 0.14589691162109375, 0.158294677734375, 0.17069244384765625, 0.1830902099609375, 0.19548797607421875, 0.2078857421875, 0.22028350830078125, 0.2326812744140625, 0.24507904052734375, 0.257476806640625, 0.26987457275390625, 0.2822723388671875, 0.29467010498046875, 0.30706787109375, 0.31946563720703125, 0.3318634033203125, 0.34426116943359375, 0.356658935546875, 0.36905670166015625, 0.3814544677734375, 0.39385223388671875, 0.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 11.0, 11.0, 17.0, 12.0, 15.0, 14.0, 26.0, 29.0, 25.0, 29.0, 35.0, 21.0, 31.0, 49.0, 43.0, 46.0, 48.0, 44.0, 34.0, 36.0, 34.0, 32.0, 41.0, 32.0, 34.0, 25.0, 29.0, 26.0, 15.0, 24.0, 18.0, 17.0, 13.0, 12.0, 7.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7140655517578125, -0.688873291015625, -0.6636810302734375, -0.63848876953125, -0.6132965087890625, -0.588104248046875, -0.5629119873046875, -0.5377197265625, -0.5125274658203125, -0.487335205078125, -0.4621429443359375, -0.43695068359375, -0.4117584228515625, -0.386566162109375, -0.3613739013671875, -0.336181640625, -0.3109893798828125, -0.285797119140625, -0.2606048583984375, -0.23541259765625, -0.2102203369140625, -0.185028076171875, -0.1598358154296875, -0.1346435546875, -0.1094512939453125, -0.084259033203125, -0.0590667724609375, -0.03387451171875, -0.0086822509765625, 0.016510009765625, 0.0417022705078125, 0.06689453125, 0.0920867919921875, 0.117279052734375, 0.1424713134765625, 0.16766357421875, 0.1928558349609375, 0.218048095703125, 0.2432403564453125, 0.2684326171875, 0.2936248779296875, 0.318817138671875, 0.3440093994140625, 0.36920166015625, 0.3943939208984375, 0.419586181640625, 0.4447784423828125, 0.469970703125, 0.4951629638671875, 0.520355224609375, 0.5455474853515625, 0.57073974609375, 0.5959320068359375, 0.621124267578125, 0.6463165283203125, 0.6715087890625, 0.6967010498046875, 0.721893310546875, 0.7470855712890625, 0.77227783203125, 0.7974700927734375, 0.822662353515625, 0.8478546142578125, 0.873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 18.0, 31.0, 34.0, 57.0, 87.0, 134.0, 254.0, 420.0, 728.0, 1376.0, 2871.0, 5907.0, 13614.0, 37320.0, 123114.0, 424889.0, 309507.0, 81611.0, 26653.0, 10439.0, 4590.0, 2218.0, 1147.0, 629.0, 348.0, 219.0, 110.0, 88.0, 46.0, 32.0, 17.0, 12.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.06044912338256836, -0.05855083465576172, -0.05665254592895508, -0.05475425720214844, -0.0528559684753418, -0.050957679748535156, -0.049059391021728516, -0.047161102294921875, -0.045262813568115234, -0.043364524841308594, -0.04146623611450195, -0.03956794738769531, -0.03766965866088867, -0.03577136993408203, -0.03387308120727539, -0.03197479248046875, -0.03007650375366211, -0.02817821502685547, -0.026279926300048828, -0.024381637573242188, -0.022483348846435547, -0.020585060119628906, -0.018686771392822266, -0.016788482666015625, -0.014890193939208984, -0.012991905212402344, -0.011093616485595703, -0.009195327758789062, -0.007297039031982422, -0.005398750305175781, -0.0035004615783691406, -0.0016021728515625, 0.0002961158752441406, 0.0021944046020507812, 0.004092693328857422, 0.0059909820556640625, 0.007889270782470703, 0.009787559509277344, 0.011685848236083984, 0.013584136962890625, 0.015482425689697266, 0.017380714416503906, 0.019279003143310547, 0.021177291870117188, 0.023075580596923828, 0.02497386932373047, 0.02687215805053711, 0.02877044677734375, 0.03066873550415039, 0.03256702423095703, 0.03446531295776367, 0.03636360168457031, 0.03826189041137695, 0.040160179138183594, 0.042058467864990234, 0.043956756591796875, 0.045855045318603516, 0.047753334045410156, 0.0496516227722168, 0.05154991149902344, 0.05344820022583008, 0.05534648895263672, 0.05724477767944336, 0.05914306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 22.0, 22.0, 14.0, 27.0, 43.0, 65.0, 87.0, 124.0, 128.0, 106.0, 103.0, 56.0, 58.0, 25.0, 28.0, 16.0, 13.0, 9.0, 4.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.5666471123695374e-05, -4.364922642707825e-05, -4.163198173046112e-05, -3.9614737033843994e-05, -3.759749233722687e-05, -3.558024764060974e-05, -3.3563002943992615e-05, -3.154575824737549e-05, -2.9528513550758362e-05, -2.7511268854141235e-05, -2.549402415752411e-05, -2.3476779460906982e-05, -2.1459534764289856e-05, -1.944229006767273e-05, -1.7425045371055603e-05, -1.5407800674438477e-05, -1.339055597782135e-05, -1.1373311281204224e-05, -9.356066584587097e-06, -7.338821887969971e-06, -5.321577191352844e-06, -3.3043324947357178e-06, -1.2870877981185913e-06, 7.301568984985352e-07, 2.7474015951156616e-06, 4.764646291732788e-06, 6.7818909883499146e-06, 8.799135684967041e-06, 1.0816380381584167e-05, 1.2833625078201294e-05, 1.485086977481842e-05, 1.6868114471435547e-05, 1.8885359168052673e-05, 2.09026038646698e-05, 2.2919848561286926e-05, 2.4937093257904053e-05, 2.695433795452118e-05, 2.8971582651138306e-05, 3.098882734775543e-05, 3.300607204437256e-05, 3.5023316740989685e-05, 3.704056143760681e-05, 3.905780613422394e-05, 4.1075050830841064e-05, 4.309229552745819e-05, 4.510954022407532e-05, 4.7126784920692444e-05, 4.914402961730957e-05, 5.11612743139267e-05, 5.317851901054382e-05, 5.519576370716095e-05, 5.7213008403778076e-05, 5.92302531003952e-05, 6.124749779701233e-05, 6.326474249362946e-05, 6.528198719024658e-05, 6.729923188686371e-05, 6.931647658348083e-05, 7.133372128009796e-05, 7.335096597671509e-05, 7.536821067333221e-05, 7.738545536994934e-05, 7.940270006656647e-05, 8.14199447631836e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 18.0, 15.0, 24.0, 30.0, 33.0, 62.0, 62.0, 156.0, 288.0, 586.0, 1592.0, 4758.0, 17727.0, 106463.0, 641518.0, 232467.0, 31445.0, 7188.0, 2350.0, 918.0, 338.0, 174.0, 99.0, 63.0, 47.0, 32.0, 20.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09949684143066406, -0.09602737426757812, -0.09255790710449219, -0.08908843994140625, -0.08561897277832031, -0.08214950561523438, -0.07868003845214844, -0.0752105712890625, -0.07174110412597656, -0.06827163696289062, -0.06480216979980469, -0.06133270263671875, -0.05786323547363281, -0.054393768310546875, -0.05092430114746094, -0.047454833984375, -0.04398536682128906, -0.040515899658203125, -0.03704643249511719, -0.03357696533203125, -0.030107498168945312, -0.026638031005859375, -0.023168563842773438, -0.0196990966796875, -0.016229629516601562, -0.012760162353515625, -0.009290695190429688, -0.00582122802734375, -0.0023517608642578125, 0.001117706298828125, 0.0045871734619140625, 0.008056640625, 0.011526107788085938, 0.014995574951171875, 0.018465042114257812, 0.02193450927734375, 0.025403976440429688, 0.028873443603515625, 0.03234291076660156, 0.0358123779296875, 0.03928184509277344, 0.042751312255859375, 0.04622077941894531, 0.04969024658203125, 0.05315971374511719, 0.056629180908203125, 0.06009864807128906, 0.063568115234375, 0.06703758239746094, 0.07050704956054688, 0.07397651672363281, 0.07744598388671875, 0.08091545104980469, 0.08438491821289062, 0.08785438537597656, 0.0913238525390625, 0.09479331970214844, 0.09826278686523438, 0.10173225402832031, 0.10520172119140625, 0.10867118835449219, 0.11214065551757812, 0.11561012268066406, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 7.0, 5.0, 7.0, 11.0, 18.0, 15.0, 19.0, 21.0, 26.0, 30.0, 36.0, 51.0, 53.0, 56.0, 66.0, 68.0, 59.0, 71.0, 45.0, 57.0, 43.0, 45.0, 42.0, 28.0, 27.0, 17.0, 8.0, 5.0, 20.0, 7.0, 1.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179901123046875, -0.0174102783203125, -0.0168304443359375, -0.0162506103515625, -0.0156707763671875, -0.0150909423828125, -0.0145111083984375, -0.0139312744140625, -0.0133514404296875, -0.0127716064453125, -0.0121917724609375, -0.0116119384765625, -0.0110321044921875, -0.0104522705078125, -0.0098724365234375, -0.0092926025390625, -0.0087127685546875, -0.0081329345703125, -0.0075531005859375, -0.0069732666015625, -0.0063934326171875, -0.0058135986328125, -0.0052337646484375, -0.0046539306640625, -0.0040740966796875, -0.0034942626953125, -0.0029144287109375, -0.0023345947265625, -0.0017547607421875, -0.0011749267578125, -0.0005950927734375, -1.52587890625e-05, 0.0005645751953125, 0.0011444091796875, 0.0017242431640625, 0.0023040771484375, 0.0028839111328125, 0.0034637451171875, 0.0040435791015625, 0.0046234130859375, 0.0052032470703125, 0.0057830810546875, 0.0063629150390625, 0.0069427490234375, 0.0075225830078125, 0.0081024169921875, 0.0086822509765625, 0.0092620849609375, 0.0098419189453125, 0.0104217529296875, 0.0110015869140625, 0.0115814208984375, 0.0121612548828125, 0.0127410888671875, 0.0133209228515625, 0.0139007568359375, 0.0144805908203125, 0.0150604248046875, 0.0156402587890625, 0.0162200927734375, 0.0167999267578125, 0.0173797607421875, 0.0179595947265625, 0.0185394287109375, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 16.0, 23.0, 64.0, 117.0, 210.0, 237.0, 164.0, 92.0, 37.0, 24.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1237847805023193, -2.073493719100952, -2.023202896118164, -1.9729118347167969, -1.9226207733154297, -1.872329831123352, -1.8220388889312744, -1.7717478275299072, -1.7214568853378296, -1.671165943145752, -1.6208748817443848, -1.5705839395523071, -1.5202929973602295, -1.4700019359588623, -1.4197109937667847, -1.369420051574707, -1.3191289901733398, -1.2688380479812622, -1.218546986579895, -1.1682560443878174, -1.1179649829864502, -1.0676740407943726, -1.017383098602295, -0.9670920968055725, -0.9168010950088501, -0.8665100932121277, -0.8162190914154053, -0.7659281492233276, -0.7156371474266052, -0.6653461456298828, -0.6150552034378052, -0.5647642016410828, -0.5144731998443604, -0.46418219804763794, -0.4138912260532379, -0.3636002540588379, -0.3133092522621155, -0.26301825046539307, -0.21272727847099304, -0.16243630647659302, -0.1121453046798706, -0.06185431778430939, -0.011563330888748169, 0.03872765600681305, 0.08901864290237427, 0.13930964469909668, 0.1896006166934967, 0.23989158868789673, 0.29018259048461914, 0.34047359228134155, 0.3907645642757416, 0.4410555362701416, 0.491346538066864, 0.5416375398635864, 0.5919284820556641, 0.6422194838523865, 0.6925104856491089, 0.7428014874458313, 0.7930924892425537, 0.8433834314346313, 0.8936744332313538, 0.9439654350280762, 0.9942563772201538, 1.0445473194122314, 1.0948383808135986]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 10.0, 14.0, 13.0, 13.0, 21.0, 32.0, 25.0, 25.0, 43.0, 35.0, 39.0, 36.0, 36.0, 37.0, 44.0, 45.0, 39.0, 41.0, 40.0, 43.0, 40.0, 40.0, 40.0, 35.0, 34.0, 24.0, 21.0, 24.0, 17.0, 15.0, 11.0, 9.0, 11.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.4222990870475769, -0.41003358364105225, -0.3977680802345276, -0.38550257682800293, -0.37323707342147827, -0.3609715700149536, -0.34870606660842896, -0.3364405632019043, -0.32417505979537964, -0.311909556388855, -0.2996440529823303, -0.28737854957580566, -0.275113046169281, -0.26284754276275635, -0.2505820393562317, -0.23831652104854584, -0.22605100274085999, -0.21378549933433533, -0.20151999592781067, -0.189254492521286, -0.17698898911476135, -0.1647234857082367, -0.15245796740055084, -0.14019246399402618, -0.12792696058750153, -0.11566145718097687, -0.10339595377445221, -0.09113044291734695, -0.0788649395108223, -0.06659943610429764, -0.05433392524719238, -0.042068421840667725, -0.02980288863182068, -0.01753738336265087, -0.005271878093481064, 0.006993629038333893, 0.01925913244485855, 0.03152463585138321, 0.043790146708488464, 0.05605565011501312, 0.06832115352153778, 0.08058665692806244, 0.0928521603345871, 0.10511767119169235, 0.11738317459821701, 0.12964868545532227, 0.14191418886184692, 0.15417969226837158, 0.16644519567489624, 0.1787106990814209, 0.19097620248794556, 0.20324170589447021, 0.21550720930099487, 0.22777271270751953, 0.24003823101520538, 0.25230371952056885, 0.2645692229270935, 0.27683472633361816, 0.2891002297401428, 0.3013657331466675, 0.31363123655319214, 0.3258967399597168, 0.33816224336624146, 0.3504277467727661, 0.36269327998161316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 7.0, 15.0, 20.0, 26.0, 55.0, 78.0, 114.0, 155.0, 246.0, 389.0, 573.0, 1034.0, 1737.0, 3066.0, 5587.0, 10471.0, 22530.0, 57423.0, 212048.0, 499490.0, 149416.0, 45008.0, 18690.0, 9018.0, 4624.0, 2624.0, 1553.0, 992.0, 551.0, 370.0, 211.0, 143.0, 99.0, 59.0, 41.0, 36.0, 19.0, 15.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16472816467285156, -0.15892410278320312, -0.1531200408935547, -0.14731597900390625, -0.1415119171142578, -0.13570785522460938, -0.12990379333496094, -0.1240997314453125, -0.11829566955566406, -0.11249160766601562, -0.10668754577636719, -0.10088348388671875, -0.09507942199707031, -0.08927536010742188, -0.08347129821777344, -0.077667236328125, -0.07186317443847656, -0.06605911254882812, -0.06025505065917969, -0.05445098876953125, -0.04864692687988281, -0.042842864990234375, -0.03703880310058594, -0.0312347412109375, -0.025430679321289062, -0.019626617431640625, -0.013822555541992188, -0.00801849365234375, -0.0022144317626953125, 0.003589630126953125, 0.009393692016601562, 0.01519775390625, 0.021001815795898438, 0.026805877685546875, 0.03260993957519531, 0.03841400146484375, 0.04421806335449219, 0.050022125244140625, 0.05582618713378906, 0.0616302490234375, 0.06743431091308594, 0.07323837280273438, 0.07904243469238281, 0.08484649658203125, 0.09065055847167969, 0.09645462036132812, 0.10225868225097656, 0.108062744140625, 0.11386680603027344, 0.11967086791992188, 0.1254749298095703, 0.13127899169921875, 0.1370830535888672, 0.14288711547851562, 0.14869117736816406, 0.1544952392578125, 0.16029930114746094, 0.16610336303710938, 0.1719074249267578, 0.17771148681640625, 0.1835155487060547, 0.18931961059570312, 0.19512367248535156, 0.200927734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 18.0, 15.0, 9.0, 27.0, 25.0, 19.0, 23.0, 33.0, 33.0, 37.0, 33.0, 53.0, 38.0, 44.0, 32.0, 49.0, 47.0, 55.0, 28.0, 51.0, 46.0, 27.0, 40.0, 19.0, 34.0, 18.0, 23.0, 20.0, 14.0, 14.0, 13.0, 6.0, 12.0, 1.0, 5.0, 9.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6416015625, -0.6213302612304688, -0.6010589599609375, -0.5807876586914062, -0.560516357421875, -0.5402450561523438, -0.5199737548828125, -0.49970245361328125, -0.47943115234375, -0.45915985107421875, -0.4388885498046875, -0.41861724853515625, -0.398345947265625, -0.37807464599609375, -0.3578033447265625, -0.33753204345703125, -0.3172607421875, -0.29698944091796875, -0.2767181396484375, -0.25644683837890625, -0.236175537109375, -0.21590423583984375, -0.1956329345703125, -0.17536163330078125, -0.15509033203125, -0.13481903076171875, -0.1145477294921875, -0.09427642822265625, -0.074005126953125, -0.05373382568359375, -0.0334625244140625, -0.01319122314453125, 0.007080078125, 0.02735137939453125, 0.0476226806640625, 0.06789398193359375, 0.088165283203125, 0.10843658447265625, 0.1287078857421875, 0.14897918701171875, 0.16925048828125, 0.18952178955078125, 0.2097930908203125, 0.23006439208984375, 0.250335693359375, 0.27060699462890625, 0.2908782958984375, 0.31114959716796875, 0.3314208984375, 0.35169219970703125, 0.3719635009765625, 0.39223480224609375, 0.412506103515625, 0.43277740478515625, 0.4530487060546875, 0.47332000732421875, 0.49359130859375, 0.5138626098632812, 0.5341339111328125, 0.5544052124023438, 0.574676513671875, 0.5949478149414062, 0.6152191162109375, 0.6354904174804688, 0.65576171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 5.0, 7.0, 7.0, 11.0, 20.0, 20.0, 31.0, 45.0, 35.0, 64.0, 63.0, 105.0, 140.0, 230.0, 399.0, 907.0, 2536.0, 8960.0, 50186.0, 777342.0, 182263.0, 17903.0, 4347.0, 1399.0, 565.0, 298.0, 182.0, 116.0, 78.0, 53.0, 47.0, 47.0, 28.0, 34.0, 18.0, 17.0, 13.0, 5.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.51806640625, -0.5035667419433594, -0.48906707763671875, -0.4745674133300781, -0.4600677490234375, -0.4455680847167969, -0.43106842041015625, -0.4165687561035156, -0.402069091796875, -0.3875694274902344, -0.37306976318359375, -0.3585700988769531, -0.3440704345703125, -0.3295707702636719, -0.31507110595703125, -0.3005714416503906, -0.28607177734375, -0.2715721130371094, -0.25707244873046875, -0.24257278442382812, -0.2280731201171875, -0.21357345581054688, -0.19907379150390625, -0.18457412719726562, -0.170074462890625, -0.15557479858398438, -0.14107513427734375, -0.12657546997070312, -0.1120758056640625, -0.09757614135742188, -0.08307647705078125, -0.06857681274414062, -0.0540771484375, -0.039577484130859375, -0.02507781982421875, -0.010578155517578125, 0.0039215087890625, 0.018421173095703125, 0.03292083740234375, 0.047420501708984375, 0.061920166015625, 0.07641983032226562, 0.09091949462890625, 0.10541915893554688, 0.1199188232421875, 0.13441848754882812, 0.14891815185546875, 0.16341781616210938, 0.17791748046875, 0.19241714477539062, 0.20691680908203125, 0.22141647338867188, 0.2359161376953125, 0.2504158020019531, 0.26491546630859375, 0.2794151306152344, 0.293914794921875, 0.3084144592285156, 0.32291412353515625, 0.3374137878417969, 0.3519134521484375, 0.3664131164550781, 0.38091278076171875, 0.3954124450683594, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 8.0, 12.0, 12.0, 16.0, 28.0, 24.0, 14.0, 23.0, 31.0, 29.0, 35.0, 37.0, 33.0, 51.0, 57.0, 47.0, 51.0, 57.0, 47.0, 36.0, 50.0, 50.0, 36.0, 29.0, 27.0, 23.0, 30.0, 26.0, 10.0, 20.0, 7.0, 8.0, 7.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7721786499023438, -0.7489471435546875, -0.7257156372070312, -0.702484130859375, -0.6792526245117188, -0.6560211181640625, -0.6327896118164062, -0.60955810546875, -0.5863265991210938, -0.5630950927734375, -0.5398635864257812, -0.516632080078125, -0.49340057373046875, -0.4701690673828125, -0.44693756103515625, -0.4237060546875, -0.40047454833984375, -0.3772430419921875, -0.35401153564453125, -0.330780029296875, -0.30754852294921875, -0.2843170166015625, -0.26108551025390625, -0.23785400390625, -0.21462249755859375, -0.1913909912109375, -0.16815948486328125, -0.144927978515625, -0.12169647216796875, -0.0984649658203125, -0.07523345947265625, -0.052001953125, -0.02877044677734375, -0.0055389404296875, 0.01769256591796875, 0.040924072265625, 0.06415557861328125, 0.0873870849609375, 0.11061859130859375, 0.13385009765625, 0.15708160400390625, 0.1803131103515625, 0.20354461669921875, 0.226776123046875, 0.25000762939453125, 0.2732391357421875, 0.29647064208984375, 0.3197021484375, 0.34293365478515625, 0.3661651611328125, 0.38939666748046875, 0.412628173828125, 0.43585968017578125, 0.4590911865234375, 0.48232269287109375, 0.50555419921875, 0.5287857055664062, 0.5520172119140625, 0.5752487182617188, 0.598480224609375, 0.6217117309570312, 0.6449432373046875, 0.6681747436523438, 0.69140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 9.0, 12.0, 24.0, 27.0, 50.0, 88.0, 114.0, 242.0, 440.0, 1079.0, 2847.0, 10486.0, 65506.0, 848404.0, 99958.0, 13405.0, 3406.0, 1276.0, 535.0, 269.0, 148.0, 73.0, 55.0, 26.0, 18.0, 10.0, 10.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.1607503890991211, -0.1565837860107422, -0.15241718292236328, -0.14825057983398438, -0.14408397674560547, -0.13991737365722656, -0.13575077056884766, -0.13158416748046875, -0.12741756439208984, -0.12325096130371094, -0.11908435821533203, -0.11491775512695312, -0.11075115203857422, -0.10658454895019531, -0.1024179458618164, -0.0982513427734375, -0.0940847396850586, -0.08991813659667969, -0.08575153350830078, -0.08158493041992188, -0.07741832733154297, -0.07325172424316406, -0.06908512115478516, -0.06491851806640625, -0.060751914978027344, -0.05658531188964844, -0.05241870880126953, -0.048252105712890625, -0.04408550262451172, -0.03991889953613281, -0.035752296447753906, -0.031585693359375, -0.027419090270996094, -0.023252487182617188, -0.01908588409423828, -0.014919281005859375, -0.010752677917480469, -0.0065860748291015625, -0.0024194717407226562, 0.00174713134765625, 0.005913734436035156, 0.010080337524414062, 0.014246940612792969, 0.018413543701171875, 0.02258014678955078, 0.026746749877929688, 0.030913352966308594, 0.0350799560546875, 0.039246559143066406, 0.04341316223144531, 0.04757976531982422, 0.051746368408203125, 0.05591297149658203, 0.06007957458496094, 0.06424617767333984, 0.06841278076171875, 0.07257938385009766, 0.07674598693847656, 0.08091259002685547, 0.08507919311523438, 0.08924579620361328, 0.09341239929199219, 0.0975790023803711, 0.10174560546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 10.0, 10.0, 12.0, 16.0, 19.0, 28.0, 44.0, 75.0, 152.0, 149.0, 176.0, 83.0, 64.0, 38.0, 23.0, 27.0, 23.0, 7.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8656253814697266e-05, -1.815054565668106e-05, -1.7644837498664856e-05, -1.713912934064865e-05, -1.6633421182632446e-05, -1.612771302461624e-05, -1.5622004866600037e-05, -1.5116296708583832e-05, -1.4610588550567627e-05, -1.4104880392551422e-05, -1.3599172234535217e-05, -1.3093464076519012e-05, -1.2587755918502808e-05, -1.2082047760486603e-05, -1.1576339602470398e-05, -1.1070631444454193e-05, -1.0564923286437988e-05, -1.0059215128421783e-05, -9.553506970405579e-06, -9.047798812389374e-06, -8.542090654373169e-06, -8.036382496356964e-06, -7.530674338340759e-06, -7.0249661803245544e-06, -6.51925802230835e-06, -6.013549864292145e-06, -5.50784170627594e-06, -5.002133548259735e-06, -4.49642539024353e-06, -3.9907172322273254e-06, -3.4850090742111206e-06, -2.9793009161949158e-06, -2.473592758178711e-06, -1.967884600162506e-06, -1.4621764421463013e-06, -9.564682841300964e-07, -4.507601261138916e-07, 5.494803190231323e-08, 5.606561899185181e-07, 1.066364347934723e-06, 1.5720725059509277e-06, 2.0777806639671326e-06, 2.5834888219833374e-06, 3.0891969799995422e-06, 3.594905138015747e-06, 4.100613296031952e-06, 4.606321454048157e-06, 5.1120296120643616e-06, 5.617737770080566e-06, 6.123445928096771e-06, 6.629154086112976e-06, 7.134862244129181e-06, 7.640570402145386e-06, 8.14627856016159e-06, 8.651986718177795e-06, 9.157694876194e-06, 9.663403034210205e-06, 1.016911119222641e-05, 1.0674819350242615e-05, 1.118052750825882e-05, 1.1686235666275024e-05, 1.219194382429123e-05, 1.2697651982307434e-05, 1.3203360140323639e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 13.0, 8.0, 19.0, 37.0, 35.0, 71.0, 133.0, 259.0, 518.0, 1150.0, 3111.0, 9861.0, 45615.0, 672559.0, 275747.0, 28397.0, 6984.0, 2262.0, 848.0, 396.0, 192.0, 120.0, 70.0, 40.0, 23.0, 21.0, 8.0, 11.0, 7.0, 5.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.101806640625, -0.09839725494384766, -0.09498786926269531, -0.09157848358154297, -0.08816909790039062, -0.08475971221923828, -0.08135032653808594, -0.0779409408569336, -0.07453155517578125, -0.0711221694946289, -0.06771278381347656, -0.06430339813232422, -0.060894012451171875, -0.05748462677001953, -0.05407524108886719, -0.050665855407714844, -0.0472564697265625, -0.043847084045410156, -0.04043769836425781, -0.03702831268310547, -0.033618927001953125, -0.03020954132080078, -0.026800155639648438, -0.023390769958496094, -0.01998138427734375, -0.016571998596191406, -0.013162612915039062, -0.009753227233886719, -0.006343841552734375, -0.0029344558715820312, 0.0004749298095703125, 0.0038843154907226562, 0.007293701171875, 0.010703086853027344, 0.014112472534179688, 0.01752185821533203, 0.020931243896484375, 0.02434062957763672, 0.027750015258789062, 0.031159400939941406, 0.03456878662109375, 0.037978172302246094, 0.04138755798339844, 0.04479694366455078, 0.048206329345703125, 0.05161571502685547, 0.05502510070800781, 0.058434486389160156, 0.0618438720703125, 0.06525325775146484, 0.06866264343261719, 0.07207202911376953, 0.07548141479492188, 0.07889080047607422, 0.08230018615722656, 0.0857095718383789, 0.08911895751953125, 0.0925283432006836, 0.09593772888183594, 0.09934711456298828, 0.10275650024414062, 0.10616588592529297, 0.10957527160644531, 0.11298465728759766, 0.11639404296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 7.0, 9.0, 20.0, 24.0, 39.0, 44.0, 70.0, 94.0, 139.0, 147.0, 114.0, 70.0, 47.0, 38.0, 27.0, 18.0, 16.0, 11.0, 13.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.037109375, -0.03587675094604492, -0.034644126892089844, -0.033411502838134766, -0.03217887878417969, -0.03094625473022461, -0.02971363067626953, -0.028481006622314453, -0.027248382568359375, -0.026015758514404297, -0.02478313446044922, -0.02355051040649414, -0.022317886352539062, -0.021085262298583984, -0.019852638244628906, -0.018620014190673828, -0.01738739013671875, -0.016154766082763672, -0.014922142028808594, -0.013689517974853516, -0.012456893920898438, -0.01122426986694336, -0.009991645812988281, -0.008759021759033203, -0.007526397705078125, -0.006293773651123047, -0.005061149597167969, -0.0038285255432128906, -0.0025959014892578125, -0.0013632774353027344, -0.00013065338134765625, 0.0011019706726074219, 0.0023345947265625, 0.003567218780517578, 0.004799842834472656, 0.006032466888427734, 0.0072650909423828125, 0.00849771499633789, 0.009730339050292969, 0.010962963104248047, 0.012195587158203125, 0.013428211212158203, 0.014660835266113281, 0.01589345932006836, 0.017126083374023438, 0.018358707427978516, 0.019591331481933594, 0.020823955535888672, 0.02205657958984375, 0.023289203643798828, 0.024521827697753906, 0.025754451751708984, 0.026987075805664062, 0.02821969985961914, 0.02945232391357422, 0.030684947967529297, 0.031917572021484375, 0.03315019607543945, 0.03438282012939453, 0.03561544418334961, 0.03684806823730469, 0.038080692291259766, 0.039313316345214844, 0.04054594039916992, 0.041778564453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 23.0, 50.0, 110.0, 205.0, 255.0, 197.0, 95.0, 37.0, 19.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.405527591705322, -4.316229820251465, -4.226932048797607, -4.13763427734375, -4.048336505889893, -3.959038734436035, -3.8697409629821777, -3.780442953109741, -3.691145181655884, -3.6018474102020264, -3.512549638748169, -3.4232518672943115, -3.333954095840454, -3.2446560859680176, -3.15535831451416, -3.0660605430603027, -2.9767627716064453, -2.887465000152588, -2.7981672286987305, -2.708869457244873, -2.6195716857910156, -2.530273914337158, -2.440976142883301, -2.3516781330108643, -2.262380599975586, -2.1730828285217285, -2.083785057067871, -1.9944872856140137, -1.9051893949508667, -1.8158916234970093, -1.7265938520431519, -1.6372959613800049, -1.547998070716858, -1.4587002992630005, -1.369402527809143, -1.280104637145996, -1.1908068656921387, -1.1015090942382812, -1.0122113227844238, -0.9229134917259216, -0.8336157202720642, -0.7443179488182068, -0.6550201177597046, -0.5657223463058472, -0.47642454504966736, -0.38712674379348755, -0.2978289723396301, -0.20853114128112793, -0.11923336982727051, -0.029935576021671295, 0.05936221778392792, 0.14866000413894653, 0.23795780539512634, 0.32725560665130615, 0.4165533781051636, 0.5058512091636658, 0.5951489806175232, 0.6844467520713806, 0.7737445831298828, 0.8630423545837402, 0.9523401260375977, 1.041637897491455, 1.1309356689453125, 1.2202335596084595, 1.309531331062317]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 6.0, 2.0, 6.0, 12.0, 8.0, 7.0, 11.0, 10.0, 23.0, 15.0, 15.0, 23.0, 26.0, 38.0, 32.0, 45.0, 34.0, 37.0, 41.0, 34.0, 48.0, 40.0, 47.0, 47.0, 38.0, 29.0, 31.0, 35.0, 23.0, 21.0, 33.0, 28.0, 24.0, 20.0, 22.0, 13.0, 11.0, 12.0, 10.0, 8.0, 5.0, 7.0, 4.0, 10.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0377143621444702, -1.0079102516174316, -0.9781060218811035, -0.9483018517494202, -0.9184976816177368, -0.8886935710906982, -0.8588893413543701, -0.8290852308273315, -0.7992810606956482, -0.7694768905639648, -0.7396727204322815, -0.7098685503005981, -0.6800643801689148, -0.6502602100372314, -0.6204560995101929, -0.5906519293785095, -0.5608477592468262, -0.5310435891151428, -0.5012394189834595, -0.4714352488517761, -0.44163110852241516, -0.4118269383907318, -0.38202276825904846, -0.3522186279296875, -0.3224143981933594, -0.292610228061676, -0.2628060579299927, -0.23300190269947052, -0.20319774746894836, -0.17339357733726501, -0.14358940720558167, -0.11378525197505951, -0.08398109674453735, -0.0541769340634346, -0.02437276765704155, 0.0054313987493515015, 0.035235561430454254, 0.065039724111557, 0.09484389424324036, 0.12464804947376251, 0.15445221960544586, 0.1842563897371292, 0.21406054496765137, 0.24386471509933472, 0.27366888523101807, 0.3034730553627014, 0.33327722549438477, 0.3630813658237457, 0.3928855359554291, 0.4226897060871124, 0.4524938762187958, 0.48229801654815674, 0.5121021866798401, 0.5419063568115234, 0.5717105269432068, 0.6015146970748901, 0.6313188672065735, 0.6611230373382568, 0.6909272074699402, 0.7207313776016235, 0.7505355477333069, 0.7803397178649902, 0.8101438283920288, 0.8399479985237122, 0.8697521686553955]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 6.0, 11.0, 12.0, 20.0, 28.0, 38.0, 52.0, 101.0, 191.0, 368.0, 665.0, 1303.0, 2569.0, 5659.0, 14074.0, 48434.0, 298387.0, 2137336.0, 1473472.0, 161060.0, 30380.0, 10894.0, 4602.0, 2203.0, 1074.0, 563.0, 309.0, 161.0, 112.0, 62.0, 42.0, 22.0, 13.0, 17.0, 16.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66943359375, -0.6462478637695312, -0.6230621337890625, -0.5998764038085938, -0.576690673828125, -0.5535049438476562, -0.5303192138671875, -0.5071334838867188, -0.48394775390625, -0.46076202392578125, -0.4375762939453125, -0.41439056396484375, -0.391204833984375, -0.36801910400390625, -0.3448333740234375, -0.32164764404296875, -0.2984619140625, -0.27527618408203125, -0.2520904541015625, -0.22890472412109375, -0.205718994140625, -0.18253326416015625, -0.1593475341796875, -0.13616180419921875, -0.11297607421875, -0.08979034423828125, -0.0666046142578125, -0.04341888427734375, -0.020233154296875, 0.00295257568359375, 0.0261383056640625, 0.04932403564453125, 0.072509765625, 0.09569549560546875, 0.1188812255859375, 0.14206695556640625, 0.165252685546875, 0.18843841552734375, 0.2116241455078125, 0.23480987548828125, 0.25799560546875, 0.28118133544921875, 0.3043670654296875, 0.32755279541015625, 0.350738525390625, 0.37392425537109375, 0.3971099853515625, 0.42029571533203125, 0.4434814453125, 0.46666717529296875, 0.4898529052734375, 0.5130386352539062, 0.536224365234375, 0.5594100952148438, 0.5825958251953125, 0.6057815551757812, 0.62896728515625, 0.6521530151367188, 0.6753387451171875, 0.6985244750976562, 0.721710205078125, 0.7448959350585938, 0.7680816650390625, 0.7912673950195312, 0.814453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 8.0, 6.0, 12.0, 17.0, 36.0, 21.0, 36.0, 31.0, 43.0, 45.0, 47.0, 51.0, 50.0, 48.0, 64.0, 46.0, 59.0, 51.0, 44.0, 53.0, 45.0, 28.0, 23.0, 24.0, 21.0, 18.0, 12.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4658851623535156, -0.44959259033203125, -0.4333000183105469, -0.4170074462890625, -0.4007148742675781, -0.38442230224609375, -0.3681297302246094, -0.351837158203125, -0.3355445861816406, -0.31925201416015625, -0.3029594421386719, -0.2866668701171875, -0.2703742980957031, -0.25408172607421875, -0.23778915405273438, -0.22149658203125, -0.20520401000976562, -0.18891143798828125, -0.17261886596679688, -0.1563262939453125, -0.14003372192382812, -0.12374114990234375, -0.10744857788085938, -0.091156005859375, -0.07486343383789062, -0.05857086181640625, -0.042278289794921875, -0.0259857177734375, -0.009693145751953125, 0.00659942626953125, 0.022891998291015625, 0.0391845703125, 0.055477142333984375, 0.07176971435546875, 0.08806228637695312, 0.1043548583984375, 0.12064743041992188, 0.13694000244140625, 0.15323257446289062, 0.169525146484375, 0.18581771850585938, 0.20211029052734375, 0.21840286254882812, 0.2346954345703125, 0.2509880065917969, 0.26728057861328125, 0.2835731506347656, 0.29986572265625, 0.3161582946777344, 0.33245086669921875, 0.3487434387207031, 0.3650360107421875, 0.3813285827636719, 0.39762115478515625, 0.4139137268066406, 0.430206298828125, 0.4464988708496094, 0.46279144287109375, 0.4790840148925781, 0.4953765869140625, 0.5116691589355469, 0.5279617309570312, 0.5442543029785156, 0.560546875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 2.0, 11.0, 10.0, 20.0, 57.0, 127.0, 377.0, 2546.0, 721511.0, 3465932.0, 2991.0, 436.0, 130.0, 60.0, 23.0, 17.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.04296875, -6.871368408203125, -6.69976806640625, -6.528167724609375, -6.3565673828125, -6.184967041015625, -6.01336669921875, -5.841766357421875, -5.670166015625, -5.498565673828125, -5.32696533203125, -5.155364990234375, -4.9837646484375, -4.812164306640625, -4.64056396484375, -4.468963623046875, -4.29736328125, -4.125762939453125, -3.95416259765625, -3.782562255859375, -3.6109619140625, -3.439361572265625, -3.26776123046875, -3.096160888671875, -2.924560546875, -2.752960205078125, -2.58135986328125, -2.409759521484375, -2.2381591796875, -2.066558837890625, -1.89495849609375, -1.723358154296875, -1.5517578125, -1.380157470703125, -1.20855712890625, -1.036956787109375, -0.8653564453125, -0.693756103515625, -0.52215576171875, -0.350555419921875, -0.178955078125, -0.007354736328125, 0.16424560546875, 0.335845947265625, 0.5074462890625, 0.679046630859375, 0.85064697265625, 1.022247314453125, 1.19384765625, 1.365447998046875, 1.53704833984375, 1.708648681640625, 1.8802490234375, 2.051849365234375, 2.22344970703125, 2.395050048828125, 2.566650390625, 2.738250732421875, 2.90985107421875, 3.081451416015625, 3.2530517578125, 3.424652099609375, 3.59625244140625, 3.767852783203125, 3.939453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 8.0, 11.0, 21.0, 39.0, 69.0, 104.0, 168.0, 361.0, 755.0, 1198.0, 629.0, 297.0, 147.0, 83.0, 63.0, 29.0, 23.0, 12.0, 14.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.415283203125, -0.4035491943359375, -0.391815185546875, -0.3800811767578125, -0.36834716796875, -0.3566131591796875, -0.344879150390625, -0.3331451416015625, -0.3214111328125, -0.3096771240234375, -0.297943115234375, -0.2862091064453125, -0.27447509765625, -0.2627410888671875, -0.251007080078125, -0.2392730712890625, -0.2275390625, -0.2158050537109375, -0.204071044921875, -0.1923370361328125, -0.18060302734375, -0.1688690185546875, -0.157135009765625, -0.1454010009765625, -0.1336669921875, -0.1219329833984375, -0.110198974609375, -0.0984649658203125, -0.08673095703125, -0.0749969482421875, -0.063262939453125, -0.0515289306640625, -0.039794921875, -0.0280609130859375, -0.016326904296875, -0.0045928955078125, 0.00714111328125, 0.0188751220703125, 0.030609130859375, 0.0423431396484375, 0.0540771484375, 0.0658111572265625, 0.077545166015625, 0.0892791748046875, 0.10101318359375, 0.1127471923828125, 0.124481201171875, 0.1362152099609375, 0.14794921875, 0.1596832275390625, 0.171417236328125, 0.1831512451171875, 0.19488525390625, 0.2066192626953125, 0.218353271484375, 0.2300872802734375, 0.2418212890625, 0.2535552978515625, 0.265289306640625, 0.2770233154296875, 0.28875732421875, 0.3004913330078125, 0.312225341796875, 0.3239593505859375, 0.335693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 15.0, 23.0, 34.0, 37.0, 67.0, 96.0, 103.0, 117.0, 106.0, 96.0, 81.0, 77.0, 39.0, 31.0, 21.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5571964979171753, -1.5232477188110352, -1.4892988204956055, -1.4553499221801758, -1.4214011430740356, -1.3874523639678955, -1.3535034656524658, -1.3195545673370361, -1.285605788230896, -1.2516570091247559, -1.2177081108093262, -1.1837592124938965, -1.1498104333877563, -1.1158616542816162, -1.0819127559661865, -1.0479638576507568, -1.0140150785446167, -0.9800662398338318, -0.9461174011230469, -0.912168562412262, -0.878219723701477, -0.8442708849906921, -0.8103220462799072, -0.7763732075691223, -0.7424243688583374, -0.7084755301475525, -0.6745266914367676, -0.6405778527259827, -0.6066290140151978, -0.5726801753044128, -0.5387313365936279, -0.504782497882843, -0.47083377838134766, -0.43688493967056274, -0.40293610095977783, -0.3689872622489929, -0.335038423538208, -0.3010895848274231, -0.2671407461166382, -0.23319190740585327, -0.19924306869506836, -0.16529422998428345, -0.13134539127349854, -0.09739655256271362, -0.06344771385192871, -0.0294988751411438, 0.004449963569641113, 0.038398802280426025, 0.07234764099121094, 0.10629647970199585, 0.14024531841278076, 0.17419415712356567, 0.20814299583435059, 0.2420918345451355, 0.2760406732559204, 0.3099895119667053, 0.34393835067749023, 0.37788718938827515, 0.41183602809906006, 0.44578486680984497, 0.4797337055206299, 0.5136825442314148, 0.5476313829421997, 0.5815802216529846, 0.6155290603637695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 32.0, 41.0, 41.0, 33.0, 36.0, 41.0, 51.0, 58.0, 51.0, 48.0, 40.0, 44.0, 42.0, 41.0, 32.0, 35.0, 24.0, 30.0, 14.0, 20.0, 15.0, 22.0, 23.0, 14.0, 8.0, 8.0, 8.0, 10.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5627540349960327, -0.5461817383766174, -0.5296093821525574, -0.5130370855331421, -0.4964647889137268, -0.47989246249198914, -0.46332013607025146, -0.4467478394508362, -0.4301755130290985, -0.41360318660736084, -0.39703088998794556, -0.3804585635662079, -0.3638862371444702, -0.34731394052505493, -0.33074161410331726, -0.3141692876815796, -0.2975969910621643, -0.28102466464042664, -0.26445236802101135, -0.24788004159927368, -0.2313077300786972, -0.21473541855812073, -0.19816309213638306, -0.18159078061580658, -0.1650184690952301, -0.14844615757465363, -0.13187384605407715, -0.11530151963233948, -0.098729208111763, -0.08215689659118652, -0.06558457762002945, -0.049012258648872375, -0.03243991732597351, -0.015867602080106735, 0.0007047131657600403, 0.017277028411626816, 0.03384934365749359, 0.05042165517807007, 0.06699397414922714, 0.08356629312038422, 0.1001386046409607, 0.11671091616153717, 0.13328322768211365, 0.14985555410385132, 0.1664278656244278, 0.18300017714500427, 0.19957250356674194, 0.21614481508731842, 0.2327171266078949, 0.24928943812847137, 0.26586174964904785, 0.2824340760707855, 0.2990064024925232, 0.3155786991119385, 0.33215102553367615, 0.3487233519554138, 0.3652956485748291, 0.3818679749965668, 0.39844027161598206, 0.4150125980377197, 0.431584894657135, 0.4481572210788727, 0.46472954750061035, 0.48130184412002563, 0.4978741705417633]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 22.0, 34.0, 77.0, 107.0, 210.0, 367.0, 718.0, 1344.0, 2875.0, 5810.0, 13400.0, 31588.0, 76092.0, 184385.0, 356732.0, 217726.0, 90977.0, 37119.0, 15361.0, 7021.0, 3207.0, 1602.0, 818.0, 409.0, 243.0, 134.0, 63.0, 37.0, 23.0, 15.0, 11.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24895668029785156, -0.24107742309570312, -0.2331981658935547, -0.22531890869140625, -0.2174396514892578, -0.20956039428710938, -0.20168113708496094, -0.1938018798828125, -0.18592262268066406, -0.17804336547851562, -0.1701641082763672, -0.16228485107421875, -0.1544055938720703, -0.14652633666992188, -0.13864707946777344, -0.130767822265625, -0.12288856506347656, -0.11500930786132812, -0.10713005065917969, -0.09925079345703125, -0.09137153625488281, -0.08349227905273438, -0.07561302185058594, -0.0677337646484375, -0.05985450744628906, -0.051975250244140625, -0.04409599304199219, -0.03621673583984375, -0.028337478637695312, -0.020458221435546875, -0.012578964233398438, -0.00469970703125, 0.0031795501708984375, 0.011058807373046875, 0.018938064575195312, 0.02681732177734375, 0.03469657897949219, 0.042575836181640625, 0.05045509338378906, 0.0583343505859375, 0.06621360778808594, 0.07409286499023438, 0.08197212219238281, 0.08985137939453125, 0.09773063659667969, 0.10560989379882812, 0.11348915100097656, 0.121368408203125, 0.12924766540527344, 0.13712692260742188, 0.1450061798095703, 0.15288543701171875, 0.1607646942138672, 0.16864395141601562, 0.17652320861816406, 0.1844024658203125, 0.19228172302246094, 0.20016098022460938, 0.2080402374267578, 0.21591949462890625, 0.2237987518310547, 0.23167800903320312, 0.23955726623535156, 0.2474365234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 14.0, 16.0, 17.0, 17.0, 29.0, 29.0, 38.0, 32.0, 42.0, 41.0, 48.0, 56.0, 55.0, 64.0, 58.0, 48.0, 52.0, 45.0, 54.0, 42.0, 26.0, 30.0, 28.0, 19.0, 19.0, 23.0, 14.0, 10.0, 15.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.42119598388671875, -0.4080657958984375, -0.39493560791015625, -0.381805419921875, -0.36867523193359375, -0.3555450439453125, -0.34241485595703125, -0.32928466796875, -0.31615447998046875, -0.3030242919921875, -0.28989410400390625, -0.276763916015625, -0.26363372802734375, -0.2505035400390625, -0.23737335205078125, -0.2242431640625, -0.21111297607421875, -0.1979827880859375, -0.18485260009765625, -0.171722412109375, -0.15859222412109375, -0.1454620361328125, -0.13233184814453125, -0.11920166015625, -0.10607147216796875, -0.0929412841796875, -0.07981109619140625, -0.066680908203125, -0.05355072021484375, -0.0404205322265625, -0.02729034423828125, -0.01416015625, -0.00102996826171875, 0.0121002197265625, 0.02523040771484375, 0.038360595703125, 0.05149078369140625, 0.0646209716796875, 0.07775115966796875, 0.09088134765625, 0.10401153564453125, 0.1171417236328125, 0.13027191162109375, 0.143402099609375, 0.15653228759765625, 0.1696624755859375, 0.18279266357421875, 0.1959228515625, 0.20905303955078125, 0.2221832275390625, 0.23531341552734375, 0.248443603515625, 0.26157379150390625, 0.2747039794921875, 0.28783416748046875, 0.30096435546875, 0.31409454345703125, 0.3272247314453125, 0.34035491943359375, 0.353485107421875, 0.36661529541015625, 0.3797454833984375, 0.39287567138671875, 0.406005859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 12.0, 16.0, 27.0, 43.0, 70.0, 176.0, 423.0, 959.0, 3360.0, 13699.0, 78940.0, 528683.0, 358609.0, 50168.0, 9350.0, 2519.0, 848.0, 325.0, 137.0, 68.0, 44.0, 21.0, 24.0, 5.0, 7.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.5245552062988281, -0.5090713500976562, -0.4935874938964844, -0.4781036376953125, -0.4626197814941406, -0.44713592529296875, -0.4316520690917969, -0.416168212890625, -0.4006843566894531, -0.38520050048828125, -0.3697166442871094, -0.3542327880859375, -0.3387489318847656, -0.32326507568359375, -0.3077812194824219, -0.29229736328125, -0.2768135070800781, -0.26132965087890625, -0.24584579467773438, -0.2303619384765625, -0.21487808227539062, -0.19939422607421875, -0.18391036987304688, -0.168426513671875, -0.15294265747070312, -0.13745880126953125, -0.12197494506835938, -0.1064910888671875, -0.09100723266601562, -0.07552337646484375, -0.060039520263671875, -0.0445556640625, -0.029071807861328125, -0.01358795166015625, 0.001895904541015625, 0.0173797607421875, 0.032863616943359375, 0.04834747314453125, 0.06383132934570312, 0.079315185546875, 0.09479904174804688, 0.11028289794921875, 0.12576675415039062, 0.1412506103515625, 0.15673446655273438, 0.17221832275390625, 0.18770217895507812, 0.20318603515625, 0.21866989135742188, 0.23415374755859375, 0.24963760375976562, 0.2651214599609375, 0.2806053161621094, 0.29608917236328125, 0.3115730285644531, 0.327056884765625, 0.3425407409667969, 0.35802459716796875, 0.3735084533691406, 0.3889923095703125, 0.4044761657714844, 0.41996002197265625, 0.4354438781738281, 0.450927734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 3.0, 7.0, 11.0, 7.0, 12.0, 17.0, 25.0, 20.0, 22.0, 24.0, 35.0, 27.0, 35.0, 35.0, 24.0, 32.0, 35.0, 46.0, 37.0, 31.0, 44.0, 42.0, 39.0, 39.0, 37.0, 33.0, 46.0, 32.0, 29.0, 21.0, 22.0, 16.0, 18.0, 25.0, 7.0, 12.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.59521484375, -0.5749588012695312, -0.5547027587890625, -0.5344467163085938, -0.514190673828125, -0.49393463134765625, -0.4736785888671875, -0.45342254638671875, -0.43316650390625, -0.41291046142578125, -0.3926544189453125, -0.37239837646484375, -0.352142333984375, -0.33188629150390625, -0.3116302490234375, -0.29137420654296875, -0.2711181640625, -0.25086212158203125, -0.2306060791015625, -0.21035003662109375, -0.190093994140625, -0.16983795166015625, -0.1495819091796875, -0.12932586669921875, -0.10906982421875, -0.08881378173828125, -0.0685577392578125, -0.04830169677734375, -0.028045654296875, -0.00778961181640625, 0.0124664306640625, 0.03272247314453125, 0.052978515625, 0.07323455810546875, 0.0934906005859375, 0.11374664306640625, 0.134002685546875, 0.15425872802734375, 0.1745147705078125, 0.19477081298828125, 0.21502685546875, 0.23528289794921875, 0.2555389404296875, 0.27579498291015625, 0.296051025390625, 0.31630706787109375, 0.3365631103515625, 0.35681915283203125, 0.3770751953125, 0.39733123779296875, 0.4175872802734375, 0.43784332275390625, 0.458099365234375, 0.47835540771484375, 0.4986114501953125, 0.5188674926757812, 0.53912353515625, 0.5593795776367188, 0.5796356201171875, 0.5998916625976562, 0.620147705078125, 0.6404037475585938, 0.6606597900390625, 0.6809158325195312, 0.701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 15.0, 29.0, 51.0, 75.0, 135.0, 225.0, 364.0, 649.0, 1301.0, 2535.0, 5617.0, 13629.0, 40155.0, 158484.0, 516153.0, 224654.0, 53934.0, 17226.0, 6829.0, 3153.0, 1475.0, 788.0, 446.0, 255.0, 131.0, 96.0, 50.0, 28.0, 23.0, 14.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.0540165901184082, -0.052308082580566406, -0.05059957504272461, -0.04889106750488281, -0.047182559967041016, -0.04547405242919922, -0.04376554489135742, -0.042057037353515625, -0.04034852981567383, -0.03864002227783203, -0.036931514739990234, -0.03522300720214844, -0.03351449966430664, -0.031805992126464844, -0.030097484588623047, -0.02838897705078125, -0.026680469512939453, -0.024971961975097656, -0.02326345443725586, -0.021554946899414062, -0.019846439361572266, -0.01813793182373047, -0.016429424285888672, -0.014720916748046875, -0.013012409210205078, -0.011303901672363281, -0.009595394134521484, -0.007886886596679688, -0.006178379058837891, -0.004469871520996094, -0.002761363983154297, -0.0010528564453125, 0.0006556510925292969, 0.0023641586303710938, 0.004072666168212891, 0.0057811737060546875, 0.007489681243896484, 0.009198188781738281, 0.010906696319580078, 0.012615203857421875, 0.014323711395263672, 0.01603221893310547, 0.017740726470947266, 0.019449234008789062, 0.02115774154663086, 0.022866249084472656, 0.024574756622314453, 0.02628326416015625, 0.027991771697998047, 0.029700279235839844, 0.03140878677368164, 0.03311729431152344, 0.034825801849365234, 0.03653430938720703, 0.03824281692504883, 0.039951324462890625, 0.04165983200073242, 0.04336833953857422, 0.045076847076416016, 0.04678535461425781, 0.04849386215209961, 0.050202369689941406, 0.0519108772277832, 0.053619384765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 6.0, 15.0, 25.0, 29.0, 54.0, 97.0, 152.0, 173.0, 130.0, 108.0, 70.0, 31.0, 34.0, 17.0, 11.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.838010787963867e-05, -7.603969424962997e-05, -7.369928061962128e-05, -7.135886698961258e-05, -6.901845335960388e-05, -6.667803972959518e-05, -6.433762609958649e-05, -6.199721246957779e-05, -5.965679883956909e-05, -5.7316385209560394e-05, -5.49759715795517e-05, -5.2635557949543e-05, -5.02951443195343e-05, -4.7954730689525604e-05, -4.561431705951691e-05, -4.327390342950821e-05, -4.093348979949951e-05, -3.8593076169490814e-05, -3.625266253948212e-05, -3.391224890947342e-05, -3.157183527946472e-05, -2.9231421649456024e-05, -2.6891008019447327e-05, -2.455059438943863e-05, -2.221018075942993e-05, -1.9869767129421234e-05, -1.7529353499412537e-05, -1.5188939869403839e-05, -1.2848526239395142e-05, -1.0508112609386444e-05, -8.167698979377747e-06, -5.827285349369049e-06, -3.4868717193603516e-06, -1.146458089351654e-06, 1.1939555406570435e-06, 3.534369170665741e-06, 5.8747828006744385e-06, 8.215196430683136e-06, 1.0555610060691833e-05, 1.2896023690700531e-05, 1.5236437320709229e-05, 1.7576850950717926e-05, 1.9917264580726624e-05, 2.225767821073532e-05, 2.459809184074402e-05, 2.6938505470752716e-05, 2.9278919100761414e-05, 3.161933273077011e-05, 3.395974636077881e-05, 3.6300159990787506e-05, 3.8640573620796204e-05, 4.09809872508049e-05, 4.33214008808136e-05, 4.5661814510822296e-05, 4.8002228140830994e-05, 5.034264177083969e-05, 5.268305540084839e-05, 5.5023469030857086e-05, 5.7363882660865784e-05, 5.970429629087448e-05, 6.204470992088318e-05, 6.438512355089188e-05, 6.672553718090057e-05, 6.906595081090927e-05, 7.140636444091797e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 18.0, 27.0, 50.0, 78.0, 125.0, 231.0, 385.0, 850.0, 1974.0, 5439.0, 16495.0, 63447.0, 292651.0, 494909.0, 127484.0, 30042.0, 8807.0, 3065.0, 1239.0, 549.0, 283.0, 137.0, 77.0, 37.0, 37.0, 21.0, 22.0, 7.0, 9.0, 7.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.051788330078125, -0.04995393753051758, -0.048119544982910156, -0.046285152435302734, -0.04445075988769531, -0.04261636734008789, -0.04078197479248047, -0.03894758224487305, -0.037113189697265625, -0.0352787971496582, -0.03344440460205078, -0.03161001205444336, -0.029775619506835938, -0.027941226959228516, -0.026106834411621094, -0.024272441864013672, -0.02243804931640625, -0.020603656768798828, -0.018769264221191406, -0.016934871673583984, -0.015100479125976562, -0.01326608657836914, -0.011431694030761719, -0.009597301483154297, -0.007762908935546875, -0.005928516387939453, -0.004094123840332031, -0.0022597312927246094, -0.0004253387451171875, 0.0014090538024902344, 0.0032434463500976562, 0.005077838897705078, 0.0069122314453125, 0.008746623992919922, 0.010581016540527344, 0.012415409088134766, 0.014249801635742188, 0.01608419418334961, 0.01791858673095703, 0.019752979278564453, 0.021587371826171875, 0.023421764373779297, 0.02525615692138672, 0.02709054946899414, 0.028924942016601562, 0.030759334564208984, 0.032593727111816406, 0.03442811965942383, 0.03626251220703125, 0.03809690475463867, 0.039931297302246094, 0.041765689849853516, 0.04360008239746094, 0.04543447494506836, 0.04726886749267578, 0.0491032600402832, 0.050937652587890625, 0.05277204513549805, 0.05460643768310547, 0.05644083023071289, 0.05827522277832031, 0.060109615325927734, 0.061944007873535156, 0.06377840042114258, 0.06561279296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 13.0, 7.0, 10.0, 10.0, 16.0, 18.0, 17.0, 23.0, 28.0, 35.0, 46.0, 63.0, 69.0, 84.0, 90.0, 78.0, 87.0, 68.0, 48.0, 42.0, 25.0, 34.0, 21.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01470947265625, -0.014224767684936523, -0.013740062713623047, -0.01325535774230957, -0.012770652770996094, -0.012285947799682617, -0.01180124282836914, -0.011316537857055664, -0.010831832885742188, -0.010347127914428711, -0.009862422943115234, -0.009377717971801758, -0.008893013000488281, -0.008408308029174805, -0.007923603057861328, -0.0074388980865478516, -0.006954193115234375, -0.0064694881439208984, -0.005984783172607422, -0.005500078201293945, -0.005015373229980469, -0.004530668258666992, -0.004045963287353516, -0.003561258316040039, -0.0030765533447265625, -0.002591848373413086, -0.0021071434020996094, -0.0016224384307861328, -0.0011377334594726562, -0.0006530284881591797, -0.00016832351684570312, 0.00031638145446777344, 0.00080108642578125, 0.0012857913970947266, 0.0017704963684082031, 0.0022552013397216797, 0.0027399063110351562, 0.003224611282348633, 0.0037093162536621094, 0.004194021224975586, 0.0046787261962890625, 0.005163431167602539, 0.005648136138916016, 0.006132841110229492, 0.006617546081542969, 0.007102251052856445, 0.007586956024169922, 0.008071660995483398, 0.008556365966796875, 0.009041070938110352, 0.009525775909423828, 0.010010480880737305, 0.010495185852050781, 0.010979890823364258, 0.011464595794677734, 0.011949300765991211, 0.012434005737304688, 0.012918710708618164, 0.01340341567993164, 0.013888120651245117, 0.014372825622558594, 0.01485753059387207, 0.015342235565185547, 0.015826940536499023, 0.0163116455078125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 23.0, 39.0, 34.0, 76.0, 93.0, 108.0, 110.0, 120.0, 96.0, 72.0, 74.0, 31.0, 26.0, 23.0, 11.0, 12.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8066639304161072, -0.7877929210662842, -0.768921971321106, -0.750050961971283, -0.7311800122261047, -0.7123090028762817, -0.6934380531311035, -0.6745670437812805, -0.6556960344314575, -0.6368250250816345, -0.6179540753364563, -0.5990830659866333, -0.5802121162414551, -0.5613411068916321, -0.5424701571464539, -0.5235991477966309, -0.5047281980514526, -0.485857218503952, -0.4669862389564514, -0.4481152594089508, -0.4292442798614502, -0.4103732705116272, -0.3915022909641266, -0.372631311416626, -0.35376033186912537, -0.33488935232162476, -0.31601837277412415, -0.29714739322662354, -0.27827638387680054, -0.2594054341316223, -0.24053442478179932, -0.2216634452342987, -0.20279240608215332, -0.1839214265346527, -0.1650504469871521, -0.1461794525384903, -0.12730847299098969, -0.10843749344348907, -0.08956650644540787, -0.07069551944732666, -0.05182453989982605, -0.03295355662703514, -0.014082573354244232, 0.004788409918546677, 0.023659393191337585, 0.042530372738838196, 0.0614013597369194, 0.08027234673500061, 0.09914332628250122, 0.11801430583000183, 0.13688528537750244, 0.15575627982616425, 0.17462725937366486, 0.19349823892116547, 0.21236923336982727, 0.23124021291732788, 0.2501111924648285, 0.2689821720123291, 0.2878531515598297, 0.3067241311073303, 0.3255951404571533, 0.34446609020233154, 0.36333709955215454, 0.38220807909965515, 0.40107905864715576]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 5.0, 10.0, 14.0, 17.0, 21.0, 17.0, 23.0, 26.0, 46.0, 42.0, 36.0, 40.0, 46.0, 42.0, 57.0, 59.0, 51.0, 46.0, 54.0, 40.0, 42.0, 35.0, 39.0, 29.0, 19.0, 17.0, 29.0, 15.0, 20.0, 11.0, 11.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3913864493370056, -0.3797988295555115, -0.36821120977401733, -0.3566235899925232, -0.34503600001335144, -0.3334483802318573, -0.32186076045036316, -0.310273140668869, -0.2986855208873749, -0.28709790110588074, -0.2755102813243866, -0.26392269134521484, -0.2523350715637207, -0.24074745178222656, -0.22915983200073242, -0.21757221221923828, -0.20598460733890533, -0.1943969875574112, -0.18280938267707825, -0.1712217628955841, -0.15963414311408997, -0.14804652333259583, -0.13645891845226288, -0.12487129867076874, -0.1132836863398552, -0.10169607400894165, -0.09010845422744751, -0.07852084189653397, -0.06693322956562042, -0.05534560978412628, -0.04375799745321274, -0.0321703776717186, -0.020582765340805054, -0.008995150215923786, 0.0025924649089574814, 0.014180079102516174, 0.025767695158720016, 0.03735531121492386, 0.0489429235458374, 0.06053054332733154, 0.07211815565824509, 0.08370576798915863, 0.09529338777065277, 0.10688100010156631, 0.11846861243247986, 0.130056232213974, 0.14164385199546814, 0.15323147177696228, 0.16481907665729523, 0.17640669643878937, 0.18799430131912231, 0.19958192110061646, 0.2111695408821106, 0.22275716066360474, 0.23434476554393768, 0.24593238532543182, 0.25751999020576477, 0.2691076099872589, 0.28069522976875305, 0.2922828197479248, 0.30387043952941895, 0.3154580593109131, 0.3270456790924072, 0.33863329887390137, 0.3502209186553955]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 18.0, 23.0, 41.0, 65.0, 82.0, 124.0, 199.0, 296.0, 416.0, 618.0, 918.0, 1441.0, 2015.0, 3241.0, 5295.0, 8581.0, 14935.0, 27754.0, 57524.0, 145658.0, 393674.0, 224425.0, 78790.0, 35759.0, 18661.0, 10564.0, 6178.0, 3891.0, 2531.0, 1609.0, 1058.0, 703.0, 448.0, 317.0, 203.0, 144.0, 98.0, 71.0, 60.0, 34.0, 23.0, 27.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.20263671875, -0.197113037109375, -0.19158935546875, -0.186065673828125, -0.1805419921875, -0.175018310546875, -0.16949462890625, -0.163970947265625, -0.158447265625, -0.152923583984375, -0.14739990234375, -0.141876220703125, -0.1363525390625, -0.130828857421875, -0.12530517578125, -0.119781494140625, -0.1142578125, -0.108734130859375, -0.10321044921875, -0.097686767578125, -0.0921630859375, -0.086639404296875, -0.08111572265625, -0.075592041015625, -0.070068359375, -0.064544677734375, -0.05902099609375, -0.053497314453125, -0.0479736328125, -0.042449951171875, -0.03692626953125, -0.031402587890625, -0.02587890625, -0.020355224609375, -0.01483154296875, -0.009307861328125, -0.0037841796875, 0.001739501953125, 0.00726318359375, 0.012786865234375, 0.018310546875, 0.023834228515625, 0.02935791015625, 0.034881591796875, 0.0404052734375, 0.045928955078125, 0.05145263671875, 0.056976318359375, 0.0625, 0.068023681640625, 0.07354736328125, 0.079071044921875, 0.0845947265625, 0.090118408203125, 0.09564208984375, 0.101165771484375, 0.106689453125, 0.112213134765625, 0.11773681640625, 0.123260498046875, 0.1287841796875, 0.134307861328125, 0.13983154296875, 0.145355224609375, 0.15087890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 9.0, 16.0, 11.0, 16.0, 26.0, 20.0, 18.0, 34.0, 34.0, 41.0, 35.0, 40.0, 40.0, 57.0, 47.0, 55.0, 50.0, 46.0, 48.0, 52.0, 47.0, 25.0, 35.0, 30.0, 27.0, 26.0, 16.0, 17.0, 8.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7275390625, -0.70654296875, -0.685546875, -0.66455078125, -0.6435546875, -0.62255859375, -0.6015625, -0.58056640625, -0.5595703125, -0.53857421875, -0.517578125, -0.49658203125, -0.4755859375, -0.45458984375, -0.43359375, -0.41259765625, -0.3916015625, -0.37060546875, -0.349609375, -0.32861328125, -0.3076171875, -0.28662109375, -0.265625, -0.24462890625, -0.2236328125, -0.20263671875, -0.181640625, -0.16064453125, -0.1396484375, -0.11865234375, -0.09765625, -0.07666015625, -0.0556640625, -0.03466796875, -0.013671875, 0.00732421875, 0.0283203125, 0.04931640625, 0.0703125, 0.09130859375, 0.1123046875, 0.13330078125, 0.154296875, 0.17529296875, 0.1962890625, 0.21728515625, 0.23828125, 0.25927734375, 0.2802734375, 0.30126953125, 0.322265625, 0.34326171875, 0.3642578125, 0.38525390625, 0.40625, 0.42724609375, 0.4482421875, 0.46923828125, 0.490234375, 0.51123046875, 0.5322265625, 0.55322265625, 0.57421875, 0.59521484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 14.0, 18.0, 9.0, 9.0, 25.0, 26.0, 40.0, 60.0, 61.0, 74.0, 100.0, 223.0, 2284.0, 1000399.0, 44165.0, 484.0, 139.0, 87.0, 69.0, 59.0, 39.0, 42.0, 27.0, 26.0, 16.0, 15.0, 10.0, 7.0, 7.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.173736572265625, -2.10528564453125, -2.036834716796875, -1.9683837890625, -1.899932861328125, -1.83148193359375, -1.763031005859375, -1.694580078125, -1.626129150390625, -1.55767822265625, -1.489227294921875, -1.4207763671875, -1.352325439453125, -1.28387451171875, -1.215423583984375, -1.14697265625, -1.078521728515625, -1.01007080078125, -0.941619873046875, -0.8731689453125, -0.804718017578125, -0.73626708984375, -0.667816162109375, -0.599365234375, -0.530914306640625, -0.46246337890625, -0.394012451171875, -0.3255615234375, -0.257110595703125, -0.18865966796875, -0.120208740234375, -0.0517578125, 0.016693115234375, 0.08514404296875, 0.153594970703125, 0.2220458984375, 0.290496826171875, 0.35894775390625, 0.427398681640625, 0.495849609375, 0.564300537109375, 0.63275146484375, 0.701202392578125, 0.7696533203125, 0.838104248046875, 0.90655517578125, 0.975006103515625, 1.04345703125, 1.111907958984375, 1.18035888671875, 1.248809814453125, 1.3172607421875, 1.385711669921875, 1.45416259765625, 1.522613525390625, 1.591064453125, 1.659515380859375, 1.72796630859375, 1.796417236328125, 1.8648681640625, 1.933319091796875, 2.00177001953125, 2.070220947265625, 2.138671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 10.0, 16.0, 12.0, 11.0, 15.0, 14.0, 28.0, 30.0, 52.0, 51.0, 48.0, 41.0, 54.0, 57.0, 57.0, 65.0, 50.0, 47.0, 46.0, 47.0, 38.0, 38.0, 34.0, 26.0, 27.0, 18.0, 16.0, 15.0, 9.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8743362426757812, -0.8468170166015625, -0.8192977905273438, -0.791778564453125, -0.7642593383789062, -0.7367401123046875, -0.7092208862304688, -0.68170166015625, -0.6541824340820312, -0.6266632080078125, -0.5991439819335938, -0.571624755859375, -0.5441055297851562, -0.5165863037109375, -0.48906707763671875, -0.4615478515625, -0.43402862548828125, -0.4065093994140625, -0.37899017333984375, -0.351470947265625, -0.32395172119140625, -0.2964324951171875, -0.26891326904296875, -0.24139404296875, -0.21387481689453125, -0.1863555908203125, -0.15883636474609375, -0.131317138671875, -0.10379791259765625, -0.0762786865234375, -0.04875946044921875, -0.021240234375, 0.00627899169921875, 0.0337982177734375, 0.06131744384765625, 0.088836669921875, 0.11635589599609375, 0.1438751220703125, 0.17139434814453125, 0.19891357421875, 0.22643280029296875, 0.2539520263671875, 0.28147125244140625, 0.308990478515625, 0.33650970458984375, 0.3640289306640625, 0.39154815673828125, 0.4190673828125, 0.44658660888671875, 0.4741058349609375, 0.5016250610351562, 0.529144287109375, 0.5566635131835938, 0.5841827392578125, 0.6117019653320312, 0.63922119140625, 0.6667404174804688, 0.6942596435546875, 0.7217788696289062, 0.749298095703125, 0.7768173217773438, 0.8043365478515625, 0.8318557739257812, 0.859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 9.0, 20.0, 25.0, 30.0, 50.0, 80.0, 170.0, 472.0, 1888.0, 12088.0, 718777.0, 302768.0, 9614.0, 1701.0, 451.0, 163.0, 82.0, 40.0, 28.0, 15.0, 13.0, 9.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.434326171875, -0.41982269287109375, -0.4053192138671875, -0.39081573486328125, -0.376312255859375, -0.36180877685546875, -0.3473052978515625, -0.33280181884765625, -0.31829833984375, -0.30379486083984375, -0.2892913818359375, -0.27478790283203125, -0.260284423828125, -0.24578094482421875, -0.2312774658203125, -0.21677398681640625, -0.2022705078125, -0.18776702880859375, -0.1732635498046875, -0.15876007080078125, -0.144256591796875, -0.12975311279296875, -0.1152496337890625, -0.10074615478515625, -0.08624267578125, -0.07173919677734375, -0.0572357177734375, -0.04273223876953125, -0.028228759765625, -0.01372528076171875, 0.0007781982421875, 0.01528167724609375, 0.02978515625, 0.04428863525390625, 0.0587921142578125, 0.07329559326171875, 0.087799072265625, 0.10230255126953125, 0.1168060302734375, 0.13130950927734375, 0.14581298828125, 0.16031646728515625, 0.1748199462890625, 0.18932342529296875, 0.203826904296875, 0.21833038330078125, 0.2328338623046875, 0.24733734130859375, 0.2618408203125, 0.27634429931640625, 0.2908477783203125, 0.30535125732421875, 0.319854736328125, 0.33435821533203125, 0.3488616943359375, 0.36336517333984375, 0.37786865234375, 0.39237213134765625, 0.4068756103515625, 0.42137908935546875, 0.435882568359375, 0.45038604736328125, 0.4648895263671875, 0.47939300537109375, 0.493896484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 22.0, 28.0, 31.0, 64.0, 194.0, 343.0, 131.0, 58.0, 26.0, 23.0, 16.0, 7.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2498111724853516e-05, -4.1048042476177216e-05, -3.9597973227500916e-05, -3.8147903978824615e-05, -3.6697834730148315e-05, -3.5247765481472015e-05, -3.3797696232795715e-05, -3.2347626984119415e-05, -3.0897557735443115e-05, -2.9447488486766815e-05, -2.7997419238090515e-05, -2.6547349989414215e-05, -2.5097280740737915e-05, -2.3647211492061615e-05, -2.2197142243385315e-05, -2.0747072994709015e-05, -1.9297003746032715e-05, -1.7846934497356415e-05, -1.6396865248680115e-05, -1.4946796000003815e-05, -1.3496726751327515e-05, -1.2046657502651215e-05, -1.0596588253974915e-05, -9.146519005298615e-06, -7.696449756622314e-06, -6.246380507946014e-06, -4.796311259269714e-06, -3.3462420105934143e-06, -1.8961727619171143e-06, -4.461035132408142e-07, 1.0039657354354858e-06, 2.454034984111786e-06, 3.904104232788086e-06, 5.354173481464386e-06, 6.804242730140686e-06, 8.254311978816986e-06, 9.704381227493286e-06, 1.1154450476169586e-05, 1.2604519724845886e-05, 1.4054588973522186e-05, 1.5504658222198486e-05, 1.6954727470874786e-05, 1.8404796719551086e-05, 1.9854865968227386e-05, 2.1304935216903687e-05, 2.2755004465579987e-05, 2.4205073714256287e-05, 2.5655142962932587e-05, 2.7105212211608887e-05, 2.8555281460285187e-05, 3.0005350708961487e-05, 3.145541995763779e-05, 3.290548920631409e-05, 3.435555845499039e-05, 3.580562770366669e-05, 3.725569695234299e-05, 3.870576620101929e-05, 4.015583544969559e-05, 4.160590469837189e-05, 4.305597394704819e-05, 4.450604319572449e-05, 4.595611244440079e-05, 4.740618169307709e-05, 4.885625094175339e-05, 5.030632019042969e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 13.0, 11.0, 58.0, 116.0, 452.0, 3053.0, 166903.0, 872791.0, 4281.0, 585.0, 147.0, 54.0, 26.0, 21.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7360000610351562, -0.7097930908203125, -0.6835861206054688, -0.657379150390625, -0.6311721801757812, -0.6049652099609375, -0.5787582397460938, -0.55255126953125, -0.5263442993164062, -0.5001373291015625, -0.47393035888671875, -0.447723388671875, -0.42151641845703125, -0.3953094482421875, -0.36910247802734375, -0.3428955078125, -0.31668853759765625, -0.2904815673828125, -0.26427459716796875, -0.238067626953125, -0.21186065673828125, -0.1856536865234375, -0.15944671630859375, -0.13323974609375, -0.10703277587890625, -0.0808258056640625, -0.05461883544921875, -0.028411865234375, -0.00220489501953125, 0.0240020751953125, 0.05020904541015625, 0.076416015625, 0.10262298583984375, 0.1288299560546875, 0.15503692626953125, 0.181243896484375, 0.20745086669921875, 0.2336578369140625, 0.25986480712890625, 0.28607177734375, 0.31227874755859375, 0.3384857177734375, 0.36469268798828125, 0.390899658203125, 0.41710662841796875, 0.4433135986328125, 0.46952056884765625, 0.4957275390625, 0.5219345092773438, 0.5481414794921875, 0.5743484497070312, 0.600555419921875, 0.6267623901367188, 0.6529693603515625, 0.6791763305664062, 0.70538330078125, 0.7315902709960938, 0.7577972412109375, 0.7840042114257812, 0.810211181640625, 0.8364181518554688, 0.8626251220703125, 0.8888320922851562, 0.9150390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 15.0, 11.0, 21.0, 20.0, 47.0, 83.0, 164.0, 297.0, 132.0, 76.0, 42.0, 27.0, 11.0, 15.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.11989498138427734, -0.11607170104980469, -0.11224842071533203, -0.10842514038085938, -0.10460186004638672, -0.10077857971191406, -0.0969552993774414, -0.09313201904296875, -0.0893087387084961, -0.08548545837402344, -0.08166217803955078, -0.07783889770507812, -0.07401561737060547, -0.07019233703613281, -0.06636905670166016, -0.0625457763671875, -0.058722496032714844, -0.05489921569824219, -0.05107593536376953, -0.047252655029296875, -0.04342937469482422, -0.03960609436035156, -0.035782814025878906, -0.03195953369140625, -0.028136253356933594, -0.024312973022460938, -0.02048969268798828, -0.016666412353515625, -0.012843132019042969, -0.009019851684570312, -0.005196571350097656, -0.001373291015625, 0.0024499893188476562, 0.0062732696533203125, 0.010096549987792969, 0.013919830322265625, 0.01774311065673828, 0.021566390991210938, 0.025389671325683594, 0.02921295166015625, 0.033036231994628906, 0.03685951232910156, 0.04068279266357422, 0.044506072998046875, 0.04832935333251953, 0.05215263366699219, 0.055975914001464844, 0.0597991943359375, 0.06362247467041016, 0.06744575500488281, 0.07126903533935547, 0.07509231567382812, 0.07891559600830078, 0.08273887634277344, 0.0865621566772461, 0.09038543701171875, 0.0942087173461914, 0.09803199768066406, 0.10185527801513672, 0.10567855834960938, 0.10950183868408203, 0.11332511901855469, 0.11714839935302734, 0.1209716796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 374.0, 585.0, 39.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6702286005020142, -0.35472747683525085, -0.03922635316848755, 0.27627480030059814, 0.5917758941650391, 0.90727698802948, 1.2227782011032104, 1.5382791757583618, 1.8537803888320923, 2.169281482696533, 2.4847826957702637, 2.800283908843994, 3.1157848834991455, 3.431285858154297, 3.7467870712280273, 4.062288284301758, 4.377789497375488, 4.693290710449219, 5.008791923522949, 5.32429313659668, 5.639793872833252, 5.955295085906982, 6.270796298980713, 6.586297035217285, 6.901798248291016, 7.217299461364746, 7.532800674438477, 7.848301887512207, 8.163803100585938, 8.479303359985352, 8.794805526733398, 9.110305786132812, 9.425806999206543, 9.741308212280273, 10.056809425354004, 10.372310638427734, 10.687811851501465, 11.003313064575195, 11.31881332397461, 11.63431453704834, 11.94981575012207, 12.2653169631958, 12.580818176269531, 12.896319389343262, 13.211820602416992, 13.527320861816406, 13.842823028564453, 14.158323287963867, 14.473825454711914, 14.789326667785645, 15.104827880859375, 15.420329093933105, 15.735830307006836, 16.05133056640625, 16.366832733154297, 16.68233299255371, 16.997833251953125, 17.31333351135254, 17.628835678100586, 17.9443359375, 18.259838104248047, 18.57533836364746, 18.890840530395508, 19.206340789794922, 19.52184295654297]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 12.0, 7.0, 10.0, 18.0, 27.0, 20.0, 28.0, 29.0, 24.0, 35.0, 28.0, 31.0, 45.0, 41.0, 49.0, 50.0, 34.0, 34.0, 37.0, 52.0, 44.0, 39.0, 39.0, 33.0, 25.0, 29.0, 25.0, 21.0, 14.0, 17.0, 16.0, 12.0, 10.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.803426206111908, -0.7724162340164185, -0.7414062023162842, -0.7103962302207947, -0.6793862581253052, -0.6483762264251709, -0.6173662543296814, -0.5863562822341919, -0.5553462505340576, -0.5243362784385681, -0.49332624673843384, -0.46231627464294434, -0.43130627274513245, -0.40029627084732056, -0.36928629875183105, -0.33827629685401917, -0.3072662949562073, -0.2762562930583954, -0.2452463060617447, -0.214236319065094, -0.1832263171672821, -0.15221631526947021, -0.12120632827281952, -0.09019634127616882, -0.059186339378356934, -0.02817634493112564, 0.002833649516105652, 0.033843643963336945, 0.06485363841056824, 0.09586364030838013, 0.12687362730503082, 0.15788361430168152, 0.18889367580413818, 0.21990367770195007, 0.25091367959976196, 0.28192365169525146, 0.31293365359306335, 0.34394365549087524, 0.37495362758636475, 0.40596362948417664, 0.4369736313819885, 0.4679836332798004, 0.4989936351776123, 0.5300036072731018, 0.5610135793685913, 0.5920236110687256, 0.6230335831642151, 0.6540435552597046, 0.6850535869598389, 0.7160635590553284, 0.7470735907554626, 0.7780835628509521, 0.8090935945510864, 0.8401035666465759, 0.8711135387420654, 0.9021235704421997, 0.9331335425376892, 0.9641435146331787, 0.995153546333313, 1.0261635780334473, 1.057173490524292, 1.0881835222244263, 1.1191935539245605, 1.1502034664154053, 1.1812134981155396]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 12.0, 13.0, 24.0, 25.0, 26.0, 53.0, 60.0, 93.0, 160.0, 195.0, 295.0, 579.0, 948.0, 1631.0, 3216.0, 6991.0, 18275.0, 64984.0, 407807.0, 2128040.0, 1307615.0, 192519.0, 37977.0, 11951.0, 4904.0, 2497.0, 1314.0, 775.0, 475.0, 256.0, 172.0, 127.0, 65.0, 57.0, 46.0, 24.0, 23.0, 18.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5744781494140625, -0.555206298828125, -0.5359344482421875, -0.51666259765625, -0.4973907470703125, -0.478118896484375, -0.4588470458984375, -0.4395751953125, -0.4203033447265625, -0.401031494140625, -0.3817596435546875, -0.36248779296875, -0.3432159423828125, -0.323944091796875, -0.3046722412109375, -0.285400390625, -0.2661285400390625, -0.246856689453125, -0.2275848388671875, -0.20831298828125, -0.1890411376953125, -0.169769287109375, -0.1504974365234375, -0.1312255859375, -0.1119537353515625, -0.092681884765625, -0.0734100341796875, -0.05413818359375, -0.0348663330078125, -0.015594482421875, 0.0036773681640625, 0.02294921875, 0.0422210693359375, 0.061492919921875, 0.0807647705078125, 0.10003662109375, 0.1193084716796875, 0.138580322265625, 0.1578521728515625, 0.1771240234375, 0.1963958740234375, 0.215667724609375, 0.2349395751953125, 0.25421142578125, 0.2734832763671875, 0.292755126953125, 0.3120269775390625, 0.331298828125, 0.3505706787109375, 0.369842529296875, 0.3891143798828125, 0.40838623046875, 0.4276580810546875, 0.446929931640625, 0.4662017822265625, 0.4854736328125, 0.5047454833984375, 0.524017333984375, 0.5432891845703125, 0.56256103515625, 0.5818328857421875, 0.601104736328125, 0.6203765869140625, 0.6396484375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 9.0, 17.0, 14.0, 18.0, 29.0, 19.0, 27.0, 37.0, 30.0, 49.0, 42.0, 44.0, 38.0, 39.0, 53.0, 46.0, 53.0, 57.0, 46.0, 43.0, 53.0, 37.0, 27.0, 29.0, 23.0, 25.0, 16.0, 16.0, 11.0, 11.0, 2.0, 6.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.438720703125, -0.42501068115234375, -0.4113006591796875, -0.39759063720703125, -0.383880615234375, -0.37017059326171875, -0.3564605712890625, -0.34275054931640625, -0.32904052734375, -0.31533050537109375, -0.3016204833984375, -0.28791046142578125, -0.274200439453125, -0.26049041748046875, -0.2467803955078125, -0.23307037353515625, -0.2193603515625, -0.20565032958984375, -0.1919403076171875, -0.17823028564453125, -0.164520263671875, -0.15081024169921875, -0.1371002197265625, -0.12339019775390625, -0.10968017578125, -0.09597015380859375, -0.0822601318359375, -0.06855010986328125, -0.054840087890625, -0.04113006591796875, -0.0274200439453125, -0.01371002197265625, 0.0, 0.01371002197265625, 0.0274200439453125, 0.04113006591796875, 0.054840087890625, 0.06855010986328125, 0.0822601318359375, 0.09597015380859375, 0.10968017578125, 0.12339019775390625, 0.1371002197265625, 0.15081024169921875, 0.164520263671875, 0.17823028564453125, 0.1919403076171875, 0.20565032958984375, 0.2193603515625, 0.23307037353515625, 0.2467803955078125, 0.26049041748046875, 0.274200439453125, 0.28791046142578125, 0.3016204833984375, 0.31533050537109375, 0.32904052734375, 0.34275054931640625, 0.3564605712890625, 0.37017059326171875, 0.383880615234375, 0.39759063720703125, 0.4113006591796875, 0.42501068115234375, 0.438720703125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 14.0, 15.0, 34.0, 55.0, 122.0, 252.0, 713.0, 2180.0, 24322.0, 4040277.0, 120257.0, 4402.0, 924.0, 353.0, 166.0, 80.0, 42.0, 15.0, 15.0, 5.0, 9.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24212646484375, -2.1580810546875, -2.07403564453125, -1.989990234375, -1.90594482421875, -1.8218994140625, -1.73785400390625, -1.65380859375, -1.56976318359375, -1.4857177734375, -1.40167236328125, -1.317626953125, -1.23358154296875, -1.1495361328125, -1.06549072265625, -0.9814453125, -0.89739990234375, -0.8133544921875, -0.72930908203125, -0.645263671875, -0.56121826171875, -0.4771728515625, -0.39312744140625, -0.30908203125, -0.22503662109375, -0.1409912109375, -0.05694580078125, 0.027099609375, 0.11114501953125, 0.1951904296875, 0.27923583984375, 0.36328125, 0.44732666015625, 0.5313720703125, 0.61541748046875, 0.699462890625, 0.78350830078125, 0.8675537109375, 0.95159912109375, 1.03564453125, 1.11968994140625, 1.2037353515625, 1.28778076171875, 1.371826171875, 1.45587158203125, 1.5399169921875, 1.62396240234375, 1.7080078125, 1.79205322265625, 1.8760986328125, 1.96014404296875, 2.044189453125, 2.12823486328125, 2.2122802734375, 2.29632568359375, 2.38037109375, 2.46441650390625, 2.5484619140625, 2.63250732421875, 2.716552734375, 2.80059814453125, 2.8846435546875, 2.96868896484375, 3.052734375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 15.0, 21.0, 44.0, 90.0, 170.0, 389.0, 1061.0, 1315.0, 513.0, 208.0, 115.0, 58.0, 30.0, 15.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.5242156982421875, -0.508392333984375, -0.4925689697265625, -0.47674560546875, -0.4609222412109375, -0.445098876953125, -0.4292755126953125, -0.4134521484375, -0.3976287841796875, -0.381805419921875, -0.3659820556640625, -0.35015869140625, -0.3343353271484375, -0.318511962890625, -0.3026885986328125, -0.286865234375, -0.2710418701171875, -0.255218505859375, -0.2393951416015625, -0.22357177734375, -0.2077484130859375, -0.191925048828125, -0.1761016845703125, -0.1602783203125, -0.1444549560546875, -0.128631591796875, -0.1128082275390625, -0.09698486328125, -0.0811614990234375, -0.065338134765625, -0.0495147705078125, -0.03369140625, -0.0178680419921875, -0.002044677734375, 0.0137786865234375, 0.02960205078125, 0.0454254150390625, 0.061248779296875, 0.0770721435546875, 0.0928955078125, 0.1087188720703125, 0.124542236328125, 0.1403656005859375, 0.15618896484375, 0.1720123291015625, 0.187835693359375, 0.2036590576171875, 0.219482421875, 0.2353057861328125, 0.251129150390625, 0.2669525146484375, 0.28277587890625, 0.2985992431640625, 0.314422607421875, 0.3302459716796875, 0.3460693359375, 0.3618927001953125, 0.377716064453125, 0.3935394287109375, 0.40936279296875, 0.4251861572265625, 0.441009521484375, 0.4568328857421875, 0.47265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 12.0, 13.0, 16.0, 26.0, 34.0, 59.0, 51.0, 63.0, 95.0, 93.0, 92.0, 83.0, 72.0, 51.0, 61.0, 42.0, 28.0, 19.0, 11.0, 17.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.699211597442627, -0.6760556697845459, -0.6528997421264648, -0.6297438144683838, -0.6065878868103027, -0.5834318995475769, -0.5602759718894958, -0.5371200442314148, -0.5139641165733337, -0.4908081889152527, -0.46765226125717163, -0.4444963037967682, -0.42134037613868713, -0.3981844484806061, -0.37502849102020264, -0.3518725633621216, -0.3287166357040405, -0.3055607080459595, -0.2824047803878784, -0.259248822927475, -0.23609289526939392, -0.21293696761131287, -0.18978102505207062, -0.16662508249282837, -0.14346915483474731, -0.12031321972608566, -0.09715728461742401, -0.07400134950876236, -0.05084541440010071, -0.027689479291439056, -0.004533544182777405, 0.018622398376464844, 0.04177826642990112, 0.06493420153856277, 0.08809013664722443, 0.11124607175588608, 0.13440200686454773, 0.15755793452262878, 0.18071387708187103, 0.20386981964111328, 0.22702574729919434, 0.2501816749572754, 0.27333760261535645, 0.2964935600757599, 0.31964948773384094, 0.342805415391922, 0.36596137285232544, 0.3891173005104065, 0.41227322816848755, 0.4354291558265686, 0.45858508348464966, 0.4817410409450531, 0.5048969984054565, 0.5280529260635376, 0.5512088537216187, 0.5743647813796997, 0.5975207090377808, 0.6206766366958618, 0.6438325643539429, 0.6669884920120239, 0.690144419670105, 0.7133004069328308, 0.7364563345909119, 0.7596122622489929, 0.782768189907074]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 18.0, 17.0, 13.0, 20.0, 19.0, 27.0, 22.0, 26.0, 42.0, 40.0, 39.0, 38.0, 52.0, 40.0, 44.0, 44.0, 35.0, 49.0, 47.0, 43.0, 48.0, 30.0, 41.0, 33.0, 30.0, 16.0, 23.0, 23.0, 12.0, 18.0, 7.0, 9.0, 6.0, 0.0, 2.0, 7.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5059067606925964, -0.4903792440891266, -0.47485169768333435, -0.4593241810798645, -0.44379663467407227, -0.4282691180706024, -0.41274160146713257, -0.39721405506134033, -0.3816865384578705, -0.36615902185440063, -0.3506314754486084, -0.33510395884513855, -0.3195764422416687, -0.30404889583587646, -0.2885213792324066, -0.27299386262893677, -0.25746631622314453, -0.2419387847185135, -0.22641125321388245, -0.2108837366104126, -0.19535620510578156, -0.1798286736011505, -0.16430115699768066, -0.14877362549304962, -0.13324609398841858, -0.11771856248378754, -0.10219103842973709, -0.08666351437568665, -0.0711359828710556, -0.05560845136642456, -0.040080927312374115, -0.02455340325832367, -0.009025901556015015, 0.006501626223325729, 0.022029154002666473, 0.03755668178200722, 0.05308420956134796, 0.068611741065979, 0.08413926512002945, 0.0996667891740799, 0.11519432067871094, 0.13072185218334198, 0.14624938368797302, 0.16177690029144287, 0.1773044317960739, 0.19283196330070496, 0.2083594799041748, 0.22388701140880585, 0.2394145429134369, 0.25494205951690674, 0.270469605922699, 0.2859971225261688, 0.30152463912963867, 0.3170521855354309, 0.33257970213890076, 0.3481072187423706, 0.36363476514816284, 0.3791622817516327, 0.3946898281574249, 0.4102173447608948, 0.425744891166687, 0.44127240777015686, 0.4567999243736267, 0.47232747077941895, 0.4878549873828888]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 11.0, 28.0, 30.0, 43.0, 61.0, 84.0, 140.0, 201.0, 417.0, 671.0, 1205.0, 2156.0, 3900.0, 7597.0, 15276.0, 33023.0, 79385.0, 218782.0, 389526.0, 174699.0, 65599.0, 27926.0, 13227.0, 6635.0, 3494.0, 1833.0, 1033.0, 582.0, 398.0, 227.0, 119.0, 91.0, 53.0, 42.0, 21.0, 8.0, 7.0, 8.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2176513671875, -0.2111339569091797, -0.20461654663085938, -0.19809913635253906, -0.19158172607421875, -0.18506431579589844, -0.17854690551757812, -0.1720294952392578, -0.1655120849609375, -0.1589946746826172, -0.15247726440429688, -0.14595985412597656, -0.13944244384765625, -0.13292503356933594, -0.12640762329101562, -0.11989021301269531, -0.113372802734375, -0.10685539245605469, -0.10033798217773438, -0.09382057189941406, -0.08730316162109375, -0.08078575134277344, -0.07426834106445312, -0.06775093078613281, -0.0612335205078125, -0.05471611022949219, -0.048198699951171875, -0.04168128967285156, -0.03516387939453125, -0.028646469116210938, -0.022129058837890625, -0.015611648559570312, -0.00909423828125, -0.0025768280029296875, 0.003940582275390625, 0.010457992553710938, 0.01697540283203125, 0.023492813110351562, 0.030010223388671875, 0.03652763366699219, 0.0430450439453125, 0.04956245422363281, 0.056079864501953125, 0.06259727478027344, 0.06911468505859375, 0.07563209533691406, 0.08214950561523438, 0.08866691589355469, 0.095184326171875, 0.10170173645019531, 0.10821914672851562, 0.11473655700683594, 0.12125396728515625, 0.12777137756347656, 0.13428878784179688, 0.1408061981201172, 0.1473236083984375, 0.1538410186767578, 0.16035842895507812, 0.16687583923339844, 0.17339324951171875, 0.17991065979003906, 0.18642807006835938, 0.1929454803466797, 0.199462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 15.0, 11.0, 15.0, 21.0, 20.0, 21.0, 21.0, 43.0, 31.0, 45.0, 48.0, 60.0, 52.0, 61.0, 54.0, 48.0, 49.0, 46.0, 53.0, 35.0, 40.0, 35.0, 32.0, 25.0, 21.0, 21.0, 15.0, 16.0, 6.0, 8.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3002510070800781, -0.28971099853515625, -0.2791709899902344, -0.2686309814453125, -0.2580909729003906, -0.24755096435546875, -0.23701095581054688, -0.226470947265625, -0.21593093872070312, -0.20539093017578125, -0.19485092163085938, -0.1843109130859375, -0.17377090454101562, -0.16323089599609375, -0.15269088745117188, -0.14215087890625, -0.13161087036132812, -0.12107086181640625, -0.11053085327148438, -0.0999908447265625, -0.08945083618164062, -0.07891082763671875, -0.06837081909179688, -0.057830810546875, -0.047290802001953125, -0.03675079345703125, -0.026210784912109375, -0.0156707763671875, -0.005130767822265625, 0.00540924072265625, 0.015949249267578125, 0.0264892578125, 0.037029266357421875, 0.04756927490234375, 0.058109283447265625, 0.0686492919921875, 0.07918930053710938, 0.08972930908203125, 0.10026931762695312, 0.110809326171875, 0.12134933471679688, 0.13188934326171875, 0.14242935180664062, 0.1529693603515625, 0.16350936889648438, 0.17404937744140625, 0.18458938598632812, 0.19512939453125, 0.20566940307617188, 0.21620941162109375, 0.22674942016601562, 0.2372894287109375, 0.24782943725585938, 0.25836944580078125, 0.2689094543457031, 0.279449462890625, 0.2899894714355469, 0.30052947998046875, 0.3110694885253906, 0.3216094970703125, 0.3321495056152344, 0.34268951416015625, 0.3532295227050781, 0.36376953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 24.0, 28.0, 45.0, 54.0, 97.0, 164.0, 241.0, 348.0, 599.0, 1003.0, 1881.0, 3519.0, 7202.0, 16436.0, 39745.0, 112087.0, 337862.0, 341775.0, 113687.0, 40159.0, 16202.0, 7314.0, 3657.0, 1779.0, 1077.0, 555.0, 333.0, 211.0, 140.0, 96.0, 62.0, 41.0, 35.0, 25.0, 11.0, 13.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2132568359375, -0.20764541625976562, -0.20203399658203125, -0.19642257690429688, -0.1908111572265625, -0.18519973754882812, -0.17958831787109375, -0.17397689819335938, -0.168365478515625, -0.16275405883789062, -0.15714263916015625, -0.15153121948242188, -0.1459197998046875, -0.14030838012695312, -0.13469696044921875, -0.12908554077148438, -0.12347412109375, -0.11786270141601562, -0.11225128173828125, -0.10663986206054688, -0.1010284423828125, -0.09541702270507812, -0.08980560302734375, -0.08419418334960938, -0.078582763671875, -0.07297134399414062, -0.06735992431640625, -0.061748504638671875, -0.0561370849609375, -0.050525665283203125, -0.04491424560546875, -0.039302825927734375, -0.03369140625, -0.028079986572265625, -0.02246856689453125, -0.016857147216796875, -0.0112457275390625, -0.005634307861328125, -2.288818359375e-05, 0.005588531494140625, 0.011199951171875, 0.016811370849609375, 0.02242279052734375, 0.028034210205078125, 0.0336456298828125, 0.039257049560546875, 0.04486846923828125, 0.050479888916015625, 0.05609130859375, 0.061702728271484375, 0.06731414794921875, 0.07292556762695312, 0.0785369873046875, 0.08414840698242188, 0.08975982666015625, 0.09537124633789062, 0.100982666015625, 0.10659408569335938, 0.11220550537109375, 0.11781692504882812, 0.1234283447265625, 0.12903976440429688, 0.13465118408203125, 0.14026260375976562, 0.1458740234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 17.0, 10.0, 24.0, 22.0, 35.0, 29.0, 39.0, 47.0, 39.0, 45.0, 48.0, 58.0, 54.0, 49.0, 52.0, 48.0, 52.0, 57.0, 36.0, 32.0, 36.0, 32.0, 24.0, 13.0, 15.0, 14.0, 19.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74072265625, -0.7204437255859375, -0.700164794921875, -0.6798858642578125, -0.65960693359375, -0.6393280029296875, -0.619049072265625, -0.5987701416015625, -0.5784912109375, -0.5582122802734375, -0.537933349609375, -0.5176544189453125, -0.49737548828125, -0.4770965576171875, -0.456817626953125, -0.4365386962890625, -0.416259765625, -0.3959808349609375, -0.375701904296875, -0.3554229736328125, -0.33514404296875, -0.3148651123046875, -0.294586181640625, -0.2743072509765625, -0.2540283203125, -0.2337493896484375, -0.213470458984375, -0.1931915283203125, -0.17291259765625, -0.1526336669921875, -0.132354736328125, -0.1120758056640625, -0.091796875, -0.0715179443359375, -0.051239013671875, -0.0309600830078125, -0.01068115234375, 0.0095977783203125, 0.029876708984375, 0.0501556396484375, 0.0704345703125, 0.0907135009765625, 0.110992431640625, 0.1312713623046875, 0.15155029296875, 0.1718292236328125, 0.192108154296875, 0.2123870849609375, 0.232666015625, 0.2529449462890625, 0.273223876953125, 0.2935028076171875, 0.31378173828125, 0.3340606689453125, 0.354339599609375, 0.3746185302734375, 0.3948974609375, 0.4151763916015625, 0.435455322265625, 0.4557342529296875, 0.47601318359375, 0.4962921142578125, 0.516571044921875, 0.5368499755859375, 0.55712890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 25.0, 26.0, 35.0, 73.0, 129.0, 255.0, 559.0, 1359.0, 4002.0, 16515.0, 123834.0, 791252.0, 91163.0, 13523.0, 3487.0, 1230.0, 487.0, 265.0, 113.0, 64.0, 53.0, 24.0, 9.0, 14.0, 7.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17678070068359375, -0.1724090576171875, -0.16803741455078125, -0.163665771484375, -0.15929412841796875, -0.1549224853515625, -0.15055084228515625, -0.14617919921875, -0.14180755615234375, -0.1374359130859375, -0.13306427001953125, -0.128692626953125, -0.12432098388671875, -0.1199493408203125, -0.11557769775390625, -0.1112060546875, -0.10683441162109375, -0.1024627685546875, -0.09809112548828125, -0.093719482421875, -0.08934783935546875, -0.0849761962890625, -0.08060455322265625, -0.07623291015625, -0.07186126708984375, -0.0674896240234375, -0.06311798095703125, -0.058746337890625, -0.05437469482421875, -0.0500030517578125, -0.04563140869140625, -0.041259765625, -0.03688812255859375, -0.0325164794921875, -0.02814483642578125, -0.023773193359375, -0.01940155029296875, -0.0150299072265625, -0.01065826416015625, -0.00628662109375, -0.00191497802734375, 0.0024566650390625, 0.00682830810546875, 0.011199951171875, 0.01557159423828125, 0.0199432373046875, 0.02431488037109375, 0.0286865234375, 0.03305816650390625, 0.0374298095703125, 0.04180145263671875, 0.046173095703125, 0.05054473876953125, 0.0549163818359375, 0.05928802490234375, 0.06365966796875, 0.06803131103515625, 0.0724029541015625, 0.07677459716796875, 0.081146240234375, 0.08551788330078125, 0.0898895263671875, 0.09426116943359375, 0.0986328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 8.0, 11.0, 15.0, 20.0, 33.0, 26.0, 40.0, 74.0, 106.0, 164.0, 154.0, 105.0, 58.0, 37.0, 21.0, 29.0, 13.0, 12.0, 8.0, 10.0, 3.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.103515625e-05, -5.9118494391441345e-05, -5.720183253288269e-05, -5.5285170674324036e-05, -5.336850881576538e-05, -5.1451846957206726e-05, -4.953518509864807e-05, -4.7618523240089417e-05, -4.570186138153076e-05, -4.378519952297211e-05, -4.186853766441345e-05, -3.99518758058548e-05, -3.803521394729614e-05, -3.611855208873749e-05, -3.420189023017883e-05, -3.228522837162018e-05, -3.0368566513061523e-05, -2.845190465450287e-05, -2.6535242795944214e-05, -2.461858093738556e-05, -2.2701919078826904e-05, -2.078525722026825e-05, -1.8868595361709595e-05, -1.695193350315094e-05, -1.5035271644592285e-05, -1.311860978603363e-05, -1.1201947927474976e-05, -9.28528606891632e-06, -7.368624210357666e-06, -5.451962351799011e-06, -3.5353004932403564e-06, -1.6186386346817017e-06, 2.980232238769531e-07, 2.214685082435608e-06, 4.131346940994263e-06, 6.0480087995529175e-06, 7.964670658111572e-06, 9.881332516670227e-06, 1.1797994375228882e-05, 1.3714656233787537e-05, 1.563131809234619e-05, 1.7547979950904846e-05, 1.94646418094635e-05, 2.1381303668022156e-05, 2.329796552658081e-05, 2.5214627385139465e-05, 2.713128924369812e-05, 2.9047951102256775e-05, 3.096461296081543e-05, 3.2881274819374084e-05, 3.479793667793274e-05, 3.6714598536491394e-05, 3.863126039505005e-05, 4.0547922253608704e-05, 4.246458411216736e-05, 4.438124597072601e-05, 4.629790782928467e-05, 4.821456968784332e-05, 5.013123154640198e-05, 5.204789340496063e-05, 5.396455526351929e-05, 5.588121712207794e-05, 5.77978789806366e-05, 5.971454083919525e-05, 6.16312026977539e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 8.0, 13.0, 21.0, 25.0, 37.0, 43.0, 77.0, 118.0, 232.0, 377.0, 647.0, 1354.0, 3065.0, 10284.0, 61848.0, 773106.0, 170673.0, 18286.0, 4558.0, 1747.0, 892.0, 416.0, 254.0, 152.0, 97.0, 67.0, 42.0, 24.0, 26.0, 18.0, 11.0, 8.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.15673828125, -0.1522197723388672, -0.14770126342773438, -0.14318275451660156, -0.13866424560546875, -0.13414573669433594, -0.12962722778320312, -0.1251087188720703, -0.1205902099609375, -0.11607170104980469, -0.11155319213867188, -0.10703468322753906, -0.10251617431640625, -0.09799766540527344, -0.09347915649414062, -0.08896064758300781, -0.084442138671875, -0.07992362976074219, -0.07540512084960938, -0.07088661193847656, -0.06636810302734375, -0.06184959411621094, -0.057331085205078125, -0.05281257629394531, -0.0482940673828125, -0.04377555847167969, -0.039257049560546875, -0.03473854064941406, -0.03022003173828125, -0.025701522827148438, -0.021183013916015625, -0.016664505004882812, -0.01214599609375, -0.0076274871826171875, -0.003108978271484375, 0.0014095306396484375, 0.00592803955078125, 0.010446548461914062, 0.014965057373046875, 0.019483566284179688, 0.0240020751953125, 0.028520584106445312, 0.033039093017578125, 0.03755760192871094, 0.04207611083984375, 0.04659461975097656, 0.051113128662109375, 0.05563163757324219, 0.060150146484375, 0.06466865539550781, 0.06918716430664062, 0.07370567321777344, 0.07822418212890625, 0.08274269104003906, 0.08726119995117188, 0.09177970886230469, 0.0962982177734375, 0.10081672668457031, 0.10533523559570312, 0.10985374450683594, 0.11437225341796875, 0.11889076232910156, 0.12340927124023438, 0.1279277801513672, 0.1324462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 19.0, 19.0, 37.0, 38.0, 55.0, 105.0, 131.0, 189.0, 124.0, 87.0, 47.0, 45.0, 21.0, 17.0, 19.0, 10.0, 3.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0301666259765625, -0.029288768768310547, -0.028410911560058594, -0.02753305435180664, -0.026655197143554688, -0.025777339935302734, -0.02489948272705078, -0.024021625518798828, -0.023143768310546875, -0.022265911102294922, -0.02138805389404297, -0.020510196685791016, -0.019632339477539062, -0.01875448226928711, -0.017876625061035156, -0.016998767852783203, -0.01612091064453125, -0.015243053436279297, -0.014365196228027344, -0.01348733901977539, -0.012609481811523438, -0.011731624603271484, -0.010853767395019531, -0.009975910186767578, -0.009098052978515625, -0.008220195770263672, -0.007342338562011719, -0.006464481353759766, -0.0055866241455078125, -0.004708766937255859, -0.0038309097290039062, -0.002953052520751953, -0.0020751953125, -0.0011973381042480469, -0.00031948089599609375, 0.0005583763122558594, 0.0014362335205078125, 0.0023140907287597656, 0.0031919479370117188, 0.004069805145263672, 0.004947662353515625, 0.005825519561767578, 0.006703376770019531, 0.007581233978271484, 0.008459091186523438, 0.00933694839477539, 0.010214805603027344, 0.011092662811279297, 0.01197052001953125, 0.012848377227783203, 0.013726234436035156, 0.01460409164428711, 0.015481948852539062, 0.016359806060791016, 0.01723766326904297, 0.018115520477294922, 0.018993377685546875, 0.019871234893798828, 0.02074909210205078, 0.021626949310302734, 0.022504806518554688, 0.02338266372680664, 0.024260520935058594, 0.025138378143310547, 0.0260162353515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 16.0, 20.0, 27.0, 37.0, 44.0, 44.0, 59.0, 89.0, 73.0, 115.0, 107.0, 78.0, 61.0, 50.0, 39.0, 32.0, 25.0, 13.0, 9.0, 6.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45680394768714905, -0.44278910756111145, -0.42877423763275146, -0.41475939750671387, -0.40074455738067627, -0.3867296874523163, -0.3727148473262787, -0.3586999773979187, -0.3446851372718811, -0.3306702971458435, -0.3166554272174835, -0.3026405870914459, -0.28862571716308594, -0.27461087703704834, -0.26059603691101074, -0.24658118188381195, -0.23256632685661316, -0.21855147182941437, -0.20453661680221558, -0.19052177667617798, -0.1765069216489792, -0.1624920666217804, -0.1484772264957428, -0.134462371468544, -0.12044751644134521, -0.10643266141414642, -0.09241781383752823, -0.07840296626091003, -0.06438811123371124, -0.05037325620651245, -0.03635840862989426, -0.022343561053276062, -0.008328676223754883, 0.00568617507815361, 0.019701026380062103, 0.033715877681970596, 0.04773072898387909, 0.06174558401107788, 0.07576043158769608, 0.08977527916431427, 0.10379013419151306, 0.11780498921871185, 0.13181984424591064, 0.14583468437194824, 0.15984953939914703, 0.17386439442634583, 0.18787923455238342, 0.20189408957958221, 0.215908944606781, 0.2299237996339798, 0.2439386546611786, 0.2579534947872162, 0.27196836471557617, 0.28598320484161377, 0.29999804496765137, 0.31401288509368896, 0.32802775502204895, 0.34204259514808655, 0.35605746507644653, 0.37007230520248413, 0.38408714532852173, 0.3981020152568817, 0.4121168553829193, 0.4261317253112793, 0.4401465654373169]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 19.0, 24.0, 28.0, 22.0, 33.0, 34.0, 47.0, 45.0, 51.0, 53.0, 58.0, 54.0, 68.0, 53.0, 58.0, 52.0, 51.0, 36.0, 41.0, 32.0, 23.0, 23.0, 24.0, 20.0, 9.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3513355851173401, -0.34003373980522156, -0.328731894493103, -0.3174300789833069, -0.30612823367118835, -0.2948263883590698, -0.2835245728492737, -0.27222272753715515, -0.2609208822250366, -0.2496190369129181, -0.23831720650196075, -0.22701537609100342, -0.2157135307788849, -0.20441168546676636, -0.19310985505580902, -0.18180802464485168, -0.17050617933273315, -0.15920433402061462, -0.1479025036096573, -0.13660067319869995, -0.12529882788658142, -0.11399699002504349, -0.10269515216350555, -0.09139331430196762, -0.08009147644042969, -0.06878963857889175, -0.05748780071735382, -0.04618596285581589, -0.034884124994277954, -0.02358228713274002, -0.012280449271202087, -0.000978611409664154, 0.010323196649551392, 0.021625034511089325, 0.03292687237262726, 0.04422871023416519, 0.055530548095703125, 0.06683238595724106, 0.07813422381877899, 0.08943606168031693, 0.10073789954185486, 0.11203973740339279, 0.12334157526493073, 0.13464340567588806, 0.1459452509880066, 0.15724709630012512, 0.16854892671108246, 0.1798507571220398, 0.19115260243415833, 0.20245444774627686, 0.2137562781572342, 0.22505810856819153, 0.23635995388031006, 0.2476617991924286, 0.2589636445045471, 0.27026546001434326, 0.2815673053264618, 0.2928691506385803, 0.30417096614837646, 0.315472811460495, 0.3267746567726135, 0.33807650208473206, 0.3493783473968506, 0.36068016290664673, 0.37198200821876526]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 10.0, 14.0, 18.0, 54.0, 52.0, 110.0, 148.0, 262.0, 445.0, 807.0, 1521.0, 3102.0, 6527.0, 14966.0, 37959.0, 134551.0, 658078.0, 125997.0, 36655.0, 14495.0, 6435.0, 2963.0, 1481.0, 799.0, 419.0, 261.0, 142.0, 94.0, 64.0, 34.0, 18.0, 14.0, 16.0, 17.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0], "bins": [-0.537109375, -0.5231513977050781, -0.5091934204101562, -0.4952354431152344, -0.4812774658203125, -0.4673194885253906, -0.45336151123046875, -0.4394035339355469, -0.425445556640625, -0.4114875793457031, -0.39752960205078125, -0.3835716247558594, -0.3696136474609375, -0.3556556701660156, -0.34169769287109375, -0.3277397155761719, -0.31378173828125, -0.2998237609863281, -0.28586578369140625, -0.2719078063964844, -0.2579498291015625, -0.24399185180664062, -0.23003387451171875, -0.21607589721679688, -0.202117919921875, -0.18815994262695312, -0.17420196533203125, -0.16024398803710938, -0.1462860107421875, -0.13232803344726562, -0.11837005615234375, -0.10441207885742188, -0.0904541015625, -0.07649612426757812, -0.06253814697265625, -0.048580169677734375, -0.0346221923828125, -0.020664215087890625, -0.00670623779296875, 0.007251739501953125, 0.021209716796875, 0.035167694091796875, 0.04912567138671875, 0.06308364868164062, 0.0770416259765625, 0.09099960327148438, 0.10495758056640625, 0.11891555786132812, 0.13287353515625, 0.14683151245117188, 0.16078948974609375, 0.17474746704101562, 0.1887054443359375, 0.20266342163085938, 0.21662139892578125, 0.23057937622070312, 0.244537353515625, 0.2584953308105469, 0.27245330810546875, 0.2864112854003906, 0.3003692626953125, 0.3143272399902344, 0.32828521728515625, 0.3422431945800781, 0.356201171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 12.0, 16.0, 18.0, 28.0, 38.0, 33.0, 23.0, 43.0, 45.0, 60.0, 50.0, 55.0, 60.0, 62.0, 67.0, 50.0, 46.0, 44.0, 51.0, 35.0, 28.0, 22.0, 21.0, 16.0, 20.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.744140625, -0.7214736938476562, -0.6988067626953125, -0.6761398315429688, -0.653472900390625, -0.6308059692382812, -0.6081390380859375, -0.5854721069335938, -0.56280517578125, -0.5401382446289062, -0.5174713134765625, -0.49480438232421875, -0.472137451171875, -0.44947052001953125, -0.4268035888671875, -0.40413665771484375, -0.3814697265625, -0.35880279541015625, -0.3361358642578125, -0.31346893310546875, -0.290802001953125, -0.26813507080078125, -0.2454681396484375, -0.22280120849609375, -0.20013427734375, -0.17746734619140625, -0.1548004150390625, -0.13213348388671875, -0.109466552734375, -0.08679962158203125, -0.0641326904296875, -0.04146575927734375, -0.018798828125, 0.00386810302734375, 0.0265350341796875, 0.04920196533203125, 0.071868896484375, 0.09453582763671875, 0.1172027587890625, 0.13986968994140625, 0.16253662109375, 0.18520355224609375, 0.2078704833984375, 0.23053741455078125, 0.253204345703125, 0.27587127685546875, 0.2985382080078125, 0.32120513916015625, 0.3438720703125, 0.36653900146484375, 0.3892059326171875, 0.41187286376953125, 0.434539794921875, 0.45720672607421875, 0.4798736572265625, 0.5025405883789062, 0.52520751953125, 0.5478744506835938, 0.5705413818359375, 0.5932083129882812, 0.615875244140625, 0.6385421752929688, 0.6612091064453125, 0.6838760375976562, 0.70654296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 7.0, 5.0, 13.0, 5.0, 13.0, 16.0, 17.0, 17.0, 16.0, 26.0, 24.0, 35.0, 52.0, 57.0, 75.0, 187.0, 957.0, 26887.0, 1009751.0, 9382.0, 533.0, 128.0, 74.0, 42.0, 43.0, 31.0, 24.0, 20.0, 25.0, 16.0, 15.0, 14.0, 9.0, 13.0, 4.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.3345947265625, -2.255126953125, -2.1756591796875, -2.09619140625, -2.0167236328125, -1.937255859375, -1.8577880859375, -1.7783203125, -1.6988525390625, -1.619384765625, -1.5399169921875, -1.46044921875, -1.3809814453125, -1.301513671875, -1.2220458984375, -1.142578125, -1.0631103515625, -0.983642578125, -0.9041748046875, -0.82470703125, -0.7452392578125, -0.665771484375, -0.5863037109375, -0.5068359375, -0.4273681640625, -0.347900390625, -0.2684326171875, -0.18896484375, -0.1094970703125, -0.030029296875, 0.0494384765625, 0.12890625, 0.2083740234375, 0.287841796875, 0.3673095703125, 0.44677734375, 0.5262451171875, 0.605712890625, 0.6851806640625, 0.7646484375, 0.8441162109375, 0.923583984375, 1.0030517578125, 1.08251953125, 1.1619873046875, 1.241455078125, 1.3209228515625, 1.400390625, 1.4798583984375, 1.559326171875, 1.6387939453125, 1.71826171875, 1.7977294921875, 1.877197265625, 1.9566650390625, 2.0361328125, 2.1156005859375, 2.195068359375, 2.2745361328125, 2.35400390625, 2.4334716796875, 2.512939453125, 2.5924072265625, 2.671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 8.0, 18.0, 16.0, 16.0, 22.0, 31.0, 36.0, 35.0, 34.0, 46.0, 31.0, 37.0, 41.0, 50.0, 33.0, 48.0, 42.0, 45.0, 41.0, 40.0, 30.0, 26.0, 24.0, 31.0, 27.0, 19.0, 21.0, 20.0, 16.0, 12.0, 15.0, 12.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5302734375, -0.5126495361328125, -0.495025634765625, -0.4774017333984375, -0.45977783203125, -0.4421539306640625, -0.424530029296875, -0.4069061279296875, -0.3892822265625, -0.3716583251953125, -0.354034423828125, -0.3364105224609375, -0.31878662109375, -0.3011627197265625, -0.283538818359375, -0.2659149169921875, -0.248291015625, -0.2306671142578125, -0.213043212890625, -0.1954193115234375, -0.17779541015625, -0.1601715087890625, -0.142547607421875, -0.1249237060546875, -0.1072998046875, -0.0896759033203125, -0.072052001953125, -0.0544281005859375, -0.03680419921875, -0.0191802978515625, -0.001556396484375, 0.0160675048828125, 0.03369140625, 0.0513153076171875, 0.068939208984375, 0.0865631103515625, 0.10418701171875, 0.1218109130859375, 0.139434814453125, 0.1570587158203125, 0.1746826171875, 0.1923065185546875, 0.209930419921875, 0.2275543212890625, 0.24517822265625, 0.2628021240234375, 0.280426025390625, 0.2980499267578125, 0.315673828125, 0.3332977294921875, 0.350921630859375, 0.3685455322265625, 0.38616943359375, 0.4037933349609375, 0.421417236328125, 0.4390411376953125, 0.4566650390625, 0.4742889404296875, 0.491912841796875, 0.5095367431640625, 0.52716064453125, 0.5447845458984375, 0.562408447265625, 0.5800323486328125, 0.59765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 11.0, 10.0, 14.0, 19.0, 45.0, 78.0, 201.0, 520.0, 1743.0, 7682.0, 165736.0, 855921.0, 12883.0, 2512.0, 710.0, 225.0, 98.0, 41.0, 31.0, 16.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.508514404296875, -0.49163818359375, -0.474761962890625, -0.4578857421875, -0.441009521484375, -0.42413330078125, -0.407257080078125, -0.390380859375, -0.373504638671875, -0.35662841796875, -0.339752197265625, -0.3228759765625, -0.305999755859375, -0.28912353515625, -0.272247314453125, -0.25537109375, -0.238494873046875, -0.22161865234375, -0.204742431640625, -0.1878662109375, -0.170989990234375, -0.15411376953125, -0.137237548828125, -0.120361328125, -0.103485107421875, -0.08660888671875, -0.069732666015625, -0.0528564453125, -0.035980224609375, -0.01910400390625, -0.002227783203125, 0.0146484375, 0.031524658203125, 0.04840087890625, 0.065277099609375, 0.0821533203125, 0.099029541015625, 0.11590576171875, 0.132781982421875, 0.149658203125, 0.166534423828125, 0.18341064453125, 0.200286865234375, 0.2171630859375, 0.234039306640625, 0.25091552734375, 0.267791748046875, 0.28466796875, 0.301544189453125, 0.31842041015625, 0.335296630859375, 0.3521728515625, 0.369049072265625, 0.38592529296875, 0.402801513671875, 0.419677734375, 0.436553955078125, 0.45343017578125, 0.470306396484375, 0.4871826171875, 0.504058837890625, 0.52093505859375, 0.537811279296875, 0.5546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 17.0, 21.0, 32.0, 74.0, 234.0, 339.0, 100.0, 56.0, 30.0, 21.0, 14.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40614128112793e-05, -5.2072107791900635e-05, -5.008280277252197e-05, -4.809349775314331e-05, -4.610419273376465e-05, -4.4114887714385986e-05, -4.2125582695007324e-05, -4.013627767562866e-05, -3.814697265625e-05, -3.615766763687134e-05, -3.4168362617492676e-05, -3.2179057598114014e-05, -3.018975257873535e-05, -2.820044755935669e-05, -2.6211142539978027e-05, -2.4221837520599365e-05, -2.2232532501220703e-05, -2.024322748184204e-05, -1.825392246246338e-05, -1.6264617443084717e-05, -1.4275312423706055e-05, -1.2286007404327393e-05, -1.029670238494873e-05, -8.307397365570068e-06, -6.318092346191406e-06, -4.328787326812744e-06, -2.339482307434082e-06, -3.501772880554199e-07, 1.6391277313232422e-06, 3.6284327507019043e-06, 5.617737770080566e-06, 7.6070427894592285e-06, 9.59634780883789e-06, 1.1585652828216553e-05, 1.3574957847595215e-05, 1.5564262866973877e-05, 1.755356788635254e-05, 1.95428729057312e-05, 2.1532177925109863e-05, 2.3521482944488525e-05, 2.5510787963867188e-05, 2.750009298324585e-05, 2.9489398002624512e-05, 3.1478703022003174e-05, 3.3468008041381836e-05, 3.54573130607605e-05, 3.744661808013916e-05, 3.943592309951782e-05, 4.1425228118896484e-05, 4.3414533138275146e-05, 4.540383815765381e-05, 4.739314317703247e-05, 4.938244819641113e-05, 5.1371753215789795e-05, 5.336105823516846e-05, 5.535036325454712e-05, 5.733966827392578e-05, 5.932897329330444e-05, 6.13182783126831e-05, 6.330758333206177e-05, 6.529688835144043e-05, 6.728619337081909e-05, 6.927549839019775e-05, 7.126480340957642e-05, 7.325410842895508e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 10.0, 18.0, 23.0, 35.0, 60.0, 104.0, 198.0, 463.0, 1233.0, 4783.0, 39781.0, 944849.0, 49509.0, 5241.0, 1321.0, 446.0, 195.0, 117.0, 60.0, 36.0, 30.0, 7.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409423828125, -0.39556121826171875, -0.3816986083984375, -0.36783599853515625, -0.353973388671875, -0.34011077880859375, -0.3262481689453125, -0.31238555908203125, -0.29852294921875, -0.28466033935546875, -0.2707977294921875, -0.25693511962890625, -0.243072509765625, -0.22920989990234375, -0.2153472900390625, -0.20148468017578125, -0.1876220703125, -0.17375946044921875, -0.1598968505859375, -0.14603424072265625, -0.132171630859375, -0.11830902099609375, -0.1044464111328125, -0.09058380126953125, -0.07672119140625, -0.06285858154296875, -0.0489959716796875, -0.03513336181640625, -0.021270751953125, -0.00740814208984375, 0.0064544677734375, 0.02031707763671875, 0.0341796875, 0.04804229736328125, 0.0619049072265625, 0.07576751708984375, 0.089630126953125, 0.10349273681640625, 0.1173553466796875, 0.13121795654296875, 0.14508056640625, 0.15894317626953125, 0.1728057861328125, 0.18666839599609375, 0.200531005859375, 0.21439361572265625, 0.2282562255859375, 0.24211883544921875, 0.2559814453125, 0.26984405517578125, 0.2837066650390625, 0.29756927490234375, 0.311431884765625, 0.32529449462890625, 0.3391571044921875, 0.35301971435546875, 0.36688232421875, 0.38074493408203125, 0.3946075439453125, 0.40847015380859375, 0.422332763671875, 0.43619537353515625, 0.4500579833984375, 0.46392059326171875, 0.477783203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 22.0, 23.0, 43.0, 73.0, 187.0, 348.0, 123.0, 63.0, 42.0, 14.0, 14.0, 9.0, 3.0, 8.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.20142269134521484, -0.1965465545654297, -0.19167041778564453, -0.18679428100585938, -0.18191814422607422, -0.17704200744628906, -0.1721658706665039, -0.16728973388671875, -0.1624135971069336, -0.15753746032714844, -0.15266132354736328, -0.14778518676757812, -0.14290904998779297, -0.1380329132080078, -0.13315677642822266, -0.1282806396484375, -0.12340450286865234, -0.11852836608886719, -0.11365222930908203, -0.10877609252929688, -0.10389995574951172, -0.09902381896972656, -0.0941476821899414, -0.08927154541015625, -0.0843954086303711, -0.07951927185058594, -0.07464313507080078, -0.06976699829101562, -0.06489086151123047, -0.06001472473144531, -0.055138587951660156, -0.050262451171875, -0.045386314392089844, -0.04051017761230469, -0.03563404083251953, -0.030757904052734375, -0.02588176727294922, -0.021005630493164062, -0.016129493713378906, -0.01125335693359375, -0.006377220153808594, -0.0015010833740234375, 0.0033750534057617188, 0.008251190185546875, 0.013127326965332031, 0.018003463745117188, 0.022879600524902344, 0.0277557373046875, 0.032631874084472656, 0.03750801086425781, 0.04238414764404297, 0.047260284423828125, 0.05213642120361328, 0.05701255798339844, 0.061888694763183594, 0.06676483154296875, 0.0716409683227539, 0.07651710510253906, 0.08139324188232422, 0.08626937866210938, 0.09114551544189453, 0.09602165222167969, 0.10089778900146484, 0.10577392578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 32.0, 400.0, 524.0, 53.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85219407081604, -0.5773032307624817, -0.30241239070892334, -0.02752155065536499, 0.24736928939819336, 0.5222601890563965, 0.7971509695053101, 1.0720417499542236, 1.3469326496124268, 1.6218235492706299, 1.8967143297195435, 2.171605110168457, 2.44649600982666, 2.7213869094848633, 2.9962778091430664, 3.2711684703826904, 3.5460593700408936, 3.8209502696990967, 4.095840930938721, 4.370731830596924, 4.645622730255127, 4.92051362991333, 5.195404529571533, 5.470294952392578, 5.745185852050781, 6.020076751708984, 6.2949676513671875, 6.569858551025391, 6.844749450683594, 7.119640350341797, 7.394530773162842, 7.669421672821045, 7.944313049316406, 8.21920394897461, 8.494094848632812, 8.768985748291016, 9.043876647949219, 9.318767547607422, 9.593658447265625, 9.868549346923828, 10.143440246582031, 10.418331146240234, 10.693222045898438, 10.96811294555664, 11.243003845214844, 11.517894744873047, 11.79278564453125, 12.067676544189453, 12.34256649017334, 12.617457389831543, 12.892348289489746, 13.16723918914795, 13.442130088806152, 13.717020988464355, 13.991911888122559, 14.266801834106445, 14.541692733764648, 14.816583633422852, 15.091474533081055, 15.366365432739258, 15.641256332397461, 15.916147232055664, 16.191038131713867, 16.46592903137207, 16.740819931030273]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 7.0, 17.0, 20.0, 15.0, 29.0, 32.0, 33.0, 40.0, 47.0, 41.0, 46.0, 50.0, 44.0, 61.0, 50.0, 38.0, 57.0, 43.0, 49.0, 28.0, 34.0, 33.0, 25.0, 27.0, 20.0, 19.0, 9.0, 17.0, 10.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9638789892196655, -0.9347702264785767, -0.9056615233421326, -0.8765528202056885, -0.8474440574645996, -0.8183352947235107, -0.7892265915870667, -0.7601178884506226, -0.7310091257095337, -0.7019003629684448, -0.6727916598320007, -0.6436829566955566, -0.6145741939544678, -0.5854654312133789, -0.5563567280769348, -0.5272480249404907, -0.49813926219940186, -0.4690305292606354, -0.4399217963218689, -0.4108130633831024, -0.38170433044433594, -0.35259559750556946, -0.323486864566803, -0.2943781316280365, -0.26526939868927, -0.23616066575050354, -0.20705193281173706, -0.17794319987297058, -0.1488344669342041, -0.11972573399543762, -0.09061700105667114, -0.06150826811790466, -0.032399535179138184, -0.003290802240371704, 0.025817930698394775, 0.054926663637161255, 0.08403539657592773, 0.11314412951469421, 0.1422528624534607, 0.17136159539222717, 0.20047032833099365, 0.22957906126976013, 0.2586877942085266, 0.2877965271472931, 0.31690526008605957, 0.34601399302482605, 0.37512272596359253, 0.404231458902359, 0.4333401918411255, 0.46244892477989197, 0.49155765771865845, 0.5206663608551025, 0.5497751235961914, 0.5788838863372803, 0.6079925894737244, 0.6371012926101685, 0.6662100553512573, 0.6953188180923462, 0.7244275212287903, 0.7535362243652344, 0.7826449871063232, 0.8117537498474121, 0.8408624529838562, 0.8699711561203003, 0.8990799188613892]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 9.0, 30.0, 37.0, 48.0, 98.0, 162.0, 312.0, 675.0, 1693.0, 5115.0, 23037.0, 282509.0, 3395522.0, 448645.0, 26894.0, 5934.0, 1939.0, 792.0, 337.0, 196.0, 110.0, 43.0, 43.0, 26.0, 20.0, 15.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.941131591796875, -0.90570068359375, -0.870269775390625, -0.8348388671875, -0.799407958984375, -0.76397705078125, -0.728546142578125, -0.693115234375, -0.657684326171875, -0.62225341796875, -0.586822509765625, -0.5513916015625, -0.515960693359375, -0.48052978515625, -0.445098876953125, -0.40966796875, -0.374237060546875, -0.33880615234375, -0.303375244140625, -0.2679443359375, -0.232513427734375, -0.19708251953125, -0.161651611328125, -0.126220703125, -0.090789794921875, -0.05535888671875, -0.019927978515625, 0.0155029296875, 0.050933837890625, 0.08636474609375, 0.121795654296875, 0.1572265625, 0.192657470703125, 0.22808837890625, 0.263519287109375, 0.2989501953125, 0.334381103515625, 0.36981201171875, 0.405242919921875, 0.440673828125, 0.476104736328125, 0.51153564453125, 0.546966552734375, 0.5823974609375, 0.617828369140625, 0.65325927734375, 0.688690185546875, 0.72412109375, 0.759552001953125, 0.79498291015625, 0.830413818359375, 0.8658447265625, 0.901275634765625, 0.93670654296875, 0.972137451171875, 1.007568359375, 1.042999267578125, 1.07843017578125, 1.113861083984375, 1.1492919921875, 1.184722900390625, 1.22015380859375, 1.255584716796875, 1.291015625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 22.0, 19.0, 33.0, 32.0, 70.0, 39.0, 60.0, 53.0, 74.0, 84.0, 70.0, 77.0, 42.0, 53.0, 39.0, 38.0, 34.0, 25.0, 25.0, 17.0, 13.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4363441467285156, -0.41931915283203125, -0.4022941589355469, -0.3852691650390625, -0.3682441711425781, -0.35121917724609375, -0.3341941833496094, -0.317169189453125, -0.3001441955566406, -0.28311920166015625, -0.2660942077636719, -0.2490692138671875, -0.23204421997070312, -0.21501922607421875, -0.19799423217773438, -0.18096923828125, -0.16394424438476562, -0.14691925048828125, -0.12989425659179688, -0.1128692626953125, -0.09584426879882812, -0.07881927490234375, -0.061794281005859375, -0.044769287109375, -0.027744293212890625, -0.01071929931640625, 0.006305694580078125, 0.0233306884765625, 0.040355682373046875, 0.05738067626953125, 0.07440567016601562, 0.0914306640625, 0.10845565795898438, 0.12548065185546875, 0.14250564575195312, 0.1595306396484375, 0.17655563354492188, 0.19358062744140625, 0.21060562133789062, 0.227630615234375, 0.24465560913085938, 0.26168060302734375, 0.2787055969238281, 0.2957305908203125, 0.3127555847167969, 0.32978057861328125, 0.3468055725097656, 0.36383056640625, 0.3808555603027344, 0.39788055419921875, 0.4149055480957031, 0.4319305419921875, 0.4489555358886719, 0.46598052978515625, 0.4830055236816406, 0.500030517578125, 0.5170555114746094, 0.5340805053710938, 0.5511054992675781, 0.5681304931640625, 0.5851554870605469, 0.6021804809570312, 0.6192054748535156, 0.63623046875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 13.0, 18.0, 18.0, 20.0, 44.0, 61.0, 127.0, 252.0, 805.0, 3524.0, 39032.0, 3913388.0, 226365.0, 8401.0, 1383.0, 427.0, 166.0, 87.0, 49.0, 26.0, 17.0, 12.0, 9.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.79412841796875, -1.7357177734375, -1.67730712890625, -1.618896484375, -1.56048583984375, -1.5020751953125, -1.44366455078125, -1.38525390625, -1.32684326171875, -1.2684326171875, -1.21002197265625, -1.151611328125, -1.09320068359375, -1.0347900390625, -0.97637939453125, -0.91796875, -0.85955810546875, -0.8011474609375, -0.74273681640625, -0.684326171875, -0.62591552734375, -0.5675048828125, -0.50909423828125, -0.45068359375, -0.39227294921875, -0.3338623046875, -0.27545166015625, -0.217041015625, -0.15863037109375, -0.1002197265625, -0.04180908203125, 0.0166015625, 0.07501220703125, 0.1334228515625, 0.19183349609375, 0.250244140625, 0.30865478515625, 0.3670654296875, 0.42547607421875, 0.48388671875, 0.54229736328125, 0.6007080078125, 0.65911865234375, 0.717529296875, 0.77593994140625, 0.8343505859375, 0.89276123046875, 0.951171875, 1.00958251953125, 1.0679931640625, 1.12640380859375, 1.184814453125, 1.24322509765625, 1.3016357421875, 1.36004638671875, 1.41845703125, 1.47686767578125, 1.5352783203125, 1.59368896484375, 1.652099609375, 1.71051025390625, 1.7689208984375, 1.82733154296875, 1.8857421875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 12.0, 14.0, 32.0, 40.0, 55.0, 82.0, 163.0, 226.0, 403.0, 759.0, 813.0, 606.0, 298.0, 163.0, 124.0, 70.0, 36.0, 42.0, 23.0, 24.0, 17.0, 13.0, 4.0, 7.0, 10.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235595703125, -0.2275390625, -0.219482421875, -0.21142578125, -0.203369140625, -0.1953125, -0.187255859375, -0.17919921875, -0.171142578125, -0.1630859375, -0.155029296875, -0.14697265625, -0.138916015625, -0.130859375, -0.122802734375, -0.11474609375, -0.106689453125, -0.0986328125, -0.090576171875, -0.08251953125, -0.074462890625, -0.06640625, -0.058349609375, -0.05029296875, -0.042236328125, -0.0341796875, -0.026123046875, -0.01806640625, -0.010009765625, -0.001953125, 0.006103515625, 0.01416015625, 0.022216796875, 0.0302734375, 0.038330078125, 0.04638671875, 0.054443359375, 0.0625, 0.070556640625, 0.07861328125, 0.086669921875, 0.0947265625, 0.102783203125, 0.11083984375, 0.118896484375, 0.126953125, 0.135009765625, 0.14306640625, 0.151123046875, 0.1591796875, 0.167236328125, 0.17529296875, 0.183349609375, 0.19140625, 0.199462890625, 0.20751953125, 0.215576171875, 0.2236328125, 0.231689453125, 0.23974609375, 0.247802734375, 0.255859375, 0.263916015625, 0.27197265625, 0.280029296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 15.0, 28.0, 38.0, 42.0, 61.0, 70.0, 93.0, 106.0, 99.0, 96.0, 71.0, 69.0, 44.0, 43.0, 25.0, 15.0, 13.0, 10.0, 12.0, 8.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021980285644531, -0.6773347854614258, -0.6524714827537537, -0.6276082396507263, -0.6027449369430542, -0.5778816938400269, -0.5530184507369995, -0.5281551480293274, -0.5032918453216553, -0.47842857241630554, -0.4535652995109558, -0.42870205640792847, -0.40383875370025635, -0.378975510597229, -0.3541122376918793, -0.32924896478652954, -0.3043857216835022, -0.27952244877815247, -0.25465917587280273, -0.2297959178686142, -0.20493264496326447, -0.18006937205791473, -0.1552061140537262, -0.13034284114837646, -0.10547956824302673, -0.080616295337677, -0.05575302988290787, -0.030889764428138733, -0.0060264915227890015, 0.01883678138256073, 0.04370003938674927, 0.068563312292099, 0.09342652559280396, 0.11828979849815369, 0.14315307140350342, 0.16801632940769196, 0.1928796023130417, 0.21774287521839142, 0.24260613322257996, 0.2674694061279297, 0.2923326790332794, 0.31719595193862915, 0.3420592248439789, 0.3669224977493286, 0.39178574085235596, 0.4166490435600281, 0.4415122866630554, 0.46637555956840515, 0.4912388324737549, 0.5161020755767822, 0.5409653782844543, 0.5658286213874817, 0.5906919240951538, 0.6155551671981812, 0.6404184103012085, 0.6652817130088806, 0.6901450157165527, 0.7150082588195801, 0.7398715615272522, 0.7647348046302795, 0.7895981073379517, 0.814461350440979, 0.8393245935440063, 0.8641878962516785, 0.8890511393547058]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 12.0, 9.0, 15.0, 18.0, 14.0, 17.0, 19.0, 37.0, 21.0, 38.0, 23.0, 29.0, 40.0, 38.0, 56.0, 50.0, 38.0, 57.0, 46.0, 51.0, 49.0, 32.0, 47.0, 36.0, 24.0, 34.0, 30.0, 25.0, 17.0, 17.0, 10.0, 16.0, 10.0, 5.0, 6.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4636613726615906, -0.44915205240249634, -0.4346427321434021, -0.42013341188430786, -0.4056240916252136, -0.3911147713661194, -0.37660548090934753, -0.3620961606502533, -0.34758684039115906, -0.3330775201320648, -0.3185681998729706, -0.30405887961387634, -0.2895495891571045, -0.27504026889801025, -0.260530948638916, -0.24602162837982178, -0.23151230812072754, -0.2170029878616333, -0.20249366760253906, -0.18798436224460602, -0.17347504198551178, -0.15896572172641754, -0.1444564163684845, -0.12994709610939026, -0.11543777585029602, -0.10092845559120178, -0.08641914278268814, -0.0719098299741745, -0.05740050971508026, -0.04289118945598602, -0.02838187664747238, -0.01387256383895874, 0.0006367862224578857, 0.015146102756261826, 0.029655419290065765, 0.044164735823869705, 0.058674052357673645, 0.07318337261676788, 0.08769268542528152, 0.10220199823379517, 0.1167113184928894, 0.13122063875198364, 0.14572995901107788, 0.16023926436901093, 0.17474858462810516, 0.1892579048871994, 0.20376721024513245, 0.21827653050422668, 0.23278585076332092, 0.24729517102241516, 0.2618044912815094, 0.27631381154060364, 0.2908231019973755, 0.3053324222564697, 0.31984174251556396, 0.3343510627746582, 0.34886038303375244, 0.3633697032928467, 0.3778790235519409, 0.39238834381103516, 0.4068976640701294, 0.42140698432922363, 0.4359162747859955, 0.4504255950450897, 0.46493491530418396]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 1.0, 2.0, 3.0, 7.0, 11.0, 13.0, 12.0, 17.0, 23.0, 47.0, 81.0, 127.0, 269.0, 505.0, 1013.0, 2067.0, 4761.0, 11396.0, 31371.0, 162695.0, 670164.0, 119628.0, 26590.0, 9917.0, 4123.0, 1808.0, 901.0, 431.0, 229.0, 129.0, 70.0, 29.0, 34.0, 15.0, 13.0, 7.0, 12.0, 7.0, 3.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.30810546875, -0.29915618896484375, -0.2902069091796875, -0.28125762939453125, -0.272308349609375, -0.26335906982421875, -0.2544097900390625, -0.24546051025390625, -0.23651123046875, -0.22756195068359375, -0.2186126708984375, -0.20966339111328125, -0.200714111328125, -0.19176483154296875, -0.1828155517578125, -0.17386627197265625, -0.1649169921875, -0.15596771240234375, -0.1470184326171875, -0.13806915283203125, -0.129119873046875, -0.12017059326171875, -0.1112213134765625, -0.10227203369140625, -0.09332275390625, -0.08437347412109375, -0.0754241943359375, -0.06647491455078125, -0.057525634765625, -0.04857635498046875, -0.0396270751953125, -0.03067779541015625, -0.021728515625, -0.01277923583984375, -0.0038299560546875, 0.00511932373046875, 0.014068603515625, 0.02301788330078125, 0.0319671630859375, 0.04091644287109375, 0.04986572265625, 0.05881500244140625, 0.0677642822265625, 0.07671356201171875, 0.085662841796875, 0.09461212158203125, 0.1035614013671875, 0.11251068115234375, 0.1214599609375, 0.13040924072265625, 0.1393585205078125, 0.14830780029296875, 0.157257080078125, 0.16620635986328125, 0.1751556396484375, 0.18410491943359375, 0.19305419921875, 0.20200347900390625, 0.2109527587890625, 0.21990203857421875, 0.228851318359375, 0.23780059814453125, 0.2467498779296875, 0.25569915771484375, 0.2646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 14.0, 7.0, 19.0, 16.0, 15.0, 36.0, 33.0, 33.0, 37.0, 40.0, 59.0, 49.0, 69.0, 66.0, 66.0, 59.0, 61.0, 59.0, 40.0, 46.0, 37.0, 39.0, 27.0, 23.0, 10.0, 11.0, 11.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577537536621094, -0.34661102294921875, -0.3354682922363281, -0.3243255615234375, -0.3131828308105469, -0.30204010009765625, -0.2908973693847656, -0.279754638671875, -0.2686119079589844, -0.25746917724609375, -0.24632644653320312, -0.2351837158203125, -0.22404098510742188, -0.21289825439453125, -0.20175552368164062, -0.19061279296875, -0.17947006225585938, -0.16832733154296875, -0.15718460083007812, -0.1460418701171875, -0.13489913940429688, -0.12375640869140625, -0.11261367797851562, -0.101470947265625, -0.09032821655273438, -0.07918548583984375, -0.06804275512695312, -0.0569000244140625, -0.045757293701171875, -0.03461456298828125, -0.023471832275390625, -0.0123291015625, -0.001186370849609375, 0.00995635986328125, 0.021099090576171875, 0.0322418212890625, 0.043384552001953125, 0.05452728271484375, 0.06567001342773438, 0.076812744140625, 0.08795547485351562, 0.09909820556640625, 0.11024093627929688, 0.1213836669921875, 0.13252639770507812, 0.14366912841796875, 0.15481185913085938, 0.16595458984375, 0.17709732055664062, 0.18824005126953125, 0.19938278198242188, 0.2105255126953125, 0.22166824340820312, 0.23281097412109375, 0.24395370483398438, 0.255096435546875, 0.2662391662597656, 0.27738189697265625, 0.2885246276855469, 0.2996673583984375, 0.3108100891113281, 0.32195281982421875, 0.3330955505371094, 0.34423828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 35.0, 56.0, 68.0, 85.0, 151.0, 248.0, 367.0, 592.0, 1033.0, 1991.0, 3567.0, 7106.0, 15071.0, 34547.0, 96643.0, 310295.0, 373612.0, 124822.0, 42724.0, 17895.0, 8261.0, 4129.0, 2102.0, 1219.0, 677.0, 399.0, 291.0, 151.0, 109.0, 78.0, 52.0, 37.0, 27.0, 15.0, 14.0, 12.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.135986328125, -0.1323223114013672, -0.12865829467773438, -0.12499427795410156, -0.12133026123046875, -0.11766624450683594, -0.11400222778320312, -0.11033821105957031, -0.1066741943359375, -0.10301017761230469, -0.09934616088867188, -0.09568214416503906, -0.09201812744140625, -0.08835411071777344, -0.08469009399414062, -0.08102607727050781, -0.077362060546875, -0.07369804382324219, -0.07003402709960938, -0.06637001037597656, -0.06270599365234375, -0.05904197692871094, -0.055377960205078125, -0.05171394348144531, -0.0480499267578125, -0.04438591003417969, -0.040721893310546875, -0.03705787658691406, -0.03339385986328125, -0.029729843139648438, -0.026065826416015625, -0.022401809692382812, -0.01873779296875, -0.015073776245117188, -0.011409759521484375, -0.0077457427978515625, -0.00408172607421875, -0.0004177093505859375, 0.003246307373046875, 0.0069103240966796875, 0.0105743408203125, 0.014238357543945312, 0.017902374267578125, 0.021566390991210938, 0.02523040771484375, 0.028894424438476562, 0.032558441162109375, 0.03622245788574219, 0.039886474609375, 0.04355049133300781, 0.047214508056640625, 0.05087852478027344, 0.05454254150390625, 0.05820655822753906, 0.061870574951171875, 0.06553459167480469, 0.0691986083984375, 0.07286262512207031, 0.07652664184570312, 0.08019065856933594, 0.08385467529296875, 0.08751869201660156, 0.09118270874023438, 0.09484672546386719, 0.0985107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 13.0, 7.0, 8.0, 9.0, 14.0, 17.0, 16.0, 26.0, 23.0, 24.0, 30.0, 24.0, 20.0, 40.0, 34.0, 39.0, 45.0, 41.0, 33.0, 42.0, 50.0, 67.0, 34.0, 41.0, 36.0, 37.0, 35.0, 23.0, 31.0, 18.0, 26.0, 24.0, 12.0, 10.0, 9.0, 13.0, 5.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.52294921875, -0.50732421875, -0.49169921875, -0.47607421875, -0.46044921875, -0.44482421875, -0.42919921875, -0.41357421875, -0.39794921875, -0.38232421875, -0.36669921875, -0.35107421875, -0.33544921875, -0.31982421875, -0.30419921875, -0.28857421875, -0.27294921875, -0.25732421875, -0.24169921875, -0.22607421875, -0.21044921875, -0.19482421875, -0.17919921875, -0.16357421875, -0.14794921875, -0.13232421875, -0.11669921875, -0.10107421875, -0.08544921875, -0.06982421875, -0.05419921875, -0.03857421875, -0.02294921875, -0.00732421875, 0.00830078125, 0.02392578125, 0.03955078125, 0.05517578125, 0.07080078125, 0.08642578125, 0.10205078125, 0.11767578125, 0.13330078125, 0.14892578125, 0.16455078125, 0.18017578125, 0.19580078125, 0.21142578125, 0.22705078125, 0.24267578125, 0.25830078125, 0.27392578125, 0.28955078125, 0.30517578125, 0.32080078125, 0.33642578125, 0.35205078125, 0.36767578125, 0.38330078125, 0.39892578125, 0.41455078125, 0.43017578125, 0.44580078125, 0.46142578125, 0.47705078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 7.0, 7.0, 16.0, 21.0, 29.0, 53.0, 89.0, 121.0, 210.0, 327.0, 618.0, 1163.0, 2157.0, 4606.0, 10656.0, 27263.0, 83628.0, 306648.0, 417874.0, 128443.0, 38732.0, 13961.0, 6059.0, 2718.0, 1364.0, 733.0, 400.0, 239.0, 142.0, 93.0, 62.0, 34.0, 28.0, 14.0, 8.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.035186767578125, -0.03409290313720703, -0.03299903869628906, -0.031905174255371094, -0.030811309814453125, -0.029717445373535156, -0.028623580932617188, -0.02752971649169922, -0.02643585205078125, -0.02534198760986328, -0.024248123168945312, -0.023154258728027344, -0.022060394287109375, -0.020966529846191406, -0.019872665405273438, -0.01877880096435547, -0.0176849365234375, -0.01659107208251953, -0.015497207641601562, -0.014403343200683594, -0.013309478759765625, -0.012215614318847656, -0.011121749877929688, -0.010027885437011719, -0.00893402099609375, -0.007840156555175781, -0.0067462921142578125, -0.005652427673339844, -0.004558563232421875, -0.0034646987915039062, -0.0023708343505859375, -0.0012769699096679688, -0.00018310546875, 0.0009107589721679688, 0.0020046234130859375, 0.0030984878540039062, 0.004192352294921875, 0.005286216735839844, 0.0063800811767578125, 0.007473945617675781, 0.00856781005859375, 0.009661674499511719, 0.010755538940429688, 0.011849403381347656, 0.012943267822265625, 0.014037132263183594, 0.015130996704101562, 0.01622486114501953, 0.0173187255859375, 0.01841259002685547, 0.019506454467773438, 0.020600318908691406, 0.021694183349609375, 0.022788047790527344, 0.023881912231445312, 0.02497577667236328, 0.02606964111328125, 0.02716350555419922, 0.028257369995117188, 0.029351234436035156, 0.030445098876953125, 0.031538963317871094, 0.03263282775878906, 0.03372669219970703, 0.034820556640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 5.0, 11.0, 11.0, 20.0, 16.0, 30.0, 32.0, 43.0, 51.0, 55.0, 63.0, 93.0, 76.0, 84.0, 72.0, 72.0, 37.0, 47.0, 31.0, 26.0, 29.0, 12.0, 13.0, 11.0, 6.0, 7.0, 7.0, 3.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6702880859375e-05, -2.595502883195877e-05, -2.520717680454254e-05, -2.4459324777126312e-05, -2.3711472749710083e-05, -2.2963620722293854e-05, -2.2215768694877625e-05, -2.1467916667461395e-05, -2.0720064640045166e-05, -1.9972212612628937e-05, -1.9224360585212708e-05, -1.8476508557796478e-05, -1.772865653038025e-05, -1.698080450296402e-05, -1.623295247554779e-05, -1.548510044813156e-05, -1.4737248420715332e-05, -1.3989396393299103e-05, -1.3241544365882874e-05, -1.2493692338466644e-05, -1.1745840311050415e-05, -1.0997988283634186e-05, -1.0250136256217957e-05, -9.502284228801727e-06, -8.754432201385498e-06, -8.006580173969269e-06, -7.2587281465530396e-06, -6.51087611913681e-06, -5.763024091720581e-06, -5.015172064304352e-06, -4.2673200368881226e-06, -3.5194680094718933e-06, -2.771615982055664e-06, -2.023763954639435e-06, -1.2759119272232056e-06, -5.280598998069763e-07, 2.1979212760925293e-07, 9.676441550254822e-07, 1.7154961824417114e-06, 2.4633482098579407e-06, 3.21120023727417e-06, 3.959052264690399e-06, 4.706904292106628e-06, 5.454756319522858e-06, 6.202608346939087e-06, 6.950460374355316e-06, 7.698312401771545e-06, 8.446164429187775e-06, 9.194016456604004e-06, 9.941868484020233e-06, 1.0689720511436462e-05, 1.1437572538852692e-05, 1.2185424566268921e-05, 1.293327659368515e-05, 1.368112862110138e-05, 1.4428980648517609e-05, 1.5176832675933838e-05, 1.5924684703350067e-05, 1.6672536730766296e-05, 1.7420388758182526e-05, 1.8168240785598755e-05, 1.8916092813014984e-05, 1.9663944840431213e-05, 2.0411796867847443e-05, 2.1159648895263672e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 7.0, 19.0, 22.0, 50.0, 77.0, 128.0, 226.0, 413.0, 715.0, 1425.0, 3098.0, 7231.0, 19488.0, 65466.0, 298628.0, 479200.0, 121680.0, 31588.0, 10561.0, 4399.0, 1980.0, 921.0, 555.0, 283.0, 128.0, 76.0, 60.0, 36.0, 18.0, 18.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04656982421875, -0.045124053955078125, -0.04367828369140625, -0.042232513427734375, -0.0407867431640625, -0.039340972900390625, -0.03789520263671875, -0.036449432373046875, -0.035003662109375, -0.033557891845703125, -0.03211212158203125, -0.030666351318359375, -0.0292205810546875, -0.027774810791015625, -0.02632904052734375, -0.024883270263671875, -0.0234375, -0.021991729736328125, -0.02054595947265625, -0.019100189208984375, -0.0176544189453125, -0.016208648681640625, -0.01476287841796875, -0.013317108154296875, -0.011871337890625, -0.010425567626953125, -0.00897979736328125, -0.007534027099609375, -0.0060882568359375, -0.004642486572265625, -0.00319671630859375, -0.001750946044921875, -0.00030517578125, 0.001140594482421875, 0.00258636474609375, 0.004032135009765625, 0.0054779052734375, 0.006923675537109375, 0.00836944580078125, 0.009815216064453125, 0.011260986328125, 0.012706756591796875, 0.01415252685546875, 0.015598297119140625, 0.0170440673828125, 0.018489837646484375, 0.01993560791015625, 0.021381378173828125, 0.0228271484375, 0.024272918701171875, 0.02571868896484375, 0.027164459228515625, 0.0286102294921875, 0.030055999755859375, 0.03150177001953125, 0.032947540283203125, 0.034393310546875, 0.035839080810546875, 0.03728485107421875, 0.038730621337890625, 0.0401763916015625, 0.041622161865234375, 0.04306793212890625, 0.044513702392578125, 0.04595947265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 10.0, 9.0, 10.0, 10.0, 15.0, 24.0, 29.0, 31.0, 49.0, 80.0, 75.0, 79.0, 69.0, 85.0, 82.0, 65.0, 65.0, 51.0, 29.0, 30.0, 26.0, 15.0, 8.0, 14.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01165008544921875, -0.01130533218383789, -0.010960578918457031, -0.010615825653076172, -0.010271072387695312, -0.009926319122314453, -0.009581565856933594, -0.009236812591552734, -0.008892059326171875, -0.008547306060791016, -0.008202552795410156, -0.007857799530029297, -0.0075130462646484375, -0.007168292999267578, -0.006823539733886719, -0.006478786468505859, -0.006134033203125, -0.005789279937744141, -0.005444526672363281, -0.005099773406982422, -0.0047550201416015625, -0.004410266876220703, -0.004065513610839844, -0.0037207603454589844, -0.003376007080078125, -0.0030312538146972656, -0.0026865005493164062, -0.002341747283935547, -0.0019969940185546875, -0.0016522407531738281, -0.0013074874877929688, -0.0009627342224121094, -0.00061798095703125, -0.0002732276916503906, 7.152557373046875e-05, 0.0004162788391113281, 0.0007610321044921875, 0.0011057853698730469, 0.0014505386352539062, 0.0017952919006347656, 0.002140045166015625, 0.0024847984313964844, 0.0028295516967773438, 0.003174304962158203, 0.0035190582275390625, 0.003863811492919922, 0.004208564758300781, 0.004553318023681641, 0.0048980712890625, 0.005242824554443359, 0.005587577819824219, 0.005932331085205078, 0.0062770843505859375, 0.006621837615966797, 0.006966590881347656, 0.007311344146728516, 0.007656097412109375, 0.008000850677490234, 0.008345603942871094, 0.008690357208251953, 0.009035110473632812, 0.009379863739013672, 0.009724617004394531, 0.01006937026977539, 0.01041412353515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 15.0, 25.0, 35.0, 50.0, 89.0, 107.0, 155.0, 142.0, 133.0, 83.0, 54.0, 34.0, 18.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47072476148605347, -0.451171338558197, -0.43161794543266296, -0.4120645225048065, -0.39251112937927246, -0.372957706451416, -0.35340428352355957, -0.3338508605957031, -0.31429746747016907, -0.2947440445423126, -0.27519065141677856, -0.2556372284889221, -0.23608382046222687, -0.21653041243553162, -0.19697698950767517, -0.17742358148097992, -0.15787017345428467, -0.13831676542758942, -0.11876334995031357, -0.09920993447303772, -0.07965652644634247, -0.06010311841964722, -0.04054970294237137, -0.02099628746509552, -0.0014428794384002686, 0.01811053231358528, 0.03766394406557083, 0.05721735581755638, 0.07677076756954193, 0.09632417559623718, 0.11587759107351303, 0.13543100655078888, 0.15498441457748413, 0.17453782260417938, 0.19409123063087463, 0.21364465355873108, 0.23319806158542633, 0.2527514696121216, 0.272304892539978, 0.2918583154678345, 0.31141170859336853, 0.330965131521225, 0.35051852464675903, 0.3700719475746155, 0.3896253705024719, 0.409178763628006, 0.4287321865558624, 0.4482855796813965, 0.46783900260925293, 0.4873924255371094, 0.5069458484649658, 0.5264992117881775, 0.5460526347160339, 0.5656060576438904, 0.5851594805717468, 0.6047129034996033, 0.6242662668228149, 0.6438196897506714, 0.6633731126785278, 0.6829264760017395, 0.702479898929596, 0.7220333218574524, 0.7415867447853088, 0.7611401677131653, 0.7806935906410217]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 1.0, 8.0, 15.0, 15.0, 14.0, 12.0, 22.0, 28.0, 44.0, 33.0, 34.0, 39.0, 44.0, 56.0, 59.0, 60.0, 53.0, 68.0, 58.0, 55.0, 43.0, 43.0, 36.0, 31.0, 21.0, 26.0, 25.0, 18.0, 11.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3167051374912262, -0.30682605504989624, -0.2969469428062439, -0.28706786036491394, -0.2771887481212616, -0.26730966567993164, -0.2574305534362793, -0.24755147099494934, -0.2376723736524582, -0.22779327630996704, -0.2179141789674759, -0.20803508162498474, -0.19815599918365479, -0.18827688694000244, -0.17839780449867249, -0.16851870715618134, -0.15863960981369019, -0.14876051247119904, -0.13888141512870789, -0.12900231778621674, -0.11912322789430618, -0.10924413055181503, -0.09936504065990448, -0.08948594331741333, -0.07960684597492218, -0.06972774863243103, -0.05984865501523018, -0.04996956139802933, -0.04009046405553818, -0.030211366713047028, -0.020332273095846176, -0.010453179478645325, -0.0005740523338317871, 0.009305043146014214, 0.019184138625860214, 0.029063234105706215, 0.038942329585552216, 0.048821426928043365, 0.05870052054524422, 0.06857961416244507, 0.07845871150493622, 0.08833780884742737, 0.09821690618991852, 0.10809599608182907, 0.11797509342432022, 0.12785419821739197, 0.13773328065872192, 0.14761237800121307, 0.15749147534370422, 0.16737057268619537, 0.17724967002868652, 0.18712876737117767, 0.19700786471366882, 0.20688694715499878, 0.21676604449748993, 0.22664514183998108, 0.23652423918247223, 0.24640333652496338, 0.25628241896629333, 0.2661615312099457, 0.27604061365127563, 0.285919725894928, 0.29579880833625793, 0.3056778907775879, 0.31555700302124023]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 16.0, 29.0, 44.0, 64.0, 153.0, 303.0, 589.0, 1120.0, 2428.0, 5775.0, 15069.0, 50161.0, 292596.0, 553929.0, 89504.0, 22276.0, 8082.0, 3431.0, 1477.0, 748.0, 313.0, 185.0, 111.0, 47.0, 29.0, 15.0, 5.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5763320922851562, -0.5584259033203125, -0.5405197143554688, -0.522613525390625, -0.5047073364257812, -0.4868011474609375, -0.46889495849609375, -0.45098876953125, -0.43308258056640625, -0.4151763916015625, -0.39727020263671875, -0.379364013671875, -0.36145782470703125, -0.3435516357421875, -0.32564544677734375, -0.3077392578125, -0.28983306884765625, -0.2719268798828125, -0.25402069091796875, -0.236114501953125, -0.21820831298828125, -0.2003021240234375, -0.18239593505859375, -0.16448974609375, -0.14658355712890625, -0.1286773681640625, -0.11077117919921875, -0.092864990234375, -0.07495880126953125, -0.0570526123046875, -0.03914642333984375, -0.021240234375, -0.00333404541015625, 0.0145721435546875, 0.03247833251953125, 0.050384521484375, 0.06829071044921875, 0.0861968994140625, 0.10410308837890625, 0.12200927734375, 0.13991546630859375, 0.1578216552734375, 0.17572784423828125, 0.193634033203125, 0.21154022216796875, 0.2294464111328125, 0.24735260009765625, 0.2652587890625, 0.28316497802734375, 0.3010711669921875, 0.31897735595703125, 0.336883544921875, 0.35478973388671875, 0.3726959228515625, 0.39060211181640625, 0.40850830078125, 0.42641448974609375, 0.4443206787109375, 0.46222686767578125, 0.480133056640625, 0.49803924560546875, 0.5159454345703125, 0.5338516235351562, 0.5517578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 9.0, 10.0, 13.0, 18.0, 29.0, 20.0, 34.0, 24.0, 40.0, 40.0, 35.0, 54.0, 57.0, 46.0, 54.0, 52.0, 62.0, 58.0, 63.0, 40.0, 45.0, 33.0, 34.0, 20.0, 16.0, 26.0, 11.0, 11.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4165840148925781, -0.39884185791015625, -0.3810997009277344, -0.3633575439453125, -0.3456153869628906, -0.32787322998046875, -0.3101310729980469, -0.292388916015625, -0.2746467590332031, -0.25690460205078125, -0.23916244506835938, -0.2214202880859375, -0.20367813110351562, -0.18593597412109375, -0.16819381713867188, -0.15045166015625, -0.13270950317382812, -0.11496734619140625, -0.09722518920898438, -0.0794830322265625, -0.061740875244140625, -0.04399871826171875, -0.026256561279296875, -0.008514404296875, 0.009227752685546875, 0.02696990966796875, 0.044712066650390625, 0.0624542236328125, 0.08019638061523438, 0.09793853759765625, 0.11568069458007812, 0.1334228515625, 0.15116500854492188, 0.16890716552734375, 0.18664932250976562, 0.2043914794921875, 0.22213363647460938, 0.23987579345703125, 0.2576179504394531, 0.275360107421875, 0.2931022644042969, 0.31084442138671875, 0.3285865783691406, 0.3463287353515625, 0.3640708923339844, 0.38181304931640625, 0.3995552062988281, 0.41729736328125, 0.4350395202636719, 0.45278167724609375, 0.4705238342285156, 0.4882659912109375, 0.5060081481933594, 0.5237503051757812, 0.5414924621582031, 0.559234619140625, 0.5769767761230469, 0.5947189331054688, 0.6124610900878906, 0.6302032470703125, 0.6479454040527344, 0.6656875610351562, 0.6834297180175781, 0.701171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 7.0, 3.0, 4.0, 11.0, 8.0, 12.0, 7.0, 16.0, 16.0, 22.0, 25.0, 25.0, 34.0, 28.0, 50.0, 81.0, 160.0, 286.0, 796.0, 5247.0, 113610.0, 903148.0, 21905.0, 1961.0, 438.0, 172.0, 102.0, 67.0, 55.0, 50.0, 35.0, 21.0, 23.0, 17.0, 22.0, 12.0, 17.0, 17.0, 10.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.3650665283203125, -1.319976806640625, -1.2748870849609375, -1.22979736328125, -1.1847076416015625, -1.139617919921875, -1.0945281982421875, -1.0494384765625, -1.0043487548828125, -0.959259033203125, -0.9141693115234375, -0.86907958984375, -0.8239898681640625, -0.778900146484375, -0.7338104248046875, -0.688720703125, -0.6436309814453125, -0.598541259765625, -0.5534515380859375, -0.50836181640625, -0.4632720947265625, -0.418182373046875, -0.3730926513671875, -0.3280029296875, -0.2829132080078125, -0.237823486328125, -0.1927337646484375, -0.14764404296875, -0.1025543212890625, -0.057464599609375, -0.0123748779296875, 0.03271484375, 0.0778045654296875, 0.122894287109375, 0.1679840087890625, 0.21307373046875, 0.2581634521484375, 0.303253173828125, 0.3483428955078125, 0.3934326171875, 0.4385223388671875, 0.483612060546875, 0.5287017822265625, 0.57379150390625, 0.6188812255859375, 0.663970947265625, 0.7090606689453125, 0.754150390625, 0.7992401123046875, 0.844329833984375, 0.8894195556640625, 0.93450927734375, 0.9795989990234375, 1.024688720703125, 1.0697784423828125, 1.1148681640625, 1.1599578857421875, 1.205047607421875, 1.2501373291015625, 1.29522705078125, 1.3403167724609375, 1.385406494140625, 1.4304962158203125, 1.4755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 7.0, 4.0, 9.0, 6.0, 13.0, 13.0, 9.0, 12.0, 20.0, 18.0, 21.0, 25.0, 22.0, 29.0, 28.0, 22.0, 41.0, 42.0, 38.0, 36.0, 43.0, 34.0, 28.0, 40.0, 52.0, 37.0, 35.0, 41.0, 31.0, 38.0, 24.0, 21.0, 21.0, 17.0, 21.0, 23.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 7.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.474609375, -0.4599800109863281, -0.44535064697265625, -0.4307212829589844, -0.4160919189453125, -0.4014625549316406, -0.38683319091796875, -0.3722038269042969, -0.357574462890625, -0.3429450988769531, -0.32831573486328125, -0.3136863708496094, -0.2990570068359375, -0.2844276428222656, -0.26979827880859375, -0.2551689147949219, -0.24053955078125, -0.22591018676757812, -0.21128082275390625, -0.19665145874023438, -0.1820220947265625, -0.16739273071289062, -0.15276336669921875, -0.13813400268554688, -0.123504638671875, -0.10887527465820312, -0.09424591064453125, -0.07961654663085938, -0.0649871826171875, -0.050357818603515625, -0.03572845458984375, -0.021099090576171875, -0.0064697265625, 0.008159637451171875, 0.02278900146484375, 0.037418365478515625, 0.0520477294921875, 0.06667709350585938, 0.08130645751953125, 0.09593582153320312, 0.110565185546875, 0.12519454956054688, 0.13982391357421875, 0.15445327758789062, 0.1690826416015625, 0.18371200561523438, 0.19834136962890625, 0.21297073364257812, 0.22760009765625, 0.24222946166992188, 0.25685882568359375, 0.2714881896972656, 0.2861175537109375, 0.3007469177246094, 0.31537628173828125, 0.3300056457519531, 0.344635009765625, 0.3592643737792969, 0.37389373779296875, 0.3885231018066406, 0.4031524658203125, 0.4177818298339844, 0.43241119384765625, 0.4470405578613281, 0.461669921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 12.0, 19.0, 23.0, 41.0, 76.0, 127.0, 240.0, 468.0, 1194.0, 3635.0, 16828.0, 145155.0, 772177.0, 91491.0, 12305.0, 2811.0, 988.0, 416.0, 215.0, 103.0, 67.0, 49.0, 26.0, 14.0, 10.0, 16.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2436084747314453, -0.23672866821289062, -0.22984886169433594, -0.22296905517578125, -0.21608924865722656, -0.20920944213867188, -0.2023296356201172, -0.1954498291015625, -0.1885700225830078, -0.18169021606445312, -0.17481040954589844, -0.16793060302734375, -0.16105079650878906, -0.15417098999023438, -0.1472911834716797, -0.140411376953125, -0.1335315704345703, -0.12665176391601562, -0.11977195739746094, -0.11289215087890625, -0.10601234436035156, -0.09913253784179688, -0.09225273132324219, -0.0853729248046875, -0.07849311828613281, -0.07161331176757812, -0.06473350524902344, -0.05785369873046875, -0.05097389221191406, -0.044094085693359375, -0.03721427917480469, -0.03033447265625, -0.023454666137695312, -0.016574859619140625, -0.009695053100585938, -0.00281524658203125, 0.0040645599365234375, 0.010944366455078125, 0.017824172973632812, 0.0247039794921875, 0.03158378601074219, 0.038463592529296875, 0.04534339904785156, 0.05222320556640625, 0.05910301208496094, 0.06598281860351562, 0.07286262512207031, 0.079742431640625, 0.08662223815917969, 0.09350204467773438, 0.10038185119628906, 0.10726165771484375, 0.11414146423339844, 0.12102127075195312, 0.1279010772705078, 0.1347808837890625, 0.1416606903076172, 0.14854049682617188, 0.15542030334472656, 0.16230010986328125, 0.16917991638183594, 0.17605972290039062, 0.1829395294189453, 0.1898193359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 5.0, 2.0, 8.0, 10.0, 15.0, 22.0, 17.0, 25.0, 36.0, 46.0, 71.0, 95.0, 147.0, 139.0, 94.0, 73.0, 47.0, 53.0, 20.0, 17.0, 13.0, 13.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.8806738555431366e-05, -2.781115472316742e-05, -2.6815570890903473e-05, -2.5819987058639526e-05, -2.482440322637558e-05, -2.3828819394111633e-05, -2.2833235561847687e-05, -2.183765172958374e-05, -2.0842067897319794e-05, -1.9846484065055847e-05, -1.88509002327919e-05, -1.7855316400527954e-05, -1.6859732568264008e-05, -1.586414873600006e-05, -1.4868564903736115e-05, -1.3872981071472168e-05, -1.2877397239208221e-05, -1.1881813406944275e-05, -1.0886229574680328e-05, -9.890645742416382e-06, -8.895061910152435e-06, -7.899478077888489e-06, -6.903894245624542e-06, -5.908310413360596e-06, -4.912726581096649e-06, -3.917142748832703e-06, -2.921558916568756e-06, -1.9259750843048096e-06, -9.30391252040863e-07, 6.51925802230835e-08, 1.06077641248703e-06, 2.0563602447509766e-06, 3.051944077014923e-06, 4.04752790927887e-06, 5.043111741542816e-06, 6.038695573806763e-06, 7.034279406070709e-06, 8.029863238334656e-06, 9.025447070598602e-06, 1.0021030902862549e-05, 1.1016614735126495e-05, 1.2012198567390442e-05, 1.3007782399654388e-05, 1.4003366231918335e-05, 1.4998950064182281e-05, 1.5994533896446228e-05, 1.6990117728710175e-05, 1.798570156097412e-05, 1.8981285393238068e-05, 1.9976869225502014e-05, 2.097245305776596e-05, 2.1968036890029907e-05, 2.2963620722293854e-05, 2.39592045545578e-05, 2.4954788386821747e-05, 2.5950372219085693e-05, 2.694595605134964e-05, 2.7941539883613586e-05, 2.8937123715877533e-05, 2.993270754814148e-05, 3.0928291380405426e-05, 3.192387521266937e-05, 3.291945904493332e-05, 3.3915042877197266e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 9.0, 18.0, 20.0, 31.0, 65.0, 120.0, 228.0, 480.0, 1172.0, 3874.0, 20944.0, 248157.0, 709534.0, 53431.0, 7336.0, 1801.0, 641.0, 282.0, 156.0, 67.0, 64.0, 34.0, 27.0, 16.0, 10.0, 8.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3037109375, -0.2961578369140625, -0.288604736328125, -0.2810516357421875, -0.27349853515625, -0.2659454345703125, -0.258392333984375, -0.2508392333984375, -0.2432861328125, -0.2357330322265625, -0.228179931640625, -0.2206268310546875, -0.21307373046875, -0.2055206298828125, -0.197967529296875, -0.1904144287109375, -0.182861328125, -0.1753082275390625, -0.167755126953125, -0.1602020263671875, -0.15264892578125, -0.1450958251953125, -0.137542724609375, -0.1299896240234375, -0.1224365234375, -0.1148834228515625, -0.107330322265625, -0.0997772216796875, -0.09222412109375, -0.0846710205078125, -0.077117919921875, -0.0695648193359375, -0.06201171875, -0.0544586181640625, -0.046905517578125, -0.0393524169921875, -0.03179931640625, -0.0242462158203125, -0.016693115234375, -0.0091400146484375, -0.0015869140625, 0.0059661865234375, 0.013519287109375, 0.0210723876953125, 0.02862548828125, 0.0361785888671875, 0.043731689453125, 0.0512847900390625, 0.058837890625, 0.0663909912109375, 0.073944091796875, 0.0814971923828125, 0.08905029296875, 0.0966033935546875, 0.104156494140625, 0.1117095947265625, 0.1192626953125, 0.1268157958984375, 0.134368896484375, 0.1419219970703125, 0.14947509765625, 0.1570281982421875, 0.164581298828125, 0.1721343994140625, 0.1796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 13.0, 12.0, 21.0, 18.0, 37.0, 44.0, 41.0, 61.0, 87.0, 96.0, 108.0, 85.0, 63.0, 61.0, 56.0, 49.0, 37.0, 20.0, 19.0, 15.0, 8.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05999755859375, -0.05782318115234375, -0.0556488037109375, -0.05347442626953125, -0.051300048828125, -0.04912567138671875, -0.0469512939453125, -0.04477691650390625, -0.0426025390625, -0.04042816162109375, -0.0382537841796875, -0.03607940673828125, -0.033905029296875, -0.03173065185546875, -0.0295562744140625, -0.02738189697265625, -0.02520751953125, -0.02303314208984375, -0.0208587646484375, -0.01868438720703125, -0.016510009765625, -0.01433563232421875, -0.0121612548828125, -0.00998687744140625, -0.0078125, -0.00563812255859375, -0.0034637451171875, -0.00128936767578125, 0.000885009765625, 0.00305938720703125, 0.0052337646484375, 0.00740814208984375, 0.00958251953125, 0.01175689697265625, 0.0139312744140625, 0.01610565185546875, 0.018280029296875, 0.02045440673828125, 0.0226287841796875, 0.02480316162109375, 0.0269775390625, 0.02915191650390625, 0.0313262939453125, 0.03350067138671875, 0.035675048828125, 0.03784942626953125, 0.0400238037109375, 0.04219818115234375, 0.04437255859375, 0.04654693603515625, 0.0487213134765625, 0.05089569091796875, 0.053070068359375, 0.05524444580078125, 0.0574188232421875, 0.05959320068359375, 0.061767578125, 0.06394195556640625, 0.0661163330078125, 0.06829071044921875, 0.070465087890625, 0.07263946533203125, 0.0748138427734375, 0.07698822021484375, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 62.0, 648.0, 275.0, 26.0, 3.0], "bins": [-15.009307861328125, -14.762321472167969, -14.515335083007812, -14.26834774017334, -14.021361351013184, -13.774374961853027, -13.527387619018555, -13.280401229858398, -13.033414840698242, -12.786428451538086, -12.53944206237793, -12.292454719543457, -12.0454683303833, -11.798481941223145, -11.551494598388672, -11.304508209228516, -11.05752182006836, -10.810535430908203, -10.563549041748047, -10.316561698913574, -10.069575309753418, -9.822588920593262, -9.575601577758789, -9.328615188598633, -9.081628799438477, -8.83464241027832, -8.587656021118164, -8.340668678283691, -8.093682289123535, -7.846695899963379, -7.5997090339660645, -7.35272216796875, -7.1057353019714355, -6.858748435974121, -6.611762046813965, -6.364775657653809, -6.117788791656494, -5.87080192565918, -5.623815536499023, -5.376829147338867, -5.129842281341553, -4.882855415344238, -4.635869026184082, -4.388882637023926, -4.141895771026611, -3.894909143447876, -3.6479225158691406, -3.4009358882904053, -3.15394926071167, -2.9069626331329346, -2.659976005554199, -2.412989377975464, -2.1660027503967285, -1.9190161228179932, -1.6720294952392578, -1.4250428676605225, -1.1780563592910767, -0.9310697317123413, -0.684083104133606, -0.4370964765548706, -0.19010984897613525, 0.0568767786026001, 0.30386340618133545, 0.5508500337600708, 0.7978366613388062]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 12.0, 15.0, 11.0, 20.0, 12.0, 26.0, 25.0, 26.0, 30.0, 28.0, 38.0, 34.0, 34.0, 50.0, 44.0, 38.0, 36.0, 47.0, 46.0, 41.0, 36.0, 46.0, 39.0, 38.0, 31.0, 30.0, 24.0, 26.0, 14.0, 15.0, 13.0, 10.0, 9.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316761255264282, -0.8047030568122864, -0.7777299880981445, -0.7507569193840027, -0.7237838506698608, -0.6968108415603638, -0.6698377132415771, -0.6428647041320801, -0.6158916354179382, -0.5889185667037964, -0.5619454979896545, -0.5349724292755127, -0.5079993605613708, -0.4810263216495514, -0.45405325293540955, -0.4270802140235901, -0.40010711550712585, -0.373134046792984, -0.34616097807884216, -0.3191879391670227, -0.29221487045288086, -0.265241801738739, -0.23826873302459717, -0.21129567921161652, -0.18432261049747467, -0.15734954178333282, -0.13037648797035217, -0.10340341925621033, -0.07643035799264908, -0.04945729672908783, -0.022484228014945984, 0.004488825798034668, 0.031461894512176514, 0.05843495577573776, 0.08540801703929901, 0.11238108575344086, 0.1393541395664215, 0.16632720828056335, 0.1933002769947052, 0.22027333080768585, 0.2472463995218277, 0.27421945333480835, 0.3011925220489502, 0.32816559076309204, 0.3551386594772339, 0.38211172819137573, 0.4090847969055176, 0.43605783581733704, 0.4630309045314789, 0.4900039732456207, 0.5169770121574402, 0.543950080871582, 0.5709231495857239, 0.5978962182998657, 0.6248692870140076, 0.6518423557281494, 0.6788154244422913, 0.7057884931564331, 0.732761561870575, 0.7597346305847168, 0.7867076992988586, 0.8136807680130005, 0.8406537771224976, 0.8676268458366394, 0.8945999145507812]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 17.0, 14.0, 21.0, 44.0, 41.0, 89.0, 141.0, 228.0, 408.0, 809.0, 1823.0, 5311.0, 23220.0, 345800.0, 3379263.0, 403344.0, 24337.0, 5541.0, 1904.0, 863.0, 405.0, 268.0, 149.0, 88.0, 45.0, 30.0, 21.0, 20.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.894989013671875, -0.86566162109375, -0.836334228515625, -0.8070068359375, -0.777679443359375, -0.74835205078125, -0.719024658203125, -0.689697265625, -0.660369873046875, -0.63104248046875, -0.601715087890625, -0.5723876953125, -0.543060302734375, -0.51373291015625, -0.484405517578125, -0.455078125, -0.425750732421875, -0.39642333984375, -0.367095947265625, -0.3377685546875, -0.308441162109375, -0.27911376953125, -0.249786376953125, -0.220458984375, -0.191131591796875, -0.16180419921875, -0.132476806640625, -0.1031494140625, -0.073822021484375, -0.04449462890625, -0.015167236328125, 0.01416015625, 0.043487548828125, 0.07281494140625, 0.102142333984375, 0.1314697265625, 0.160797119140625, 0.19012451171875, 0.219451904296875, 0.248779296875, 0.278106689453125, 0.30743408203125, 0.336761474609375, 0.3660888671875, 0.395416259765625, 0.42474365234375, 0.454071044921875, 0.4833984375, 0.512725830078125, 0.54205322265625, 0.571380615234375, 0.6007080078125, 0.630035400390625, 0.65936279296875, 0.688690185546875, 0.718017578125, 0.747344970703125, 0.77667236328125, 0.805999755859375, 0.8353271484375, 0.864654541015625, 0.89398193359375, 0.923309326171875, 0.95263671875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 9.0, 7.0, 21.0, 7.0, 23.0, 9.0, 18.0, 27.0, 25.0, 44.0, 19.0, 25.0, 25.0, 29.0, 26.0, 46.0, 25.0, 44.0, 34.0, 39.0, 47.0, 29.0, 28.0, 32.0, 38.0, 43.0, 39.0, 23.0, 28.0, 19.0, 21.0, 21.0, 16.0, 16.0, 15.0, 12.0, 8.0, 6.0, 2.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.281982421875, -0.2727813720703125, -0.263580322265625, -0.2543792724609375, -0.24517822265625, -0.2359771728515625, -0.226776123046875, -0.2175750732421875, -0.2083740234375, -0.1991729736328125, -0.189971923828125, -0.1807708740234375, -0.17156982421875, -0.1623687744140625, -0.153167724609375, -0.1439666748046875, -0.134765625, -0.1255645751953125, -0.116363525390625, -0.1071624755859375, -0.09796142578125, -0.0887603759765625, -0.079559326171875, -0.0703582763671875, -0.0611572265625, -0.0519561767578125, -0.042755126953125, -0.0335540771484375, -0.02435302734375, -0.0151519775390625, -0.005950927734375, 0.0032501220703125, 0.012451171875, 0.0216522216796875, 0.030853271484375, 0.0400543212890625, 0.04925537109375, 0.0584564208984375, 0.067657470703125, 0.0768585205078125, 0.0860595703125, 0.0952606201171875, 0.104461669921875, 0.1136627197265625, 0.12286376953125, 0.1320648193359375, 0.141265869140625, 0.1504669189453125, 0.15966796875, 0.1688690185546875, 0.178070068359375, 0.1872711181640625, 0.19647216796875, 0.2056732177734375, 0.214874267578125, 0.2240753173828125, 0.2332763671875, 0.2424774169921875, 0.251678466796875, 0.2608795166015625, 0.27008056640625, 0.2792816162109375, 0.288482666015625, 0.2976837158203125, 0.306884765625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 13.0, 6.0, 15.0, 18.0, 19.0, 32.0, 38.0, 53.0, 90.0, 135.0, 306.0, 820.0, 3401.0, 43035.0, 4021819.0, 117151.0, 5327.0, 1080.0, 361.0, 173.0, 105.0, 72.0, 42.0, 37.0, 22.0, 19.0, 7.0, 12.0, 11.0, 10.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.501251220703125, -1.44879150390625, -1.396331787109375, -1.3438720703125, -1.291412353515625, -1.23895263671875, -1.186492919921875, -1.134033203125, -1.081573486328125, -1.02911376953125, -0.976654052734375, -0.9241943359375, -0.871734619140625, -0.81927490234375, -0.766815185546875, -0.71435546875, -0.661895751953125, -0.60943603515625, -0.556976318359375, -0.5045166015625, -0.452056884765625, -0.39959716796875, -0.347137451171875, -0.294677734375, -0.242218017578125, -0.18975830078125, -0.137298583984375, -0.0848388671875, -0.032379150390625, 0.02008056640625, 0.072540283203125, 0.125, 0.177459716796875, 0.22991943359375, 0.282379150390625, 0.3348388671875, 0.387298583984375, 0.43975830078125, 0.492218017578125, 0.544677734375, 0.597137451171875, 0.64959716796875, 0.702056884765625, 0.7545166015625, 0.806976318359375, 0.85943603515625, 0.911895751953125, 0.96435546875, 1.016815185546875, 1.06927490234375, 1.121734619140625, 1.1741943359375, 1.226654052734375, 1.27911376953125, 1.331573486328125, 1.384033203125, 1.436492919921875, 1.48895263671875, 1.541412353515625, 1.5938720703125, 1.646331787109375, 1.69879150390625, 1.751251220703125, 1.8037109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 6.0, 8.0, 17.0, 43.0, 49.0, 80.0, 138.0, 287.0, 494.0, 932.0, 930.0, 501.0, 231.0, 139.0, 82.0, 30.0, 29.0, 16.0, 15.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3156585693359375, -0.307342529296875, -0.2990264892578125, -0.29071044921875, -0.2823944091796875, -0.274078369140625, -0.2657623291015625, -0.2574462890625, -0.2491302490234375, -0.240814208984375, -0.2324981689453125, -0.22418212890625, -0.2158660888671875, -0.207550048828125, -0.1992340087890625, -0.19091796875, -0.1826019287109375, -0.174285888671875, -0.1659698486328125, -0.15765380859375, -0.1493377685546875, -0.141021728515625, -0.1327056884765625, -0.1243896484375, -0.1160736083984375, -0.107757568359375, -0.0994415283203125, -0.09112548828125, -0.0828094482421875, -0.074493408203125, -0.0661773681640625, -0.057861328125, -0.0495452880859375, -0.041229248046875, -0.0329132080078125, -0.02459716796875, -0.0162811279296875, -0.007965087890625, 0.0003509521484375, 0.0086669921875, 0.0169830322265625, 0.025299072265625, 0.0336151123046875, 0.04193115234375, 0.0502471923828125, 0.058563232421875, 0.0668792724609375, 0.0751953125, 0.0835113525390625, 0.091827392578125, 0.1001434326171875, 0.10845947265625, 0.1167755126953125, 0.125091552734375, 0.1334075927734375, 0.1417236328125, 0.1500396728515625, 0.158355712890625, 0.1666717529296875, 0.17498779296875, 0.1833038330078125, 0.191619873046875, 0.1999359130859375, 0.208251953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 2.0, 6.0, 12.0, 17.0, 16.0, 23.0, 35.0, 46.0, 54.0, 76.0, 81.0, 100.0, 89.0, 85.0, 84.0, 65.0, 57.0, 35.0, 36.0, 19.0, 20.0, 11.0, 13.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.571103572845459, -0.5502992272377014, -0.5294948816299438, -0.5086905360221863, -0.4878861606121063, -0.46708181500434875, -0.4462774693965912, -0.42547309398651123, -0.40466874837875366, -0.3838644027709961, -0.3630600571632385, -0.34225571155548096, -0.321451336145401, -0.30064699053764343, -0.27984264492988586, -0.2590382695198059, -0.23823395371437073, -0.21742960810661316, -0.1966252475976944, -0.17582090198993683, -0.15501654148101807, -0.1342121958732605, -0.11340785026550293, -0.09260348975658417, -0.0717991441488266, -0.050994791090488434, -0.030190441757440567, -0.0093860924243927, 0.011418260633945465, 0.03222261369228363, 0.0530269593000412, 0.07383131980895996, 0.09463566541671753, 0.1154400184750557, 0.13624437153339386, 0.15704871714115143, 0.1778530776500702, 0.19865742325782776, 0.21946176886558533, 0.2402661293745041, 0.26107048988342285, 0.2818748354911804, 0.302679181098938, 0.32348352670669556, 0.3442879021167755, 0.3650922477245331, 0.38589659333229065, 0.4067009687423706, 0.4275052845478058, 0.44830963015556335, 0.4691139757633209, 0.4899183511734009, 0.5107226967811584, 0.531527042388916, 0.5523313879966736, 0.5731357336044312, 0.5939400792121887, 0.6147444248199463, 0.6355487704277039, 0.6563531160354614, 0.677157461643219, 0.6979618072509766, 0.7187662124633789, 0.7395705580711365, 0.760374903678894]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 3.0, 2.0, 7.0, 7.0, 11.0, 8.0, 6.0, 12.0, 20.0, 23.0, 21.0, 21.0, 35.0, 28.0, 30.0, 35.0, 46.0, 35.0, 33.0, 39.0, 45.0, 48.0, 42.0, 45.0, 27.0, 33.0, 30.0, 36.0, 33.0, 29.0, 38.0, 19.0, 32.0, 25.0, 18.0, 15.0, 12.0, 7.0, 14.0, 6.0, 3.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32858216762542725, -0.31640568375587463, -0.304229199886322, -0.2920527458190918, -0.2798762619495392, -0.2676997780799866, -0.25552329421043396, -0.24334681034088135, -0.23117034137248993, -0.21899385750293732, -0.2068173885345459, -0.1946409046649933, -0.18246442079544067, -0.17028795182704926, -0.15811146795749664, -0.14593499898910522, -0.1337585151195526, -0.1215820387005806, -0.10940556228160858, -0.09722907841205597, -0.08505260199308395, -0.07287612557411194, -0.060699641704559326, -0.04852316528558731, -0.036346688866615295, -0.02417021058499813, -0.011993732303380966, 0.00018274784088134766, 0.012359224259853363, 0.02453570067882538, 0.03671218454837799, 0.048888660967350006, 0.061065107583999634, 0.07324158400297165, 0.08541806042194366, 0.09759454429149628, 0.10977102071046829, 0.12194749712944031, 0.13412398099899292, 0.14630046486854553, 0.15847693383693695, 0.17065341770648956, 0.18282988667488098, 0.1950063705444336, 0.2071828544139862, 0.21935932338237762, 0.23153580725193024, 0.24371227622032166, 0.25588876008987427, 0.2680652439594269, 0.2802417278289795, 0.2924181818962097, 0.30459466576576233, 0.31677114963531494, 0.32894763350486755, 0.34112411737442017, 0.3533005714416504, 0.365477055311203, 0.3776535391807556, 0.38982999324798584, 0.40200647711753845, 0.41418296098709106, 0.4263594448566437, 0.4385359287261963, 0.4507124125957489]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 17.0, 21.0, 29.0, 45.0, 79.0, 88.0, 158.0, 283.0, 467.0, 834.0, 1704.0, 3653.0, 8698.0, 23171.0, 70863.0, 229989.0, 417614.0, 195996.0, 60235.0, 20295.0, 7792.0, 3141.0, 1513.0, 791.0, 396.0, 253.0, 131.0, 92.0, 59.0, 44.0, 25.0, 22.0, 17.0, 10.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07629585266113281, -0.07361221313476562, -0.07092857360839844, -0.06824493408203125, -0.06556129455566406, -0.06287765502929688, -0.06019401550292969, -0.0575103759765625, -0.05482673645019531, -0.052143096923828125, -0.04945945739746094, -0.04677581787109375, -0.04409217834472656, -0.041408538818359375, -0.03872489929199219, -0.036041259765625, -0.03335762023925781, -0.030673980712890625, -0.027990341186523438, -0.02530670166015625, -0.022623062133789062, -0.019939422607421875, -0.017255783081054688, -0.0145721435546875, -0.011888504028320312, -0.009204864501953125, -0.0065212249755859375, -0.00383758544921875, -0.0011539459228515625, 0.001529693603515625, 0.0042133331298828125, 0.00689697265625, 0.009580612182617188, 0.012264251708984375, 0.014947891235351562, 0.01763153076171875, 0.020315170288085938, 0.022998809814453125, 0.025682449340820312, 0.0283660888671875, 0.031049728393554688, 0.033733367919921875, 0.03641700744628906, 0.03910064697265625, 0.04178428649902344, 0.044467926025390625, 0.04715156555175781, 0.049835205078125, 0.05251884460449219, 0.055202484130859375, 0.05788612365722656, 0.06056976318359375, 0.06325340270996094, 0.06593704223632812, 0.06862068176269531, 0.0713043212890625, 0.07398796081542969, 0.07667160034179688, 0.07935523986816406, 0.08203887939453125, 0.08472251892089844, 0.08740615844726562, 0.09008979797363281, 0.0927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 14.0, 10.0, 10.0, 16.0, 9.0, 34.0, 32.0, 33.0, 28.0, 42.0, 49.0, 54.0, 43.0, 51.0, 58.0, 55.0, 61.0, 33.0, 43.0, 36.0, 41.0, 38.0, 27.0, 36.0, 28.0, 23.0, 18.0, 16.0, 11.0, 9.0, 10.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.253692626953125, -0.24395751953125, -0.234222412109375, -0.2244873046875, -0.214752197265625, -0.20501708984375, -0.195281982421875, -0.185546875, -0.175811767578125, -0.16607666015625, -0.156341552734375, -0.1466064453125, -0.136871337890625, -0.12713623046875, -0.117401123046875, -0.107666015625, -0.097930908203125, -0.08819580078125, -0.078460693359375, -0.0687255859375, -0.058990478515625, -0.04925537109375, -0.039520263671875, -0.02978515625, -0.020050048828125, -0.01031494140625, -0.000579833984375, 0.0091552734375, 0.018890380859375, 0.02862548828125, 0.038360595703125, 0.048095703125, 0.057830810546875, 0.06756591796875, 0.077301025390625, 0.0870361328125, 0.096771240234375, 0.10650634765625, 0.116241455078125, 0.1259765625, 0.135711669921875, 0.14544677734375, 0.155181884765625, 0.1649169921875, 0.174652099609375, 0.18438720703125, 0.194122314453125, 0.203857421875, 0.213592529296875, 0.22332763671875, 0.233062744140625, 0.2427978515625, 0.252532958984375, 0.26226806640625, 0.272003173828125, 0.28173828125, 0.291473388671875, 0.30120849609375, 0.310943603515625, 0.3206787109375, 0.330413818359375, 0.34014892578125, 0.349884033203125, 0.359619140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 17.0, 14.0, 36.0, 38.0, 56.0, 82.0, 142.0, 199.0, 343.0, 616.0, 1133.0, 2317.0, 5167.0, 12620.0, 35839.0, 113749.0, 325108.0, 352513.0, 131236.0, 41650.0, 14397.0, 5711.0, 2622.0, 1250.0, 651.0, 354.0, 239.0, 143.0, 107.0, 50.0, 41.0, 29.0, 22.0, 10.0, 14.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.058951377868652344, -0.05650138854980469, -0.05405139923095703, -0.051601409912109375, -0.04915142059326172, -0.04670143127441406, -0.044251441955566406, -0.04180145263671875, -0.039351463317871094, -0.03690147399902344, -0.03445148468017578, -0.032001495361328125, -0.02955150604248047, -0.027101516723632812, -0.024651527404785156, -0.0222015380859375, -0.019751548767089844, -0.017301559448242188, -0.014851570129394531, -0.012401580810546875, -0.009951591491699219, -0.0075016021728515625, -0.005051612854003906, -0.00260162353515625, -0.00015163421630859375, 0.0022983551025390625, 0.004748344421386719, 0.007198333740234375, 0.009648323059082031, 0.012098312377929688, 0.014548301696777344, 0.016998291015625, 0.019448280334472656, 0.021898269653320312, 0.02434825897216797, 0.026798248291015625, 0.02924823760986328, 0.03169822692871094, 0.034148216247558594, 0.03659820556640625, 0.039048194885253906, 0.04149818420410156, 0.04394817352294922, 0.046398162841796875, 0.04884815216064453, 0.05129814147949219, 0.053748130798339844, 0.0561981201171875, 0.058648109436035156, 0.06109809875488281, 0.06354808807373047, 0.06599807739257812, 0.06844806671142578, 0.07089805603027344, 0.0733480453491211, 0.07579803466796875, 0.0782480239868164, 0.08069801330566406, 0.08314800262451172, 0.08559799194335938, 0.08804798126220703, 0.09049797058105469, 0.09294795989990234, 0.09539794921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 9.0, 8.0, 20.0, 18.0, 23.0, 18.0, 21.0, 35.0, 33.0, 33.0, 55.0, 39.0, 56.0, 63.0, 47.0, 56.0, 41.0, 36.0, 50.0, 43.0, 35.0, 38.0, 32.0, 29.0, 27.0, 30.0, 16.0, 12.0, 11.0, 13.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.583526611328125, -0.56549072265625, -0.547454833984375, -0.5294189453125, -0.511383056640625, -0.49334716796875, -0.475311279296875, -0.457275390625, -0.439239501953125, -0.42120361328125, -0.403167724609375, -0.3851318359375, -0.367095947265625, -0.34906005859375, -0.331024169921875, -0.31298828125, -0.294952392578125, -0.27691650390625, -0.258880615234375, -0.2408447265625, -0.222808837890625, -0.20477294921875, -0.186737060546875, -0.168701171875, -0.150665283203125, -0.13262939453125, -0.114593505859375, -0.0965576171875, -0.078521728515625, -0.06048583984375, -0.042449951171875, -0.0244140625, -0.006378173828125, 0.01165771484375, 0.029693603515625, 0.0477294921875, 0.065765380859375, 0.08380126953125, 0.101837158203125, 0.119873046875, 0.137908935546875, 0.15594482421875, 0.173980712890625, 0.1920166015625, 0.210052490234375, 0.22808837890625, 0.246124267578125, 0.26416015625, 0.282196044921875, 0.30023193359375, 0.318267822265625, 0.3363037109375, 0.354339599609375, 0.37237548828125, 0.390411376953125, 0.408447265625, 0.426483154296875, 0.44451904296875, 0.462554931640625, 0.4805908203125, 0.498626708984375, 0.51666259765625, 0.534698486328125, 0.552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 22.0, 38.0, 53.0, 105.0, 167.0, 326.0, 544.0, 1195.0, 2619.0, 6243.0, 18732.0, 77187.0, 395437.0, 427598.0, 86024.0, 20185.0, 6732.0, 2677.0, 1178.0, 628.0, 336.0, 186.0, 107.0, 66.0, 39.0, 33.0, 15.0, 17.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040771484375, -0.039726972579956055, -0.03868246078491211, -0.037637948989868164, -0.03659343719482422, -0.03554892539978027, -0.03450441360473633, -0.03345990180969238, -0.03241539001464844, -0.03137087821960449, -0.030326366424560547, -0.0292818546295166, -0.028237342834472656, -0.02719283103942871, -0.026148319244384766, -0.02510380744934082, -0.024059295654296875, -0.02301478385925293, -0.021970272064208984, -0.02092576026916504, -0.019881248474121094, -0.01883673667907715, -0.017792224884033203, -0.016747713088989258, -0.015703201293945312, -0.014658689498901367, -0.013614177703857422, -0.012569665908813477, -0.011525154113769531, -0.010480642318725586, -0.00943613052368164, -0.008391618728637695, -0.00734710693359375, -0.006302595138549805, -0.005258083343505859, -0.004213571548461914, -0.0031690597534179688, -0.0021245479583740234, -0.0010800361633300781, -3.552436828613281e-05, 0.0010089874267578125, 0.002053499221801758, 0.003098011016845703, 0.0041425228118896484, 0.005187034606933594, 0.006231546401977539, 0.007276058197021484, 0.00832056999206543, 0.009365081787109375, 0.01040959358215332, 0.011454105377197266, 0.012498617172241211, 0.013543128967285156, 0.014587640762329102, 0.015632152557373047, 0.016676664352416992, 0.017721176147460938, 0.018765687942504883, 0.019810199737548828, 0.020854711532592773, 0.02189922332763672, 0.022943735122680664, 0.02398824691772461, 0.025032758712768555, 0.0260772705078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 8.0, 4.0, 6.0, 6.0, 4.0, 13.0, 12.0, 19.0, 32.0, 32.0, 58.0, 56.0, 78.0, 81.0, 104.0, 93.0, 101.0, 82.0, 54.0, 45.0, 36.0, 34.0, 13.0, 4.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7437152564525604e-05, -1.681409776210785e-05, -1.6191042959690094e-05, -1.556798815727234e-05, -1.4944933354854584e-05, -1.4321878552436829e-05, -1.3698823750019073e-05, -1.3075768947601318e-05, -1.2452714145183563e-05, -1.1829659342765808e-05, -1.1206604540348053e-05, -1.0583549737930298e-05, -9.960494935512543e-06, -9.337440133094788e-06, -8.714385330677032e-06, -8.091330528259277e-06, -7.468275725841522e-06, -6.845220923423767e-06, -6.222166121006012e-06, -5.599111318588257e-06, -4.976056516170502e-06, -4.353001713752747e-06, -3.7299469113349915e-06, -3.1068921089172363e-06, -2.483837306499481e-06, -1.860782504081726e-06, -1.237727701663971e-06, -6.146728992462158e-07, 8.381903171539307e-09, 6.314367055892944e-07, 1.2544915080070496e-06, 1.8775463104248047e-06, 2.50060111284256e-06, 3.123655915260315e-06, 3.74671071767807e-06, 4.369765520095825e-06, 4.99282032251358e-06, 5.6158751249313354e-06, 6.2389299273490906e-06, 6.861984729766846e-06, 7.485039532184601e-06, 8.108094334602356e-06, 8.731149137020111e-06, 9.354203939437866e-06, 9.977258741855621e-06, 1.0600313544273376e-05, 1.1223368346691132e-05, 1.1846423149108887e-05, 1.2469477951526642e-05, 1.3092532753944397e-05, 1.3715587556362152e-05, 1.4338642358779907e-05, 1.4961697161197662e-05, 1.5584751963615417e-05, 1.6207806766033173e-05, 1.6830861568450928e-05, 1.7453916370868683e-05, 1.8076971173286438e-05, 1.8700025975704193e-05, 1.9323080778121948e-05, 1.9946135580539703e-05, 2.056919038295746e-05, 2.1192245185375214e-05, 2.181529998779297e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 11.0, 12.0, 17.0, 32.0, 61.0, 102.0, 142.0, 234.0, 462.0, 829.0, 1798.0, 4314.0, 11887.0, 38347.0, 161437.0, 489571.0, 254919.0, 57533.0, 16368.0, 5694.0, 2386.0, 1096.0, 596.0, 273.0, 164.0, 95.0, 50.0, 31.0, 16.0, 21.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297088623046875, -0.02877020835876465, -0.027831554412841797, -0.026892900466918945, -0.025954246520996094, -0.025015592575073242, -0.02407693862915039, -0.02313828468322754, -0.022199630737304688, -0.021260976791381836, -0.020322322845458984, -0.019383668899536133, -0.01844501495361328, -0.01750636100769043, -0.016567707061767578, -0.015629053115844727, -0.014690399169921875, -0.013751745223999023, -0.012813091278076172, -0.01187443733215332, -0.010935783386230469, -0.009997129440307617, -0.009058475494384766, -0.008119821548461914, -0.0071811676025390625, -0.006242513656616211, -0.005303859710693359, -0.004365205764770508, -0.0034265518188476562, -0.0024878978729248047, -0.0015492439270019531, -0.0006105899810791016, 0.00032806396484375, 0.0012667179107666016, 0.002205371856689453, 0.0031440258026123047, 0.004082679748535156, 0.005021333694458008, 0.005959987640380859, 0.006898641586303711, 0.007837295532226562, 0.008775949478149414, 0.009714603424072266, 0.010653257369995117, 0.011591911315917969, 0.01253056526184082, 0.013469219207763672, 0.014407873153686523, 0.015346527099609375, 0.016285181045532227, 0.017223834991455078, 0.01816248893737793, 0.01910114288330078, 0.020039796829223633, 0.020978450775146484, 0.021917104721069336, 0.022855758666992188, 0.02379441261291504, 0.02473306655883789, 0.025671720504760742, 0.026610374450683594, 0.027549028396606445, 0.028487682342529297, 0.02942633628845215, 0.030364990234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 4.0, 5.0, 9.0, 13.0, 14.0, 16.0, 27.0, 44.0, 44.0, 47.0, 72.0, 93.0, 85.0, 84.0, 91.0, 59.0, 67.0, 54.0, 38.0, 33.0, 18.0, 23.0, 12.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0082244873046875, -0.007966399192810059, -0.007708311080932617, -0.007450222969055176, -0.007192134857177734, -0.006934046745300293, -0.0066759586334228516, -0.00641787052154541, -0.006159782409667969, -0.005901694297790527, -0.005643606185913086, -0.0053855180740356445, -0.005127429962158203, -0.004869341850280762, -0.00461125373840332, -0.004353165626525879, -0.0040950775146484375, -0.003836989402770996, -0.0035789012908935547, -0.0033208131790161133, -0.003062725067138672, -0.0028046369552612305, -0.002546548843383789, -0.0022884607315063477, -0.0020303726196289062, -0.0017722845077514648, -0.0015141963958740234, -0.001256108283996582, -0.0009980201721191406, -0.0007399320602416992, -0.0004818439483642578, -0.0002237558364868164, 3.4332275390625e-05, 0.0002924203872680664, 0.0005505084991455078, 0.0008085966110229492, 0.0010666847229003906, 0.001324772834777832, 0.0015828609466552734, 0.0018409490585327148, 0.0020990371704101562, 0.0023571252822875977, 0.002615213394165039, 0.0028733015060424805, 0.003131389617919922, 0.0033894777297973633, 0.0036475658416748047, 0.003905653953552246, 0.0041637420654296875, 0.004421830177307129, 0.00467991828918457, 0.004938006401062012, 0.005196094512939453, 0.0054541826248168945, 0.005712270736694336, 0.005970358848571777, 0.006228446960449219, 0.00648653507232666, 0.0067446231842041016, 0.007002711296081543, 0.007260799407958984, 0.007518887519836426, 0.007776975631713867, 0.008035063743591309, 0.00829315185546875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 18.0, 25.0, 58.0, 84.0, 154.0, 203.0, 165.0, 129.0, 62.0, 52.0, 17.0, 11.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5143777132034302, -0.489646315574646, -0.4649149477481842, -0.4401835501194, -0.41545215249061584, -0.39072078466415405, -0.3659893870353699, -0.3412579894065857, -0.3165265917778015, -0.29179519414901733, -0.26706382632255554, -0.24233242869377136, -0.21760103106498718, -0.1928696483373642, -0.1681382656097412, -0.14340686798095703, -0.11867550015449524, -0.09394410997629166, -0.06921271979808807, -0.04448133707046509, -0.019749946892261505, 0.004981443285942078, 0.029712826013565063, 0.05444422364234924, 0.07917560636997223, 0.10390699654817581, 0.1286383867263794, 0.15336976945400238, 0.17810115218162537, 0.20283254981040955, 0.22756393253803253, 0.2522953152656555, 0.2770267128944397, 0.3017581105232239, 0.32648947834968567, 0.35122087597846985, 0.37595227360725403, 0.4006836414337158, 0.4254150390625, 0.4501464366912842, 0.47487783432006836, 0.49960923194885254, 0.5243406295776367, 0.5490720272064209, 0.5738033652305603, 0.5985347628593445, 0.6232661604881287, 0.6479975581169128, 0.6727288961410522, 0.6974602937698364, 0.7221916913986206, 0.7469230890274048, 0.7716544270515442, 0.7963858246803284, 0.8211172223091125, 0.8458486199378967, 0.8705800175666809, 0.8953114151954651, 0.9200428128242493, 0.9447741508483887, 0.9695055484771729, 0.994236946105957, 1.0189683437347412, 1.0436997413635254, 1.0684311389923096]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 12.0, 10.0, 14.0, 19.0, 25.0, 25.0, 30.0, 33.0, 41.0, 32.0, 47.0, 46.0, 38.0, 54.0, 57.0, 53.0, 46.0, 39.0, 27.0, 33.0, 37.0, 51.0, 35.0, 32.0, 22.0, 23.0, 24.0, 16.0, 10.0, 8.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23610919713974, -0.22735466063022614, -0.21860012412071228, -0.20984557271003723, -0.20109103620052338, -0.19233649969100952, -0.18358194828033447, -0.17482741177082062, -0.16607287526130676, -0.1573183387517929, -0.14856380224227905, -0.139809250831604, -0.13105471432209015, -0.1223001778125763, -0.11354563385248184, -0.10479108989238739, -0.09603655338287354, -0.08728201687335968, -0.07852747291326523, -0.06977292895317078, -0.06101839244365692, -0.05226385220885277, -0.043509311974048615, -0.03475477173924446, -0.026000231504440308, -0.017245691269636154, -0.008491151034832, 0.0002633891999721527, 0.009017929434776306, 0.01777246966958046, 0.026527009904384613, 0.035281550139188766, 0.04403609037399292, 0.05279063060879707, 0.06154517084360123, 0.07029971480369568, 0.07905425131320953, 0.08780878782272339, 0.09656333178281784, 0.10531787574291229, 0.11407241225242615, 0.12282694876194, 0.13158148527145386, 0.1403360366821289, 0.14909057319164276, 0.15784510970115662, 0.16659966111183167, 0.17535419762134552, 0.18410873413085938, 0.19286327064037323, 0.20161780714988708, 0.21037235856056213, 0.219126895070076, 0.22788143157958984, 0.2366359829902649, 0.24539051949977875, 0.2541450560092926, 0.26289960741996765, 0.2716541290283203, 0.28040868043899536, 0.2891632318496704, 0.29791775345802307, 0.3066723048686981, 0.3154268264770508, 0.32418137788772583]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 12.0, 7.0, 18.0, 53.0, 110.0, 412.0, 1786.0, 11144.0, 132611.0, 821456.0, 71883.0, 7301.0, 1256.0, 321.0, 87.0, 39.0, 18.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.94769287109375, -0.9193115234375, -0.89093017578125, -0.862548828125, -0.83416748046875, -0.8057861328125, -0.77740478515625, -0.7490234375, -0.72064208984375, -0.6922607421875, -0.66387939453125, -0.635498046875, -0.60711669921875, -0.5787353515625, -0.55035400390625, -0.52197265625, -0.49359130859375, -0.4652099609375, -0.43682861328125, -0.408447265625, -0.38006591796875, -0.3516845703125, -0.32330322265625, -0.294921875, -0.26654052734375, -0.2381591796875, -0.20977783203125, -0.181396484375, -0.15301513671875, -0.1246337890625, -0.09625244140625, -0.06787109375, -0.03948974609375, -0.0111083984375, 0.01727294921875, 0.045654296875, 0.07403564453125, 0.1024169921875, 0.13079833984375, 0.1591796875, 0.18756103515625, 0.2159423828125, 0.24432373046875, 0.272705078125, 0.30108642578125, 0.3294677734375, 0.35784912109375, 0.38623046875, 0.41461181640625, 0.4429931640625, 0.47137451171875, 0.499755859375, 0.52813720703125, 0.5565185546875, 0.58489990234375, 0.61328125, 0.64166259765625, 0.6700439453125, 0.69842529296875, 0.726806640625, 0.75518798828125, 0.7835693359375, 0.81195068359375, 0.84033203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 20.0, 27.0, 33.0, 29.0, 43.0, 48.0, 50.0, 53.0, 58.0, 62.0, 90.0, 58.0, 58.0, 45.0, 52.0, 47.0, 41.0, 39.0, 22.0, 23.0, 15.0, 15.0, 10.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484130859375, -0.4623908996582031, -0.44065093994140625, -0.4189109802246094, -0.3971710205078125, -0.3754310607910156, -0.35369110107421875, -0.3319511413574219, -0.310211181640625, -0.2884712219238281, -0.26673126220703125, -0.24499130249023438, -0.2232513427734375, -0.20151138305664062, -0.17977142333984375, -0.15803146362304688, -0.13629150390625, -0.11455154418945312, -0.09281158447265625, -0.07107162475585938, -0.0493316650390625, -0.027591705322265625, -0.00585174560546875, 0.015888214111328125, 0.037628173828125, 0.059368133544921875, 0.08110809326171875, 0.10284805297851562, 0.1245880126953125, 0.14632797241210938, 0.16806793212890625, 0.18980789184570312, 0.2115478515625, 0.23328781127929688, 0.25502777099609375, 0.2767677307128906, 0.2985076904296875, 0.3202476501464844, 0.34198760986328125, 0.3637275695800781, 0.385467529296875, 0.4072074890136719, 0.42894744873046875, 0.4506874084472656, 0.4724273681640625, 0.4941673278808594, 0.5159072875976562, 0.5376472473144531, 0.55938720703125, 0.5811271667480469, 0.6028671264648438, 0.6246070861816406, 0.6463470458984375, 0.6680870056152344, 0.6898269653320312, 0.7115669250488281, 0.733306884765625, 0.7550468444824219, 0.7767868041992188, 0.7985267639160156, 0.8202667236328125, 0.8420066833496094, 0.8637466430664062, 0.8854866027832031, 0.9072265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 9.0, 4.0, 11.0, 20.0, 22.0, 22.0, 37.0, 38.0, 38.0, 37.0, 70.0, 72.0, 110.0, 133.0, 183.0, 337.0, 794.0, 3641.0, 31193.0, 648320.0, 339592.0, 19575.0, 2576.0, 593.0, 290.0, 198.0, 133.0, 106.0, 80.0, 55.0, 46.0, 51.0, 35.0, 24.0, 22.0, 17.0, 12.0, 11.0, 5.0, 4.0, 11.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.8916015625, -0.866058349609375, -0.84051513671875, -0.814971923828125, -0.7894287109375, -0.763885498046875, -0.73834228515625, -0.712799072265625, -0.687255859375, -0.661712646484375, -0.63616943359375, -0.610626220703125, -0.5850830078125, -0.559539794921875, -0.53399658203125, -0.508453369140625, -0.48291015625, -0.457366943359375, -0.43182373046875, -0.406280517578125, -0.3807373046875, -0.355194091796875, -0.32965087890625, -0.304107666015625, -0.278564453125, -0.253021240234375, -0.22747802734375, -0.201934814453125, -0.1763916015625, -0.150848388671875, -0.12530517578125, -0.099761962890625, -0.07421875, -0.048675537109375, -0.02313232421875, 0.002410888671875, 0.0279541015625, 0.053497314453125, 0.07904052734375, 0.104583740234375, 0.130126953125, 0.155670166015625, 0.18121337890625, 0.206756591796875, 0.2322998046875, 0.257843017578125, 0.28338623046875, 0.308929443359375, 0.33447265625, 0.360015869140625, 0.38555908203125, 0.411102294921875, 0.4366455078125, 0.462188720703125, 0.48773193359375, 0.513275146484375, 0.538818359375, 0.564361572265625, 0.58990478515625, 0.615447998046875, 0.6409912109375, 0.666534423828125, 0.69207763671875, 0.717620849609375, 0.7431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 8.0, 13.0, 12.0, 9.0, 14.0, 15.0, 22.0, 28.0, 18.0, 26.0, 26.0, 37.0, 33.0, 30.0, 30.0, 40.0, 44.0, 45.0, 40.0, 42.0, 54.0, 46.0, 42.0, 37.0, 36.0, 34.0, 40.0, 30.0, 16.0, 20.0, 19.0, 9.0, 10.0, 17.0, 11.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5217132568359375, -0.504852294921875, -0.4879913330078125, -0.47113037109375, -0.4542694091796875, -0.437408447265625, -0.4205474853515625, -0.4036865234375, -0.3868255615234375, -0.369964599609375, -0.3531036376953125, -0.33624267578125, -0.3193817138671875, -0.302520751953125, -0.2856597900390625, -0.268798828125, -0.2519378662109375, -0.235076904296875, -0.2182159423828125, -0.20135498046875, -0.1844940185546875, -0.167633056640625, -0.1507720947265625, -0.1339111328125, -0.1170501708984375, -0.100189208984375, -0.0833282470703125, -0.06646728515625, -0.0496063232421875, -0.032745361328125, -0.0158843994140625, 0.0009765625, 0.0178375244140625, 0.034698486328125, 0.0515594482421875, 0.06842041015625, 0.0852813720703125, 0.102142333984375, 0.1190032958984375, 0.1358642578125, 0.1527252197265625, 0.169586181640625, 0.1864471435546875, 0.20330810546875, 0.2201690673828125, 0.237030029296875, 0.2538909912109375, 0.270751953125, 0.2876129150390625, 0.304473876953125, 0.3213348388671875, 0.33819580078125, 0.3550567626953125, 0.371917724609375, 0.3887786865234375, 0.4056396484375, 0.4225006103515625, 0.439361572265625, 0.4562225341796875, 0.47308349609375, 0.4899444580078125, 0.506805419921875, 0.5236663818359375, 0.54052734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 4.0, 6.0, 7.0, 18.0, 22.0, 40.0, 73.0, 162.0, 485.0, 1612.0, 8321.0, 120923.0, 860966.0, 49255.0, 4874.0, 1142.0, 342.0, 136.0, 59.0, 31.0, 20.0, 14.0, 6.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2579078674316406, -0.24848175048828125, -0.23905563354492188, -0.2296295166015625, -0.22020339965820312, -0.21077728271484375, -0.20135116577148438, -0.191925048828125, -0.18249893188476562, -0.17307281494140625, -0.16364669799804688, -0.1542205810546875, -0.14479446411132812, -0.13536834716796875, -0.12594223022460938, -0.11651611328125, -0.10708999633789062, -0.09766387939453125, -0.08823776245117188, -0.0788116455078125, -0.06938552856445312, -0.05995941162109375, -0.050533294677734375, -0.041107177734375, -0.031681060791015625, -0.02225494384765625, -0.012828826904296875, -0.0034027099609375, 0.006023406982421875, 0.01544952392578125, 0.024875640869140625, 0.0343017578125, 0.043727874755859375, 0.05315399169921875, 0.06258010864257812, 0.0720062255859375, 0.08143234252929688, 0.09085845947265625, 0.10028457641601562, 0.109710693359375, 0.11913681030273438, 0.12856292724609375, 0.13798904418945312, 0.1474151611328125, 0.15684127807617188, 0.16626739501953125, 0.17569351196289062, 0.18511962890625, 0.19454574584960938, 0.20397186279296875, 0.21339797973632812, 0.2228240966796875, 0.23225021362304688, 0.24167633056640625, 0.2511024475097656, 0.260528564453125, 0.2699546813964844, 0.27938079833984375, 0.2888069152832031, 0.2982330322265625, 0.3076591491699219, 0.31708526611328125, 0.3265113830566406, 0.3359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 12.0, 20.0, 30.0, 51.0, 65.0, 116.0, 182.0, 191.0, 112.0, 71.0, 43.0, 29.0, 21.0, 17.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7206878662109375e-05, -4.590023308992386e-05, -4.459358751773834e-05, -4.3286941945552826e-05, -4.198029637336731e-05, -4.067365080118179e-05, -3.936700522899628e-05, -3.806035965681076e-05, -3.6753714084625244e-05, -3.544706851243973e-05, -3.414042294025421e-05, -3.2833777368068695e-05, -3.152713179588318e-05, -3.0220486223697662e-05, -2.8913840651512146e-05, -2.760719507932663e-05, -2.6300549507141113e-05, -2.4993903934955597e-05, -2.368725836277008e-05, -2.2380612790584564e-05, -2.1073967218399048e-05, -1.976732164621353e-05, -1.8460676074028015e-05, -1.71540305018425e-05, -1.5847384929656982e-05, -1.4540739357471466e-05, -1.323409378528595e-05, -1.1927448213100433e-05, -1.0620802640914917e-05, -9.3141570687294e-06, -8.007511496543884e-06, -6.700865924358368e-06, -5.3942203521728516e-06, -4.087574779987335e-06, -2.780929207801819e-06, -1.4742836356163025e-06, -1.6763806343078613e-07, 1.1390075087547302e-06, 2.4456530809402466e-06, 3.752298653125763e-06, 5.058944225311279e-06, 6.365589797496796e-06, 7.672235369682312e-06, 8.978880941867828e-06, 1.0285526514053345e-05, 1.1592172086238861e-05, 1.2898817658424377e-05, 1.4205463230609894e-05, 1.551210880279541e-05, 1.6818754374980927e-05, 1.8125399947166443e-05, 1.943204551935196e-05, 2.0738691091537476e-05, 2.2045336663722992e-05, 2.3351982235908508e-05, 2.4658627808094025e-05, 2.596527338027954e-05, 2.7271918952465057e-05, 2.8578564524650574e-05, 2.988521009683609e-05, 3.1191855669021606e-05, 3.249850124120712e-05, 3.380514681339264e-05, 3.5111792385578156e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 6.0, 1.0, 10.0, 9.0, 17.0, 17.0, 36.0, 80.0, 158.0, 493.0, 1764.0, 10846.0, 290272.0, 721933.0, 19331.0, 2544.0, 613.0, 204.0, 86.0, 47.0, 36.0, 11.0, 9.0, 13.0, 5.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.37548828125, -0.3637962341308594, -0.35210418701171875, -0.3404121398925781, -0.3287200927734375, -0.3170280456542969, -0.30533599853515625, -0.2936439514160156, -0.281951904296875, -0.2702598571777344, -0.25856781005859375, -0.24687576293945312, -0.2351837158203125, -0.22349166870117188, -0.21179962158203125, -0.20010757446289062, -0.18841552734375, -0.17672348022460938, -0.16503143310546875, -0.15333938598632812, -0.1416473388671875, -0.12995529174804688, -0.11826324462890625, -0.10657119750976562, -0.094879150390625, -0.08318710327148438, -0.07149505615234375, -0.059803009033203125, -0.0481109619140625, -0.036418914794921875, -0.02472686767578125, -0.013034820556640625, -0.0013427734375, 0.010349273681640625, 0.02204132080078125, 0.033733367919921875, 0.0454254150390625, 0.057117462158203125, 0.06880950927734375, 0.08050155639648438, 0.092193603515625, 0.10388565063476562, 0.11557769775390625, 0.12726974487304688, 0.1389617919921875, 0.15065383911132812, 0.16234588623046875, 0.17403793334960938, 0.18572998046875, 0.19742202758789062, 0.20911407470703125, 0.22080612182617188, 0.2324981689453125, 0.24419021606445312, 0.25588226318359375, 0.2675743103027344, 0.279266357421875, 0.2909584045410156, 0.30265045166015625, 0.3143424987792969, 0.3260345458984375, 0.3377265930175781, 0.34941864013671875, 0.3611106872558594, 0.372802734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 7.0, 23.0, 28.0, 39.0, 67.0, 113.0, 164.0, 156.0, 125.0, 90.0, 41.0, 37.0, 25.0, 17.0, 15.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.10021686553955078, -0.09728431701660156, -0.09435176849365234, -0.09141921997070312, -0.0884866714477539, -0.08555412292480469, -0.08262157440185547, -0.07968902587890625, -0.07675647735595703, -0.07382392883300781, -0.0708913803100586, -0.06795883178710938, -0.06502628326416016, -0.06209373474121094, -0.05916118621826172, -0.0562286376953125, -0.05329608917236328, -0.05036354064941406, -0.047430992126464844, -0.044498443603515625, -0.041565895080566406, -0.03863334655761719, -0.03570079803466797, -0.03276824951171875, -0.02983570098876953, -0.026903152465820312, -0.023970603942871094, -0.021038055419921875, -0.018105506896972656, -0.015172958374023438, -0.012240409851074219, -0.009307861328125, -0.006375312805175781, -0.0034427642822265625, -0.0005102157592773438, 0.002422332763671875, 0.005354881286621094, 0.008287429809570312, 0.011219978332519531, 0.01415252685546875, 0.01708507537841797, 0.020017623901367188, 0.022950172424316406, 0.025882720947265625, 0.028815269470214844, 0.03174781799316406, 0.03468036651611328, 0.0376129150390625, 0.04054546356201172, 0.04347801208496094, 0.046410560607910156, 0.049343109130859375, 0.052275657653808594, 0.05520820617675781, 0.05814075469970703, 0.06107330322265625, 0.06400585174560547, 0.06693840026855469, 0.0698709487915039, 0.07280349731445312, 0.07573604583740234, 0.07866859436035156, 0.08160114288330078, 0.08453369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 20.0, 25.0, 40.0, 65.0, 90.0, 108.0, 141.0, 133.0, 107.0, 91.0, 59.0, 31.0, 24.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8961554765701294, -0.8628050684928894, -0.8294546008110046, -0.7961041927337646, -0.7627537250518799, -0.7294033169746399, -0.6960529088973999, -0.6627024412155151, -0.6293519735336304, -0.5960015654563904, -0.5626510977745056, -0.5293006896972656, -0.49595022201538086, -0.46259981393814087, -0.4292493760585785, -0.3958989381790161, -0.3625485301017761, -0.32919809222221375, -0.29584765434265137, -0.2624972462654114, -0.2291467934846878, -0.19579635560512543, -0.16244593262672424, -0.12909549474716187, -0.09574505686759949, -0.06239462271332741, -0.02904418855905533, 0.004306241869926453, 0.03765667974948883, 0.07100711762905121, 0.10435754060745239, 0.13770797848701477, 0.17105841636657715, 0.20440885424613953, 0.2377592921257019, 0.2711097002029419, 0.30446016788482666, 0.33781057596206665, 0.37116101384162903, 0.4045114517211914, 0.4378618896007538, 0.47121232748031616, 0.5045627355575562, 0.5379132032394409, 0.5712636113166809, 0.6046140789985657, 0.6379644870758057, 0.6713149547576904, 0.7046653628349304, 0.7380157709121704, 0.7713662385940552, 0.8047166466712952, 0.8380671143531799, 0.8714175224304199, 0.9047679901123047, 0.9381183981895447, 0.9714688062667847, 1.0048192739486694, 1.0381696224212646, 1.0715200901031494, 1.1048705577850342, 1.138221025466919, 1.1715713739395142, 1.204921841621399, 1.2382723093032837]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 14.0, 8.0, 12.0, 9.0, 21.0, 15.0, 25.0, 31.0, 37.0, 49.0, 29.0, 45.0, 55.0, 52.0, 56.0, 54.0, 56.0, 56.0, 57.0, 48.0, 50.0, 42.0, 31.0, 40.0, 28.0, 22.0, 19.0, 20.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736251831054688, -0.9356900453567505, -0.8977549076080322, -0.8598197102546692, -0.8218845725059509, -0.7839494347572327, -0.7460142374038696, -0.7080790996551514, -0.6701439619064331, -0.6322088241577148, -0.5942736864089966, -0.5563384890556335, -0.5184033513069153, -0.480468213558197, -0.44253304600715637, -0.4045978784561157, -0.36666274070739746, -0.3287276029586792, -0.29079243540763855, -0.2528572678565979, -0.21492213010787964, -0.17698697745800018, -0.13905182480812073, -0.10111665725708008, -0.06318151950836182, -0.02524636685848236, 0.012688785791397095, 0.05062393844127655, 0.088559091091156, 0.12649424374103546, 0.16442939639091492, 0.20236456394195557, 0.24029982089996338, 0.27823495864868164, 0.3161701261997223, 0.35410529375076294, 0.3920404314994812, 0.42997556924819946, 0.4679107367992401, 0.5058459043502808, 0.543781042098999, 0.5817161798477173, 0.6196513175964355, 0.6575865149497986, 0.6955216526985168, 0.7334567904472351, 0.7713919878005981, 0.8093271255493164, 0.8472622632980347, 0.8851974010467529, 0.9231325387954712, 0.9610677361488342, 0.9990028738975525, 1.0369380712509155, 1.0748732089996338, 1.112808346748352, 1.1507434844970703, 1.1886786222457886, 1.2266137599945068, 1.264548897743225, 1.3024840354919434, 1.3404192924499512, 1.3783544301986694, 1.4162895679473877, 1.454224705696106]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 15.0, 20.0, 43.0, 57.0, 110.0, 269.0, 613.0, 1869.0, 7164.0, 52445.0, 1978350.0, 2083160.0, 59274.0, 7524.0, 2011.0, 680.0, 276.0, 130.0, 78.0, 39.0, 35.0, 15.0, 15.0, 11.0, 10.0, 4.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8552093505859375, -0.824676513671875, -0.7941436767578125, -0.76361083984375, -0.7330780029296875, -0.702545166015625, -0.6720123291015625, -0.6414794921875, -0.6109466552734375, -0.580413818359375, -0.5498809814453125, -0.51934814453125, -0.4888153076171875, -0.458282470703125, -0.4277496337890625, -0.397216796875, -0.3666839599609375, -0.336151123046875, -0.3056182861328125, -0.27508544921875, -0.2445526123046875, -0.214019775390625, -0.1834869384765625, -0.1529541015625, -0.1224212646484375, -0.091888427734375, -0.0613555908203125, -0.03082275390625, -0.0002899169921875, 0.030242919921875, 0.0607757568359375, 0.09130859375, 0.1218414306640625, 0.152374267578125, 0.1829071044921875, 0.21343994140625, 0.2439727783203125, 0.274505615234375, 0.3050384521484375, 0.3355712890625, 0.3661041259765625, 0.396636962890625, 0.4271697998046875, 0.45770263671875, 0.4882354736328125, 0.518768310546875, 0.5493011474609375, 0.579833984375, 0.6103668212890625, 0.640899658203125, 0.6714324951171875, 0.70196533203125, 0.7324981689453125, 0.763031005859375, 0.7935638427734375, 0.8240966796875, 0.8546295166015625, 0.885162353515625, 0.9156951904296875, 0.94622802734375, 0.9767608642578125, 1.007293701171875, 1.0378265380859375, 1.068359375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 12.0, 11.0, 20.0, 21.0, 18.0, 23.0, 39.0, 27.0, 48.0, 40.0, 45.0, 54.0, 40.0, 51.0, 58.0, 45.0, 46.0, 49.0, 41.0, 42.0, 48.0, 29.0, 28.0, 29.0, 28.0, 20.0, 13.0, 15.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3273773193359375, -0.314910888671875, -0.3024444580078125, -0.28997802734375, -0.2775115966796875, -0.265045166015625, -0.2525787353515625, -0.2401123046875, -0.2276458740234375, -0.215179443359375, -0.2027130126953125, -0.19024658203125, -0.1777801513671875, -0.165313720703125, -0.1528472900390625, -0.140380859375, -0.1279144287109375, -0.115447998046875, -0.1029815673828125, -0.09051513671875, -0.0780487060546875, -0.065582275390625, -0.0531158447265625, -0.0406494140625, -0.0281829833984375, -0.015716552734375, -0.0032501220703125, 0.00921630859375, 0.0216827392578125, 0.034149169921875, 0.0466156005859375, 0.05908203125, 0.0715484619140625, 0.084014892578125, 0.0964813232421875, 0.10894775390625, 0.1214141845703125, 0.133880615234375, 0.1463470458984375, 0.1588134765625, 0.1712799072265625, 0.183746337890625, 0.1962127685546875, 0.20867919921875, 0.2211456298828125, 0.233612060546875, 0.2460784912109375, 0.258544921875, 0.2710113525390625, 0.283477783203125, 0.2959442138671875, 0.30841064453125, 0.3208770751953125, 0.333343505859375, 0.3458099365234375, 0.3582763671875, 0.3707427978515625, 0.383209228515625, 0.3956756591796875, 0.40814208984375, 0.4206085205078125, 0.433074951171875, 0.4455413818359375, 0.4580078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 21.0, 38.0, 64.0, 82.0, 191.0, 452.0, 1500.0, 6838.0, 98440.0, 3946702.0, 129280.0, 8024.0, 1651.0, 511.0, 221.0, 81.0, 46.0, 31.0, 21.0, 23.0, 12.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3203125, -1.2831573486328125, -1.246002197265625, -1.2088470458984375, -1.17169189453125, -1.1345367431640625, -1.097381591796875, -1.0602264404296875, -1.0230712890625, -0.9859161376953125, -0.948760986328125, -0.9116058349609375, -0.87445068359375, -0.8372955322265625, -0.800140380859375, -0.7629852294921875, -0.725830078125, -0.6886749267578125, -0.651519775390625, -0.6143646240234375, -0.57720947265625, -0.5400543212890625, -0.502899169921875, -0.4657440185546875, -0.4285888671875, -0.3914337158203125, -0.354278564453125, -0.3171234130859375, -0.27996826171875, -0.2428131103515625, -0.205657958984375, -0.1685028076171875, -0.13134765625, -0.0941925048828125, -0.057037353515625, -0.0198822021484375, 0.01727294921875, 0.0544281005859375, 0.091583251953125, 0.1287384033203125, 0.1658935546875, 0.2030487060546875, 0.240203857421875, 0.2773590087890625, 0.31451416015625, 0.3516693115234375, 0.388824462890625, 0.4259796142578125, 0.463134765625, 0.5002899169921875, 0.537445068359375, 0.5746002197265625, 0.61175537109375, 0.6489105224609375, 0.686065673828125, 0.7232208251953125, 0.7603759765625, 0.7975311279296875, 0.834686279296875, 0.8718414306640625, 0.90899658203125, 0.9461517333984375, 0.983306884765625, 1.0204620361328125, 1.0576171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 15.0, 21.0, 25.0, 27.0, 41.0, 74.0, 101.0, 163.0, 280.0, 462.0, 671.0, 724.0, 527.0, 331.0, 192.0, 121.0, 82.0, 48.0, 46.0, 28.0, 21.0, 16.0, 13.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1548004150390625, -0.149322509765625, -0.1438446044921875, -0.13836669921875, -0.1328887939453125, -0.127410888671875, -0.1219329833984375, -0.116455078125, -0.1109771728515625, -0.105499267578125, -0.1000213623046875, -0.09454345703125, -0.0890655517578125, -0.083587646484375, -0.0781097412109375, -0.0726318359375, -0.0671539306640625, -0.061676025390625, -0.0561981201171875, -0.05072021484375, -0.0452423095703125, -0.039764404296875, -0.0342864990234375, -0.02880859375, -0.0233306884765625, -0.017852783203125, -0.0123748779296875, -0.00689697265625, -0.0014190673828125, 0.004058837890625, 0.0095367431640625, 0.0150146484375, 0.0204925537109375, 0.025970458984375, 0.0314483642578125, 0.03692626953125, 0.0424041748046875, 0.047882080078125, 0.0533599853515625, 0.058837890625, 0.0643157958984375, 0.069793701171875, 0.0752716064453125, 0.08074951171875, 0.0862274169921875, 0.091705322265625, 0.0971832275390625, 0.1026611328125, 0.1081390380859375, 0.113616943359375, 0.1190948486328125, 0.12457275390625, 0.1300506591796875, 0.135528564453125, 0.1410064697265625, 0.146484375, 0.1519622802734375, 0.157440185546875, 0.1629180908203125, 0.16839599609375, 0.1738739013671875, 0.179351806640625, 0.1848297119140625, 0.1903076171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 16.0, 27.0, 30.0, 44.0, 60.0, 90.0, 123.0, 149.0, 122.0, 96.0, 68.0, 65.0, 37.0, 15.0, 11.0, 9.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6566445231437683, -0.6300395727157593, -0.6034346222877502, -0.5768296718597412, -0.5502246618270874, -0.5236197113990784, -0.49701476097106934, -0.4704098105430603, -0.4438048303127289, -0.41719987988471985, -0.3905948996543884, -0.3639899492263794, -0.33738499879837036, -0.31078001856803894, -0.2841750681400299, -0.2575700879096985, -0.23096513748168945, -0.20436017215251923, -0.177755206823349, -0.15115025639533997, -0.12454529106616974, -0.09794032573699951, -0.07133537530899048, -0.04473040997982025, -0.018125444650650024, 0.008479516953229904, 0.03508447855710983, 0.06168943643569946, 0.08829440176486969, 0.11489936709403992, 0.14150431752204895, 0.16810928285121918, 0.19471430778503418, 0.2213192731142044, 0.24792423844337463, 0.27452918887138367, 0.3011341691017151, 0.3277391195297241, 0.35434406995773315, 0.3809490203857422, 0.4075540006160736, 0.43415895104408264, 0.46076393127441406, 0.4873688817024231, 0.5139738321304321, 0.5405788421630859, 0.5671837329864502, 0.593788743019104, 0.620393693447113, 0.6469986438751221, 0.6736035943031311, 0.7002085447311401, 0.726813554763794, 0.753418505191803, 0.780023455619812, 0.806628406047821, 0.8332333564758301, 0.8598383069038391, 0.8864432573318481, 0.913048267364502, 0.939653217792511, 0.96625816822052, 0.992863118648529, 1.019468069076538, 1.046073079109192]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 21.0, 18.0, 26.0, 18.0, 32.0, 41.0, 35.0, 50.0, 55.0, 44.0, 48.0, 52.0, 48.0, 52.0, 46.0, 49.0, 37.0, 47.0, 41.0, 32.0, 30.0, 14.0, 25.0, 17.0, 18.0, 9.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984873294830322, -0.38455063104629517, -0.3706139326095581, -0.35667726397514343, -0.34274056553840637, -0.3288038671016693, -0.31486716866493225, -0.3009305000305176, -0.2869938015937805, -0.27305710315704346, -0.2591204047203064, -0.24518372118473053, -0.23124703764915466, -0.2173103392124176, -0.20337364077568054, -0.18943695724010468, -0.17550025880336761, -0.16156356036663055, -0.1476268768310547, -0.13369017839431763, -0.11975349485874176, -0.1058167964220047, -0.09188010543584824, -0.07794341444969177, -0.06400672346353531, -0.050070032477378845, -0.03613334149122238, -0.02219664677977562, -0.008259955793619156, 0.005676738917827606, 0.01961342990398407, 0.03355012089014053, 0.047486811876297, 0.06142350286245346, 0.07536019384860992, 0.08929689228534698, 0.10323357582092285, 0.11717027425765991, 0.13110697269439697, 0.14504365622997284, 0.1589803397655487, 0.17291703820228577, 0.18685372173786163, 0.2007904201745987, 0.21472710371017456, 0.22866380214691162, 0.24260050058364868, 0.25653719902038574, 0.2704738974571228, 0.28441059589385986, 0.2983472943305969, 0.3122839629650116, 0.32622066140174866, 0.3401573598384857, 0.3540940582752228, 0.36803072690963745, 0.3819674253463745, 0.3959041237831116, 0.40984082221984863, 0.4237774908542633, 0.43771418929100037, 0.4516508877277374, 0.4655875861644745, 0.47952425479888916, 0.4934609532356262]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 24.0, 43.0, 59.0, 179.0, 483.0, 1293.0, 4013.0, 16190.0, 130349.0, 727663.0, 144451.0, 17293.0, 4378.0, 1327.0, 424.0, 185.0, 84.0, 29.0, 18.0, 14.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17403602600097656, -0.16814041137695312, -0.1622447967529297, -0.15634918212890625, -0.1504535675048828, -0.14455795288085938, -0.13866233825683594, -0.1327667236328125, -0.12687110900878906, -0.12097549438476562, -0.11507987976074219, -0.10918426513671875, -0.10328865051269531, -0.09739303588867188, -0.09149742126464844, -0.085601806640625, -0.07970619201660156, -0.07381057739257812, -0.06791496276855469, -0.06201934814453125, -0.05612373352050781, -0.050228118896484375, -0.04433250427246094, -0.0384368896484375, -0.03254127502441406, -0.026645660400390625, -0.020750045776367188, -0.01485443115234375, -0.008958816528320312, -0.003063201904296875, 0.0028324127197265625, 0.00872802734375, 0.014623641967773438, 0.020519256591796875, 0.026414871215820312, 0.03231048583984375, 0.03820610046386719, 0.044101715087890625, 0.04999732971191406, 0.0558929443359375, 0.06178855895996094, 0.06768417358398438, 0.07357978820800781, 0.07947540283203125, 0.08537101745605469, 0.09126663208007812, 0.09716224670410156, 0.103057861328125, 0.10895347595214844, 0.11484909057617188, 0.12074470520019531, 0.12664031982421875, 0.1325359344482422, 0.13843154907226562, 0.14432716369628906, 0.1502227783203125, 0.15611839294433594, 0.16201400756835938, 0.1679096221923828, 0.17380523681640625, 0.1797008514404297, 0.18559646606445312, 0.19149208068847656, 0.1973876953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 9.0, 18.0, 23.0, 19.0, 21.0, 34.0, 48.0, 47.0, 54.0, 65.0, 67.0, 62.0, 68.0, 61.0, 63.0, 65.0, 56.0, 44.0, 35.0, 30.0, 18.0, 27.0, 6.0, 15.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.35467529296875, -0.3424072265625, -0.33013916015625, -0.31787109375, -0.30560302734375, -0.2933349609375, -0.28106689453125, -0.268798828125, -0.25653076171875, -0.2442626953125, -0.23199462890625, -0.2197265625, -0.20745849609375, -0.1951904296875, -0.18292236328125, -0.170654296875, -0.15838623046875, -0.1461181640625, -0.13385009765625, -0.12158203125, -0.10931396484375, -0.0970458984375, -0.08477783203125, -0.072509765625, -0.06024169921875, -0.0479736328125, -0.03570556640625, -0.0234375, -0.01116943359375, 0.0010986328125, 0.01336669921875, 0.025634765625, 0.03790283203125, 0.0501708984375, 0.06243896484375, 0.07470703125, 0.08697509765625, 0.0992431640625, 0.11151123046875, 0.123779296875, 0.13604736328125, 0.1483154296875, 0.16058349609375, 0.1728515625, 0.18511962890625, 0.1973876953125, 0.20965576171875, 0.221923828125, 0.23419189453125, 0.2464599609375, 0.25872802734375, 0.27099609375, 0.28326416015625, 0.2955322265625, 0.30780029296875, 0.320068359375, 0.33233642578125, 0.3446044921875, 0.35687255859375, 0.369140625, 0.38140869140625, 0.3936767578125, 0.40594482421875, 0.418212890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 21.0, 32.0, 57.0, 71.0, 113.0, 194.0, 402.0, 699.0, 1436.0, 3401.0, 9050.0, 26981.0, 104612.0, 395855.0, 371244.0, 94409.0, 25174.0, 8455.0, 3240.0, 1415.0, 670.0, 382.0, 213.0, 127.0, 98.0, 51.0, 33.0, 27.0, 19.0, 6.0, 10.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09930419921875, -0.09629154205322266, -0.09327888488769531, -0.09026622772216797, -0.08725357055664062, -0.08424091339111328, -0.08122825622558594, -0.0782155990600586, -0.07520294189453125, -0.0721902847290039, -0.06917762756347656, -0.06616497039794922, -0.06315231323242188, -0.06013965606689453, -0.05712699890136719, -0.054114341735839844, -0.0511016845703125, -0.048089027404785156, -0.04507637023925781, -0.04206371307373047, -0.039051055908203125, -0.03603839874267578, -0.03302574157714844, -0.030013084411621094, -0.02700042724609375, -0.023987770080566406, -0.020975112915039062, -0.01796245574951172, -0.014949798583984375, -0.011937141418457031, -0.008924484252929688, -0.005911827087402344, -0.002899169921875, 0.00011348724365234375, 0.0031261444091796875, 0.006138801574707031, 0.009151458740234375, 0.012164115905761719, 0.015176773071289062, 0.018189430236816406, 0.02120208740234375, 0.024214744567871094, 0.027227401733398438, 0.03024005889892578, 0.033252716064453125, 0.03626537322998047, 0.03927803039550781, 0.042290687561035156, 0.0453033447265625, 0.048316001892089844, 0.05132865905761719, 0.05434131622314453, 0.057353973388671875, 0.06036663055419922, 0.06337928771972656, 0.0663919448852539, 0.06940460205078125, 0.0724172592163086, 0.07542991638183594, 0.07844257354736328, 0.08145523071289062, 0.08446788787841797, 0.08748054504394531, 0.09049320220947266, 0.093505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 19.0, 14.0, 30.0, 33.0, 45.0, 34.0, 48.0, 49.0, 53.0, 75.0, 52.0, 45.0, 61.0, 55.0, 42.0, 47.0, 47.0, 36.0, 32.0, 27.0, 20.0, 17.0, 17.0, 10.0, 2.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5912322998046875, -0.569671630859375, -0.5481109619140625, -0.52655029296875, -0.5049896240234375, -0.483428955078125, -0.4618682861328125, -0.4403076171875, -0.4187469482421875, -0.397186279296875, -0.3756256103515625, -0.35406494140625, -0.3325042724609375, -0.310943603515625, -0.2893829345703125, -0.267822265625, -0.2462615966796875, -0.224700927734375, -0.2031402587890625, -0.18157958984375, -0.1600189208984375, -0.138458251953125, -0.1168975830078125, -0.0953369140625, -0.0737762451171875, -0.052215576171875, -0.0306549072265625, -0.00909423828125, 0.0124664306640625, 0.034027099609375, 0.0555877685546875, 0.0771484375, 0.0987091064453125, 0.120269775390625, 0.1418304443359375, 0.16339111328125, 0.1849517822265625, 0.206512451171875, 0.2280731201171875, 0.2496337890625, 0.2711944580078125, 0.292755126953125, 0.3143157958984375, 0.33587646484375, 0.3574371337890625, 0.378997802734375, 0.4005584716796875, 0.422119140625, 0.4436798095703125, 0.465240478515625, 0.4868011474609375, 0.50836181640625, 0.5299224853515625, 0.551483154296875, 0.5730438232421875, 0.5946044921875, 0.6161651611328125, 0.637725830078125, 0.6592864990234375, 0.68084716796875, 0.7024078369140625, 0.723968505859375, 0.7455291748046875, 0.76708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 23.0, 22.0, 27.0, 28.0, 46.0, 86.0, 135.0, 241.0, 443.0, 823.0, 1642.0, 3768.0, 9746.0, 32138.0, 141307.0, 505474.0, 271021.0, 56006.0, 15437.0, 5525.0, 2236.0, 1051.0, 527.0, 317.0, 193.0, 89.0, 66.0, 36.0, 27.0, 23.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03829383850097656, -0.037250518798828125, -0.03620719909667969, -0.03516387939453125, -0.03412055969238281, -0.033077239990234375, -0.03203392028808594, -0.0309906005859375, -0.029947280883789062, -0.028903961181640625, -0.027860641479492188, -0.02681732177734375, -0.025774002075195312, -0.024730682373046875, -0.023687362670898438, -0.02264404296875, -0.021600723266601562, -0.020557403564453125, -0.019514083862304688, -0.01847076416015625, -0.017427444458007812, -0.016384124755859375, -0.015340805053710938, -0.0142974853515625, -0.013254165649414062, -0.012210845947265625, -0.011167526245117188, -0.01012420654296875, -0.009080886840820312, -0.008037567138671875, -0.0069942474365234375, -0.005950927734375, -0.0049076080322265625, -0.003864288330078125, -0.0028209686279296875, -0.00177764892578125, -0.0007343292236328125, 0.000308990478515625, 0.0013523101806640625, 0.0023956298828125, 0.0034389495849609375, 0.004482269287109375, 0.0055255889892578125, 0.00656890869140625, 0.0076122283935546875, 0.008655548095703125, 0.009698867797851562, 0.0107421875, 0.011785507202148438, 0.012828826904296875, 0.013872146606445312, 0.01491546630859375, 0.015958786010742188, 0.017002105712890625, 0.018045425415039062, 0.0190887451171875, 0.020132064819335938, 0.021175384521484375, 0.022218704223632812, 0.02326202392578125, 0.024305343627929688, 0.025348663330078125, 0.026391983032226562, 0.027435302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 6.0, 6.0, 15.0, 10.0, 20.0, 19.0, 22.0, 31.0, 55.0, 52.0, 59.0, 74.0, 105.0, 74.0, 70.0, 74.0, 56.0, 53.0, 32.0, 39.0, 26.0, 17.0, 24.0, 10.0, 5.0, 7.0, 8.0, 6.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6510486602783203e-05, -1.6016885638237e-05, -1.5523284673690796e-05, -1.5029683709144592e-05, -1.4536082744598389e-05, -1.4042481780052185e-05, -1.3548880815505981e-05, -1.3055279850959778e-05, -1.2561678886413574e-05, -1.206807792186737e-05, -1.1574476957321167e-05, -1.1080875992774963e-05, -1.058727502822876e-05, -1.0093674063682556e-05, -9.600073099136353e-06, -9.106472134590149e-06, -8.612871170043945e-06, -8.119270205497742e-06, -7.625669240951538e-06, -7.1320682764053345e-06, -6.638467311859131e-06, -6.144866347312927e-06, -5.651265382766724e-06, -5.15766441822052e-06, -4.664063453674316e-06, -4.170462489128113e-06, -3.676861524581909e-06, -3.1832605600357056e-06, -2.689659595489502e-06, -2.1960586309432983e-06, -1.7024576663970947e-06, -1.2088567018508911e-06, -7.152557373046875e-07, -2.2165477275848389e-07, 2.7194619178771973e-07, 7.655471563339233e-07, 1.259148120880127e-06, 1.7527490854263306e-06, 2.246350049972534e-06, 2.739951014518738e-06, 3.2335519790649414e-06, 3.727152943611145e-06, 4.220753908157349e-06, 4.714354872703552e-06, 5.207955837249756e-06, 5.7015568017959595e-06, 6.195157766342163e-06, 6.688758730888367e-06, 7.18235969543457e-06, 7.675960659980774e-06, 8.169561624526978e-06, 8.663162589073181e-06, 9.156763553619385e-06, 9.650364518165588e-06, 1.0143965482711792e-05, 1.0637566447257996e-05, 1.11311674118042e-05, 1.1624768376350403e-05, 1.2118369340896606e-05, 1.261197030544281e-05, 1.3105571269989014e-05, 1.3599172234535217e-05, 1.4092773199081421e-05, 1.4586374163627625e-05, 1.5079975128173828e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 10.0, 7.0, 11.0, 18.0, 26.0, 43.0, 66.0, 108.0, 175.0, 296.0, 474.0, 867.0, 1953.0, 4927.0, 14199.0, 53378.0, 254597.0, 505310.0, 159826.0, 35076.0, 10225.0, 3634.0, 1547.0, 708.0, 406.0, 240.0, 149.0, 97.0, 63.0, 40.0, 24.0, 15.0, 17.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032470703125, -0.03143501281738281, -0.030399322509765625, -0.029363632202148438, -0.02832794189453125, -0.027292251586914062, -0.026256561279296875, -0.025220870971679688, -0.0241851806640625, -0.023149490356445312, -0.022113800048828125, -0.021078109741210938, -0.02004241943359375, -0.019006729125976562, -0.017971038818359375, -0.016935348510742188, -0.015899658203125, -0.014863967895507812, -0.013828277587890625, -0.012792587280273438, -0.01175689697265625, -0.010721206665039062, -0.009685516357421875, -0.008649826049804688, -0.0076141357421875, -0.0065784454345703125, -0.005542755126953125, -0.0045070648193359375, -0.00347137451171875, -0.0024356842041015625, -0.001399993896484375, -0.0003643035888671875, 0.00067138671875, 0.0017070770263671875, 0.002742767333984375, 0.0037784576416015625, 0.00481414794921875, 0.0058498382568359375, 0.006885528564453125, 0.007921218872070312, 0.0089569091796875, 0.009992599487304688, 0.011028289794921875, 0.012063980102539062, 0.01309967041015625, 0.014135360717773438, 0.015171051025390625, 0.016206741333007812, 0.017242431640625, 0.018278121948242188, 0.019313812255859375, 0.020349502563476562, 0.02138519287109375, 0.022420883178710938, 0.023456573486328125, 0.024492263793945312, 0.0255279541015625, 0.026563644409179688, 0.027599334716796875, 0.028635025024414062, 0.02967071533203125, 0.030706405639648438, 0.031742095947265625, 0.03277778625488281, 0.0338134765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 4.0, 9.0, 19.0, 12.0, 19.0, 35.0, 28.0, 25.0, 26.0, 51.0, 58.0, 56.0, 72.0, 56.0, 64.0, 52.0, 65.0, 49.0, 45.0, 34.0, 31.0, 26.0, 29.0, 18.0, 17.0, 17.0, 8.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005687713623046875, -0.005492985248565674, -0.005298256874084473, -0.0051035284996032715, -0.00490880012512207, -0.004714071750640869, -0.004519343376159668, -0.004324615001678467, -0.004129886627197266, -0.0039351582527160645, -0.0037404298782348633, -0.003545701503753662, -0.003350973129272461, -0.0031562447547912598, -0.0029615163803100586, -0.0027667880058288574, -0.0025720596313476562, -0.002377331256866455, -0.002182602882385254, -0.0019878745079040527, -0.0017931461334228516, -0.0015984177589416504, -0.0014036893844604492, -0.001208961009979248, -0.0010142326354980469, -0.0008195042610168457, -0.0006247758865356445, -0.00043004751205444336, -0.0002353191375732422, -4.0590763092041016e-05, 0.00015413761138916016, 0.00034886598587036133, 0.0005435943603515625, 0.0007383227348327637, 0.0009330511093139648, 0.001127779483795166, 0.0013225078582763672, 0.0015172362327575684, 0.0017119646072387695, 0.0019066929817199707, 0.002101421356201172, 0.002296149730682373, 0.0024908781051635742, 0.0026856064796447754, 0.0028803348541259766, 0.0030750632286071777, 0.003269791603088379, 0.00346451997756958, 0.0036592483520507812, 0.0038539767265319824, 0.004048705101013184, 0.004243433475494385, 0.004438161849975586, 0.004632890224456787, 0.004827618598937988, 0.0050223469734191895, 0.005217075347900391, 0.005411803722381592, 0.005606532096862793, 0.005801260471343994, 0.005995988845825195, 0.0061907172203063965, 0.006385445594787598, 0.006580173969268799, 0.00677490234375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 20.0, 36.0, 61.0, 93.0, 209.0, 224.0, 156.0, 96.0, 45.0, 23.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888968706130981, -0.5613466501235962, -0.5337964296340942, -0.5062462091445923, -0.47869595885276794, -0.451145738363266, -0.42359548807144165, -0.3960452675819397, -0.36849504709243774, -0.3409448266029358, -0.31339460611343384, -0.2858443558216095, -0.25829413533210754, -0.2307439148426056, -0.20319367945194244, -0.1756434440612793, -0.14809322357177734, -0.1205429956316948, -0.09299276769161224, -0.0654425397515297, -0.037892311811447144, -0.01034209132194519, 0.017208144068717957, 0.044758379459381104, 0.07230859994888306, 0.0998588278889656, 0.12740905582904816, 0.1549592912197113, 0.18250951170921326, 0.2100597321987152, 0.23760996758937836, 0.2651602029800415, 0.29271042346954346, 0.3202606439590454, 0.34781086444854736, 0.3753611147403717, 0.40291133522987366, 0.4304615557193756, 0.45801180601119995, 0.4855620265007019, 0.5131122469902039, 0.5406624674797058, 0.5682126879692078, 0.5957629084587097, 0.6233131885528564, 0.6508634090423584, 0.6784136295318604, 0.7059638500213623, 0.7335140705108643, 0.7610642910003662, 0.7886145114898682, 0.8161647319793701, 0.8437149524688721, 0.871265172958374, 0.8988154530525208, 0.9263656735420227, 0.9539158940315247, 0.9814661145210266, 1.0090163946151733, 1.0365666151046753, 1.0641168355941772, 1.0916670560836792, 1.1192172765731812, 1.146767497062683, 1.174317717552185]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 9.0, 13.0, 9.0, 20.0, 16.0, 25.0, 25.0, 31.0, 47.0, 49.0, 47.0, 52.0, 62.0, 59.0, 58.0, 55.0, 62.0, 58.0, 51.0, 51.0, 40.0, 41.0, 18.0, 17.0, 25.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27519190311431885, -0.2643825113773346, -0.25357311964035034, -0.2427637279033661, -0.23195433616638184, -0.22114494442939758, -0.21033555269241333, -0.19952616095542908, -0.18871676921844482, -0.17790737748146057, -0.16709798574447632, -0.15628859400749207, -0.1454792022705078, -0.13466981053352356, -0.1238604187965393, -0.11305102705955505, -0.1022416353225708, -0.09143224358558655, -0.0806228518486023, -0.06981346011161804, -0.05900406837463379, -0.048194676637649536, -0.03738528490066528, -0.02657589316368103, -0.015766501426696777, -0.004957109689712524, 0.0058522820472717285, 0.01666167378425598, 0.027471065521240234, 0.03828045725822449, 0.04908984899520874, 0.05989924073219299, 0.07070866227149963, 0.08151805400848389, 0.09232744574546814, 0.10313683748245239, 0.11394622921943665, 0.1247556209564209, 0.13556501269340515, 0.1463744044303894, 0.15718379616737366, 0.1679931879043579, 0.17880257964134216, 0.18961197137832642, 0.20042136311531067, 0.21123075485229492, 0.22204014658927917, 0.23284953832626343, 0.24365893006324768, 0.25446832180023193, 0.2652777135372162, 0.27608710527420044, 0.2868964970111847, 0.29770588874816895, 0.3085152804851532, 0.31932467222213745, 0.3301340639591217, 0.34094345569610596, 0.3517528474330902, 0.36256223917007446, 0.3733716309070587, 0.38418102264404297, 0.3949904143810272, 0.4057998061180115, 0.4166091978549957]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 12.0, 18.0, 35.0, 111.0, 369.0, 2133.0, 22338.0, 864903.0, 151378.0, 6036.0, 849.0, 199.0, 65.0, 27.0, 11.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.223876953125, -1.18408203125, -1.144287109375, -1.1044921875, -1.064697265625, -1.02490234375, -0.985107421875, -0.9453125, -0.905517578125, -0.86572265625, -0.825927734375, -0.7861328125, -0.746337890625, -0.70654296875, -0.666748046875, -0.626953125, -0.587158203125, -0.54736328125, -0.507568359375, -0.4677734375, -0.427978515625, -0.38818359375, -0.348388671875, -0.30859375, -0.268798828125, -0.22900390625, -0.189208984375, -0.1494140625, -0.109619140625, -0.06982421875, -0.030029296875, 0.009765625, 0.049560546875, 0.08935546875, 0.129150390625, 0.1689453125, 0.208740234375, 0.24853515625, 0.288330078125, 0.328125, 0.367919921875, 0.40771484375, 0.447509765625, 0.4873046875, 0.527099609375, 0.56689453125, 0.606689453125, 0.646484375, 0.686279296875, 0.72607421875, 0.765869140625, 0.8056640625, 0.845458984375, 0.88525390625, 0.925048828125, 0.96484375, 1.004638671875, 1.04443359375, 1.084228515625, 1.1240234375, 1.163818359375, 1.20361328125, 1.243408203125, 1.283203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 15.0, 16.0, 29.0, 42.0, 71.0, 98.0, 112.0, 114.0, 114.0, 114.0, 103.0, 69.0, 42.0, 29.0, 20.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5399551391601562, -0.4983673095703125, -0.45677947998046875, -0.415191650390625, -0.37360382080078125, -0.3320159912109375, -0.29042816162109375, -0.24884033203125, -0.20725250244140625, -0.1656646728515625, -0.12407684326171875, -0.082489013671875, -0.04090118408203125, 0.0006866455078125, 0.04227447509765625, 0.0838623046875, 0.12545013427734375, 0.1670379638671875, 0.20862579345703125, 0.250213623046875, 0.29180145263671875, 0.3333892822265625, 0.37497711181640625, 0.41656494140625, 0.45815277099609375, 0.4997406005859375, 0.5413284301757812, 0.582916259765625, 0.6245040893554688, 0.6660919189453125, 0.7076797485351562, 0.749267578125, 0.7908554077148438, 0.8324432373046875, 0.8740310668945312, 0.915618896484375, 0.9572067260742188, 0.9987945556640625, 1.0403823852539062, 1.08197021484375, 1.1235580444335938, 1.1651458740234375, 1.2067337036132812, 1.248321533203125, 1.2899093627929688, 1.3314971923828125, 1.3730850219726562, 1.4146728515625, 1.4562606811523438, 1.4978485107421875, 1.5394363403320312, 1.581024169921875, 1.6226119995117188, 1.6641998291015625, 1.7057876586914062, 1.74737548828125, 1.7889633178710938, 1.8305511474609375, 1.8721389770507812, 1.913726806640625, 1.9553146362304688, 1.9969024658203125, 2.0384902954101562, 2.080078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 12.0, 10.0, 11.0, 14.0, 32.0, 25.0, 43.0, 96.0, 144.0, 269.0, 685.0, 2066.0, 11721.0, 199846.0, 796426.0, 31122.0, 4167.0, 964.0, 383.0, 193.0, 114.0, 74.0, 37.0, 27.0, 20.0, 19.0, 11.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.0732421875, -1.0465545654296875, -1.019866943359375, -0.9931793212890625, -0.96649169921875, -0.9398040771484375, -0.913116455078125, -0.8864288330078125, -0.8597412109375, -0.8330535888671875, -0.806365966796875, -0.7796783447265625, -0.75299072265625, -0.7263031005859375, -0.699615478515625, -0.6729278564453125, -0.646240234375, -0.6195526123046875, -0.592864990234375, -0.5661773681640625, -0.53948974609375, -0.5128021240234375, -0.486114501953125, -0.4594268798828125, -0.4327392578125, -0.4060516357421875, -0.379364013671875, -0.3526763916015625, -0.32598876953125, -0.2993011474609375, -0.272613525390625, -0.2459259033203125, -0.21923828125, -0.1925506591796875, -0.165863037109375, -0.1391754150390625, -0.11248779296875, -0.0858001708984375, -0.059112548828125, -0.0324249267578125, -0.0057373046875, 0.0209503173828125, 0.047637939453125, 0.0743255615234375, 0.10101318359375, 0.1277008056640625, 0.154388427734375, 0.1810760498046875, 0.207763671875, 0.2344512939453125, 0.261138916015625, 0.2878265380859375, 0.31451416015625, 0.3412017822265625, 0.367889404296875, 0.3945770263671875, 0.4212646484375, 0.4479522705078125, 0.474639892578125, 0.5013275146484375, 0.52801513671875, 0.5547027587890625, 0.581390380859375, 0.6080780029296875, 0.634765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 6.0, 5.0, 7.0, 14.0, 21.0, 22.0, 16.0, 28.0, 31.0, 26.0, 22.0, 34.0, 40.0, 31.0, 38.0, 27.0, 42.0, 36.0, 38.0, 43.0, 51.0, 43.0, 41.0, 34.0, 31.0, 31.0, 24.0, 23.0, 26.0, 22.0, 12.0, 15.0, 19.0, 8.0, 8.0, 15.0, 6.0, 7.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5078125, -0.4907989501953125, -0.473785400390625, -0.4567718505859375, -0.43975830078125, -0.4227447509765625, -0.405731201171875, -0.3887176513671875, -0.3717041015625, -0.3546905517578125, -0.337677001953125, -0.3206634521484375, -0.30364990234375, -0.2866363525390625, -0.269622802734375, -0.2526092529296875, -0.235595703125, -0.2185821533203125, -0.201568603515625, -0.1845550537109375, -0.16754150390625, -0.1505279541015625, -0.133514404296875, -0.1165008544921875, -0.0994873046875, -0.0824737548828125, -0.065460205078125, -0.0484466552734375, -0.03143310546875, -0.0144195556640625, 0.002593994140625, 0.0196075439453125, 0.03662109375, 0.0536346435546875, 0.070648193359375, 0.0876617431640625, 0.10467529296875, 0.1216888427734375, 0.138702392578125, 0.1557159423828125, 0.1727294921875, 0.1897430419921875, 0.206756591796875, 0.2237701416015625, 0.24078369140625, 0.2577972412109375, 0.274810791015625, 0.2918243408203125, 0.308837890625, 0.3258514404296875, 0.342864990234375, 0.3598785400390625, 0.37689208984375, 0.3939056396484375, 0.410919189453125, 0.4279327392578125, 0.4449462890625, 0.4619598388671875, 0.478973388671875, 0.4959869384765625, 0.51300048828125, 0.5300140380859375, 0.547027587890625, 0.5640411376953125, 0.5810546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 12.0, 8.0, 16.0, 13.0, 43.0, 87.0, 150.0, 328.0, 759.0, 2249.0, 8951.0, 77434.0, 840400.0, 103267.0, 10794.0, 2486.0, 866.0, 347.0, 155.0, 71.0, 49.0, 25.0, 11.0, 8.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2744140625, -0.26598358154296875, -0.2575531005859375, -0.24912261962890625, -0.240692138671875, -0.23226165771484375, -0.2238311767578125, -0.21540069580078125, -0.20697021484375, -0.19853973388671875, -0.1901092529296875, -0.18167877197265625, -0.173248291015625, -0.16481781005859375, -0.1563873291015625, -0.14795684814453125, -0.1395263671875, -0.13109588623046875, -0.1226654052734375, -0.11423492431640625, -0.105804443359375, -0.09737396240234375, -0.0889434814453125, -0.08051300048828125, -0.07208251953125, -0.06365203857421875, -0.0552215576171875, -0.04679107666015625, -0.038360595703125, -0.02993011474609375, -0.0214996337890625, -0.01306915283203125, -0.004638671875, 0.00379180908203125, 0.0122222900390625, 0.02065277099609375, 0.029083251953125, 0.03751373291015625, 0.0459442138671875, 0.05437469482421875, 0.06280517578125, 0.07123565673828125, 0.0796661376953125, 0.08809661865234375, 0.096527099609375, 0.10495758056640625, 0.1133880615234375, 0.12181854248046875, 0.1302490234375, 0.13867950439453125, 0.1471099853515625, 0.15554046630859375, 0.163970947265625, 0.17240142822265625, 0.1808319091796875, 0.18926239013671875, 0.19769287109375, 0.20612335205078125, 0.2145538330078125, 0.22298431396484375, 0.231414794921875, 0.23984527587890625, 0.2482757568359375, 0.25670623779296875, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 7.0, 3.0, 8.0, 14.0, 10.0, 13.0, 30.0, 29.0, 51.0, 66.0, 92.0, 142.0, 156.0, 99.0, 81.0, 48.0, 43.0, 28.0, 24.0, 16.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5787390768527985e-05, -2.493150532245636e-05, -2.4075619876384735e-05, -2.321973443031311e-05, -2.2363848984241486e-05, -2.150796353816986e-05, -2.0652078092098236e-05, -1.979619264602661e-05, -1.8940307199954987e-05, -1.8084421753883362e-05, -1.7228536307811737e-05, -1.6372650861740112e-05, -1.5516765415668488e-05, -1.4660879969596863e-05, -1.3804994523525238e-05, -1.2949109077453613e-05, -1.2093223631381989e-05, -1.1237338185310364e-05, -1.0381452739238739e-05, -9.525567293167114e-06, -8.66968184709549e-06, -7.813796401023865e-06, -6.95791095495224e-06, -6.102025508880615e-06, -5.2461400628089905e-06, -4.390254616737366e-06, -3.534369170665741e-06, -2.678483724594116e-06, -1.8225982785224915e-06, -9.667128324508667e-07, -1.1082738637924194e-07, 7.450580596923828e-07, 1.6009435057640076e-06, 2.4568289518356323e-06, 3.312714397907257e-06, 4.168599843978882e-06, 5.024485290050507e-06, 5.880370736122131e-06, 6.736256182193756e-06, 7.592141628265381e-06, 8.448027074337006e-06, 9.30391252040863e-06, 1.0159797966480255e-05, 1.101568341255188e-05, 1.1871568858623505e-05, 1.272745430469513e-05, 1.3583339750766754e-05, 1.4439225196838379e-05, 1.5295110642910004e-05, 1.615099608898163e-05, 1.7006881535053253e-05, 1.7862766981124878e-05, 1.8718652427196503e-05, 1.9574537873268127e-05, 2.0430423319339752e-05, 2.1286308765411377e-05, 2.2142194211483002e-05, 2.2998079657554626e-05, 2.385396510362625e-05, 2.4709850549697876e-05, 2.55657359957695e-05, 2.6421621441841125e-05, 2.727750688791275e-05, 2.8133392333984375e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 22.0, 24.0, 43.0, 66.0, 146.0, 270.0, 770.0, 3167.0, 27198.0, 807551.0, 197419.0, 9367.0, 1567.0, 467.0, 202.0, 86.0, 63.0, 28.0, 24.0, 21.0, 10.0, 1.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35302734375, -0.3428802490234375, -0.332733154296875, -0.3225860595703125, -0.31243896484375, -0.3022918701171875, -0.292144775390625, -0.2819976806640625, -0.2718505859375, -0.2617034912109375, -0.251556396484375, -0.2414093017578125, -0.23126220703125, -0.2211151123046875, -0.210968017578125, -0.2008209228515625, -0.190673828125, -0.1805267333984375, -0.170379638671875, -0.1602325439453125, -0.15008544921875, -0.1399383544921875, -0.129791259765625, -0.1196441650390625, -0.1094970703125, -0.0993499755859375, -0.089202880859375, -0.0790557861328125, -0.06890869140625, -0.0587615966796875, -0.048614501953125, -0.0384674072265625, -0.0283203125, -0.0181732177734375, -0.008026123046875, 0.0021209716796875, 0.01226806640625, 0.0224151611328125, 0.032562255859375, 0.0427093505859375, 0.0528564453125, 0.0630035400390625, 0.073150634765625, 0.0832977294921875, 0.09344482421875, 0.1035919189453125, 0.113739013671875, 0.1238861083984375, 0.134033203125, 0.1441802978515625, 0.154327392578125, 0.1644744873046875, 0.17462158203125, 0.1847686767578125, 0.194915771484375, 0.2050628662109375, 0.2152099609375, 0.2253570556640625, 0.235504150390625, 0.2456512451171875, 0.25579833984375, 0.2659454345703125, 0.276092529296875, 0.2862396240234375, 0.29638671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 2.0, 10.0, 8.0, 19.0, 23.0, 29.0, 29.0, 41.0, 64.0, 89.0, 113.0, 132.0, 120.0, 97.0, 65.0, 49.0, 38.0, 15.0, 20.0, 12.0, 12.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0772705078125, -0.07463932037353516, -0.07200813293457031, -0.06937694549560547, -0.06674575805664062, -0.06411457061767578, -0.06148338317871094, -0.058852195739746094, -0.05622100830078125, -0.053589820861816406, -0.05095863342285156, -0.04832744598388672, -0.045696258544921875, -0.04306507110595703, -0.04043388366699219, -0.037802696228027344, -0.0351715087890625, -0.032540321350097656, -0.029909133911132812, -0.02727794647216797, -0.024646759033203125, -0.02201557159423828, -0.019384384155273438, -0.016753196716308594, -0.01412200927734375, -0.011490821838378906, -0.008859634399414062, -0.006228446960449219, -0.003597259521484375, -0.0009660720825195312, 0.0016651153564453125, 0.004296302795410156, 0.006927490234375, 0.009558677673339844, 0.012189865112304688, 0.014821052551269531, 0.017452239990234375, 0.02008342742919922, 0.022714614868164062, 0.025345802307128906, 0.02797698974609375, 0.030608177185058594, 0.03323936462402344, 0.03587055206298828, 0.038501739501953125, 0.04113292694091797, 0.04376411437988281, 0.046395301818847656, 0.0490264892578125, 0.051657676696777344, 0.05428886413574219, 0.05692005157470703, 0.059551239013671875, 0.06218242645263672, 0.06481361389160156, 0.0674448013305664, 0.07007598876953125, 0.0727071762084961, 0.07533836364746094, 0.07796955108642578, 0.08060073852539062, 0.08323192596435547, 0.08586311340332031, 0.08849430084228516, 0.09112548828125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 10.0, 11.0, 22.0, 45.0, 74.0, 142.0, 240.0, 196.0, 156.0, 53.0, 24.0, 14.0, 12.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.669635534286499, -1.611814022064209, -1.5539923906326294, -1.4961708784103394, -1.4383493661880493, -1.3805277347564697, -1.3227062225341797, -1.2648847103118896, -1.20706307888031, -1.14924156665802, -1.0914199352264404, -1.0335984230041504, -0.9757768511772156, -0.9179552793502808, -0.8601337671279907, -0.8023121953010559, -0.7444906830787659, -0.686669111251831, -0.628847599029541, -0.5710260272026062, -0.5132044553756714, -0.45538291335105896, -0.39756137132644653, -0.3397397994995117, -0.2819182574748993, -0.22409670054912567, -0.16627514362335205, -0.10845360159873962, -0.050632044672966, 0.007189512252807617, 0.06501105427742004, 0.12283262610435486, 0.18065416812896729, 0.2384757250547409, 0.2962972819805145, 0.35411882400512695, 0.41194039583206177, 0.4697619378566742, 0.5275834798812866, 0.5854050517082214, 0.6432266235351562, 0.7010481953620911, 0.7588697075843811, 0.8166912794113159, 0.8745128512382507, 0.9323344230651855, 0.9901559352874756, 1.0479774475097656, 1.1057989597320557, 1.1636204719543457, 1.2214421033859253, 1.2792636156082153, 1.3370851278305054, 1.394906759262085, 1.452728271484375, 1.510549783706665, 1.5683714151382446, 1.6261929273605347, 1.6840145587921143, 1.7418360710144043, 1.7996575832366943, 1.857479214668274, 1.915300726890564, 1.9731223583221436, 2.0309438705444336]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 12.0, 13.0, 23.0, 14.0, 40.0, 39.0, 38.0, 46.0, 44.0, 58.0, 50.0, 71.0, 49.0, 58.0, 54.0, 65.0, 55.0, 50.0, 47.0, 38.0, 37.0, 32.0, 18.0, 11.0, 10.0, 2.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9879714846611023, -0.9422454833984375, -0.8965195417404175, -0.8507936000823975, -0.8050675988197327, -0.7593415975570679, -0.7136156558990479, -0.6678897142410278, -0.622163712978363, -0.5764377117156982, -0.5307117700576782, -0.4849857985973358, -0.4392598271369934, -0.393533855676651, -0.3478078842163086, -0.3020819127559662, -0.2563559412956238, -0.21062996983528137, -0.16490399837493896, -0.11917802691459656, -0.07345205545425415, -0.027726083993911743, 0.017999887466430664, 0.06372585892677307, 0.10945183038711548, 0.15517780184745789, 0.2009037733078003, 0.2466297447681427, 0.2923557162284851, 0.3380816876888275, 0.3838076591491699, 0.42953363060951233, 0.47525954246520996, 0.52098548412323, 0.5667114853858948, 0.6124374866485596, 0.6581634283065796, 0.7038893699645996, 0.7496153712272644, 0.7953413724899292, 0.8410673141479492, 0.8867932558059692, 0.932519257068634, 0.9782452583312988, 1.0239711999893188, 1.0696971416473389, 1.1154232025146484, 1.1611491441726685, 1.2068750858306885, 1.2526010274887085, 1.2983269691467285, 1.344053030014038, 1.389778971672058, 1.4355049133300781, 1.4812309741973877, 1.5269569158554077, 1.5726828575134277, 1.6184087991714478, 1.6641347408294678, 1.7098608016967773, 1.7555867433547974, 1.8013126850128174, 1.847038745880127, 1.892764687538147, 1.938490629196167]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 16.0, 19.0, 20.0, 22.0, 30.0, 39.0, 56.0, 117.0, 207.0, 457.0, 1264.0, 4583.0, 27887.0, 948619.0, 3136535.0, 63728.0, 7523.0, 1851.0, 641.0, 258.0, 122.0, 77.0, 47.0, 35.0, 24.0, 23.0, 16.0, 8.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2080078125, -1.1726531982421875, -1.137298583984375, -1.1019439697265625, -1.06658935546875, -1.0312347412109375, -0.995880126953125, -0.9605255126953125, -0.9251708984375, -0.8898162841796875, -0.854461669921875, -0.8191070556640625, -0.78375244140625, -0.7483978271484375, -0.713043212890625, -0.6776885986328125, -0.642333984375, -0.6069793701171875, -0.571624755859375, -0.5362701416015625, -0.50091552734375, -0.4655609130859375, -0.430206298828125, -0.3948516845703125, -0.3594970703125, -0.3241424560546875, -0.288787841796875, -0.2534332275390625, -0.21807861328125, -0.1827239990234375, -0.147369384765625, -0.1120147705078125, -0.07666015625, -0.0413055419921875, -0.005950927734375, 0.0294036865234375, 0.06475830078125, 0.1001129150390625, 0.135467529296875, 0.1708221435546875, 0.2061767578125, 0.2415313720703125, 0.276885986328125, 0.3122406005859375, 0.34759521484375, 0.3829498291015625, 0.418304443359375, 0.4536590576171875, 0.489013671875, 0.5243682861328125, 0.559722900390625, 0.5950775146484375, 0.63043212890625, 0.6657867431640625, 0.701141357421875, 0.7364959716796875, 0.7718505859375, 0.8072052001953125, 0.842559814453125, 0.8779144287109375, 0.91326904296875, 0.9486236572265625, 0.983978271484375, 1.0193328857421875, 1.0546875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 20.0, 17.0, 27.0, 26.0, 33.0, 40.0, 53.0, 43.0, 38.0, 60.0, 59.0, 51.0, 64.0, 72.0, 67.0, 52.0, 44.0, 37.0, 38.0, 39.0, 28.0, 19.0, 10.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4145774841308594, -0.40068817138671875, -0.3867988586425781, -0.3729095458984375, -0.3590202331542969, -0.34513092041015625, -0.3312416076660156, -0.317352294921875, -0.3034629821777344, -0.28957366943359375, -0.2756843566894531, -0.2617950439453125, -0.24790573120117188, -0.23401641845703125, -0.22012710571289062, -0.20623779296875, -0.19234848022460938, -0.17845916748046875, -0.16456985473632812, -0.1506805419921875, -0.13679122924804688, -0.12290191650390625, -0.10901260375976562, -0.095123291015625, -0.08123397827148438, -0.06734466552734375, -0.053455352783203125, -0.0395660400390625, -0.025676727294921875, -0.01178741455078125, 0.002101898193359375, 0.0159912109375, 0.029880523681640625, 0.04376983642578125, 0.057659149169921875, 0.0715484619140625, 0.08543777465820312, 0.09932708740234375, 0.11321640014648438, 0.127105712890625, 0.14099502563476562, 0.15488433837890625, 0.16877365112304688, 0.1826629638671875, 0.19655227661132812, 0.21044158935546875, 0.22433090209960938, 0.23822021484375, 0.2521095275878906, 0.26599884033203125, 0.2798881530761719, 0.2937774658203125, 0.3076667785644531, 0.32155609130859375, 0.3354454040527344, 0.349334716796875, 0.3632240295410156, 0.37711334228515625, 0.3910026550292969, 0.4048919677734375, 0.4187812805175781, 0.43267059326171875, 0.4465599060058594, 0.46044921875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 12.0, 11.0, 16.0, 27.0, 44.0, 78.0, 111.0, 186.0, 365.0, 810.0, 2258.0, 7527.0, 41306.0, 857948.0, 3181389.0, 85328.0, 11896.0, 2933.0, 1009.0, 441.0, 230.0, 144.0, 69.0, 41.0, 17.0, 22.0, 9.0, 13.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.9078521728515625, -0.884063720703125, -0.8602752685546875, -0.83648681640625, -0.8126983642578125, -0.788909912109375, -0.7651214599609375, -0.7413330078125, -0.7175445556640625, -0.693756103515625, -0.6699676513671875, -0.64617919921875, -0.6223907470703125, -0.598602294921875, -0.5748138427734375, -0.551025390625, -0.5272369384765625, -0.503448486328125, -0.4796600341796875, -0.45587158203125, -0.4320831298828125, -0.408294677734375, -0.3845062255859375, -0.3607177734375, -0.3369293212890625, -0.313140869140625, -0.2893524169921875, -0.26556396484375, -0.2417755126953125, -0.217987060546875, -0.1941986083984375, -0.17041015625, -0.1466217041015625, -0.122833251953125, -0.0990447998046875, -0.07525634765625, -0.0514678955078125, -0.027679443359375, -0.0038909912109375, 0.0198974609375, 0.0436859130859375, 0.067474365234375, 0.0912628173828125, 0.11505126953125, 0.1388397216796875, 0.162628173828125, 0.1864166259765625, 0.210205078125, 0.2339935302734375, 0.257781982421875, 0.2815704345703125, 0.30535888671875, 0.3291473388671875, 0.352935791015625, 0.3767242431640625, 0.4005126953125, 0.4243011474609375, 0.448089599609375, 0.4718780517578125, 0.49566650390625, 0.5194549560546875, 0.543243408203125, 0.5670318603515625, 0.5908203125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 10.0, 9.0, 18.0, 15.0, 40.0, 50.0, 73.0, 129.0, 227.0, 436.0, 743.0, 861.0, 603.0, 329.0, 178.0, 111.0, 70.0, 53.0, 33.0, 21.0, 25.0, 5.0, 5.0, 8.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13054275512695312, -0.12412261962890625, -0.11770248413085938, -0.1112823486328125, -0.10486221313476562, -0.09844207763671875, -0.09202194213867188, -0.085601806640625, -0.07918167114257812, -0.07276153564453125, -0.06634140014648438, -0.0599212646484375, -0.053501129150390625, -0.04708099365234375, -0.040660858154296875, -0.03424072265625, -0.027820587158203125, -0.02140045166015625, -0.014980316162109375, -0.0085601806640625, -0.002140045166015625, 0.00428009033203125, 0.010700225830078125, 0.017120361328125, 0.023540496826171875, 0.02996063232421875, 0.036380767822265625, 0.0428009033203125, 0.049221038818359375, 0.05564117431640625, 0.062061309814453125, 0.0684814453125, 0.07490158081054688, 0.08132171630859375, 0.08774185180664062, 0.0941619873046875, 0.10058212280273438, 0.10700225830078125, 0.11342239379882812, 0.119842529296875, 0.12626266479492188, 0.13268280029296875, 0.13910293579101562, 0.1455230712890625, 0.15194320678710938, 0.15836334228515625, 0.16478347778320312, 0.17120361328125, 0.17762374877929688, 0.18404388427734375, 0.19046401977539062, 0.1968841552734375, 0.20330429077148438, 0.20972442626953125, 0.21614456176757812, 0.222564697265625, 0.22898483276367188, 0.23540496826171875, 0.24182510375976562, 0.2482452392578125, 0.2546653747558594, 0.26108551025390625, 0.2675056457519531, 0.27392578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 47.0, 61.0, 83.0, 98.0, 99.0, 98.0, 94.0, 113.0, 77.0, 39.0, 31.0, 25.0, 21.0, 13.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42179274559020996, -0.39984646439552307, -0.3779001832008362, -0.3559538722038269, -0.3340076208114624, -0.3120613098144531, -0.29011502861976624, -0.26816874742507935, -0.24622246623039246, -0.22427618503570557, -0.20232990384101868, -0.1803836077451706, -0.1584373265504837, -0.13649104535579681, -0.11454474925994873, -0.09259846806526184, -0.07065218687057495, -0.04870590195059776, -0.026759617030620575, -0.004813328385353088, 0.0171329528093338, 0.03907923400402069, 0.061025530099868774, 0.08297181129455566, 0.10491809248924255, 0.12686437368392944, 0.14881065487861633, 0.17075695097446442, 0.1927032321691513, 0.2146495133638382, 0.23659580945968628, 0.25854209065437317, 0.2804883122444153, 0.3024345934391022, 0.32438087463378906, 0.34632718563079834, 0.36827343702316284, 0.3902197480201721, 0.412166029214859, 0.4341123104095459, 0.4560585916042328, 0.4780048727989197, 0.49995115399360657, 0.5218974351882935, 0.5438437461853027, 0.5657899975776672, 0.5877363085746765, 0.609682559967041, 0.6316288709640503, 0.6535751819610596, 0.6755214333534241, 0.6974677443504333, 0.7194139957427979, 0.7413603067398071, 0.7633066177368164, 0.7852528691291809, 0.8071991205215454, 0.8291454315185547, 0.8510916829109192, 0.8730379939079285, 0.894984245300293, 0.9169305562973022, 0.9388768672943115, 0.960823118686676, 0.9827694296836853]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 2.0, 4.0, 8.0, 13.0, 19.0, 18.0, 18.0, 22.0, 26.0, 33.0, 32.0, 39.0, 40.0, 44.0, 48.0, 36.0, 49.0, 51.0, 55.0, 48.0, 40.0, 49.0, 49.0, 40.0, 28.0, 22.0, 36.0, 23.0, 18.0, 18.0, 14.0, 12.0, 7.0, 5.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3696340024471283, -0.3574292063713074, -0.34522441029548645, -0.3330196142196655, -0.3208147883415222, -0.3086099922657013, -0.29640519618988037, -0.28420040011405945, -0.2719956040382385, -0.2597908079624176, -0.24758599698543549, -0.23538120090961456, -0.22317638993263245, -0.21097159385681152, -0.1987667977809906, -0.18656200170516968, -0.17435717582702637, -0.16215237975120544, -0.14994756877422333, -0.1377427726984024, -0.1255379617214203, -0.11333316564559937, -0.10112836956977844, -0.08892356604337692, -0.0767187625169754, -0.06451395899057388, -0.05230915918946266, -0.04010435938835144, -0.02789955586194992, -0.0156947523355484, -0.003489956259727478, 0.008714847266674042, 0.02091968059539795, 0.03312448412179947, 0.04532928392291069, 0.05753408372402191, 0.06973888725042343, 0.08194369077682495, 0.09414848685264587, 0.1063532903790474, 0.11855809390544891, 0.13076288998126984, 0.14296770095825195, 0.15517249703407288, 0.1673772931098938, 0.17958210408687592, 0.19178690016269684, 0.20399171113967896, 0.21619650721549988, 0.2284013032913208, 0.24060611426830292, 0.25281089544296265, 0.26501572132110596, 0.2772205173969269, 0.2894253134727478, 0.3016301095485687, 0.31383490562438965, 0.32603970170021057, 0.3382444977760315, 0.3504493236541748, 0.3626541197299957, 0.37485891580581665, 0.3870637118816376, 0.3992685079574585, 0.4114733338356018]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 11.0, 20.0, 16.0, 33.0, 37.0, 44.0, 54.0, 108.0, 138.0, 260.0, 492.0, 1051.0, 2191.0, 5351.0, 14086.0, 40213.0, 119922.0, 306115.0, 336956.0, 144418.0, 48865.0, 16713.0, 6328.0, 2607.0, 1160.0, 523.0, 279.0, 195.0, 104.0, 59.0, 46.0, 37.0, 33.0, 24.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06671142578125, -0.06486272811889648, -0.06301403045654297, -0.06116533279418945, -0.05931663513183594, -0.05746793746948242, -0.055619239807128906, -0.05377054214477539, -0.051921844482421875, -0.05007314682006836, -0.048224449157714844, -0.04637575149536133, -0.04452705383300781, -0.0426783561706543, -0.04082965850830078, -0.038980960845947266, -0.03713226318359375, -0.035283565521240234, -0.03343486785888672, -0.0315861701965332, -0.029737472534179688, -0.027888774871826172, -0.026040077209472656, -0.02419137954711914, -0.022342681884765625, -0.02049398422241211, -0.018645286560058594, -0.016796588897705078, -0.014947891235351562, -0.013099193572998047, -0.011250495910644531, -0.009401798248291016, -0.0075531005859375, -0.005704402923583984, -0.0038557052612304688, -0.002007007598876953, -0.0001583099365234375, 0.0016903877258300781, 0.0035390853881835938, 0.005387783050537109, 0.007236480712890625, 0.00908517837524414, 0.010933876037597656, 0.012782573699951172, 0.014631271362304688, 0.016479969024658203, 0.01832866668701172, 0.020177364349365234, 0.02202606201171875, 0.023874759674072266, 0.02572345733642578, 0.027572154998779297, 0.029420852661132812, 0.03126955032348633, 0.033118247985839844, 0.03496694564819336, 0.036815643310546875, 0.03866434097290039, 0.040513038635253906, 0.04236173629760742, 0.04421043395996094, 0.04605913162231445, 0.04790782928466797, 0.049756526947021484, 0.051605224609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 2.0, 14.0, 8.0, 4.0, 14.0, 24.0, 28.0, 31.0, 35.0, 39.0, 52.0, 65.0, 52.0, 55.0, 79.0, 67.0, 59.0, 76.0, 65.0, 41.0, 31.0, 36.0, 33.0, 19.0, 20.0, 20.0, 3.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.252227783203125, -0.24127197265625, -0.230316162109375, -0.2193603515625, -0.208404541015625, -0.19744873046875, -0.186492919921875, -0.175537109375, -0.164581298828125, -0.15362548828125, -0.142669677734375, -0.1317138671875, -0.120758056640625, -0.10980224609375, -0.098846435546875, -0.087890625, -0.076934814453125, -0.06597900390625, -0.055023193359375, -0.0440673828125, -0.033111572265625, -0.02215576171875, -0.011199951171875, -0.000244140625, 0.010711669921875, 0.02166748046875, 0.032623291015625, 0.0435791015625, 0.054534912109375, 0.06549072265625, 0.076446533203125, 0.08740234375, 0.098358154296875, 0.10931396484375, 0.120269775390625, 0.1312255859375, 0.142181396484375, 0.15313720703125, 0.164093017578125, 0.175048828125, 0.186004638671875, 0.19696044921875, 0.207916259765625, 0.2188720703125, 0.229827880859375, 0.24078369140625, 0.251739501953125, 0.2626953125, 0.273651123046875, 0.28460693359375, 0.295562744140625, 0.3065185546875, 0.317474365234375, 0.32843017578125, 0.339385986328125, 0.350341796875, 0.361297607421875, 0.37225341796875, 0.383209228515625, 0.3941650390625, 0.405120849609375, 0.41607666015625, 0.427032470703125, 0.43798828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 13.0, 8.0, 17.0, 19.0, 35.0, 48.0, 85.0, 121.0, 224.0, 314.0, 607.0, 1193.0, 2585.0, 6025.0, 15687.0, 47961.0, 158344.0, 389619.0, 287210.0, 92509.0, 28246.0, 9734.0, 3991.0, 1788.0, 887.0, 509.0, 307.0, 190.0, 104.0, 56.0, 29.0, 32.0, 21.0, 14.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.07427978515625, -0.07236433029174805, -0.0704488754272461, -0.06853342056274414, -0.06661796569824219, -0.06470251083374023, -0.06278705596923828, -0.06087160110473633, -0.058956146240234375, -0.05704069137573242, -0.05512523651123047, -0.053209781646728516, -0.05129432678222656, -0.04937887191772461, -0.047463417053222656, -0.0455479621887207, -0.04363250732421875, -0.0417170524597168, -0.039801597595214844, -0.03788614273071289, -0.03597068786621094, -0.034055233001708984, -0.03213977813720703, -0.030224323272705078, -0.028308868408203125, -0.026393413543701172, -0.02447795867919922, -0.022562503814697266, -0.020647048950195312, -0.01873159408569336, -0.016816139221191406, -0.014900684356689453, -0.0129852294921875, -0.011069774627685547, -0.009154319763183594, -0.007238864898681641, -0.0053234100341796875, -0.0034079551696777344, -0.0014925003051757812, 0.0004229545593261719, 0.002338409423828125, 0.004253864288330078, 0.006169319152832031, 0.008084774017333984, 0.010000228881835938, 0.01191568374633789, 0.013831138610839844, 0.015746593475341797, 0.01766204833984375, 0.019577503204345703, 0.021492958068847656, 0.02340841293334961, 0.025323867797851562, 0.027239322662353516, 0.02915477752685547, 0.031070232391357422, 0.032985687255859375, 0.03490114212036133, 0.03681659698486328, 0.038732051849365234, 0.04064750671386719, 0.04256296157836914, 0.044478416442871094, 0.04639387130737305, 0.048309326171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 10.0, 9.0, 15.0, 11.0, 12.0, 18.0, 19.0, 25.0, 20.0, 35.0, 34.0, 32.0, 39.0, 36.0, 46.0, 39.0, 55.0, 41.0, 55.0, 41.0, 35.0, 49.0, 44.0, 34.0, 35.0, 32.0, 31.0, 21.0, 19.0, 12.0, 16.0, 12.0, 8.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.55615234375, -0.5408363342285156, -0.5255203247070312, -0.5102043151855469, -0.4948883056640625, -0.4795722961425781, -0.46425628662109375, -0.4489402770996094, -0.433624267578125, -0.4183082580566406, -0.40299224853515625, -0.3876762390136719, -0.3723602294921875, -0.3570442199707031, -0.34172821044921875, -0.3264122009277344, -0.31109619140625, -0.2957801818847656, -0.28046417236328125, -0.2651481628417969, -0.2498321533203125, -0.23451614379882812, -0.21920013427734375, -0.20388412475585938, -0.188568115234375, -0.17325210571289062, -0.15793609619140625, -0.14262008666992188, -0.1273040771484375, -0.11198806762695312, -0.09667205810546875, -0.08135604858398438, -0.0660400390625, -0.050724029541015625, -0.03540802001953125, -0.020092010498046875, -0.0047760009765625, 0.010540008544921875, 0.02585601806640625, 0.041172027587890625, 0.056488037109375, 0.07180404663085938, 0.08712005615234375, 0.10243606567382812, 0.1177520751953125, 0.13306808471679688, 0.14838409423828125, 0.16370010375976562, 0.17901611328125, 0.19433212280273438, 0.20964813232421875, 0.22496414184570312, 0.2402801513671875, 0.2555961608886719, 0.27091217041015625, 0.2862281799316406, 0.301544189453125, 0.3168601989746094, 0.33217620849609375, 0.3474922180175781, 0.3628082275390625, 0.3781242370605469, 0.39344024658203125, 0.4087562561035156, 0.424072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 11.0, 21.0, 15.0, 26.0, 38.0, 53.0, 67.0, 103.0, 157.0, 246.0, 432.0, 764.0, 1341.0, 2692.0, 5752.0, 14690.0, 48505.0, 209496.0, 517549.0, 179473.0, 42993.0, 13226.0, 5206.0, 2491.0, 1322.0, 703.0, 417.0, 244.0, 175.0, 96.0, 77.0, 22.0, 42.0, 19.0, 10.0, 15.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020233154296875, -0.019568681716918945, -0.01890420913696289, -0.018239736557006836, -0.01757526397705078, -0.016910791397094727, -0.016246318817138672, -0.015581846237182617, -0.014917373657226562, -0.014252901077270508, -0.013588428497314453, -0.012923955917358398, -0.012259483337402344, -0.011595010757446289, -0.010930538177490234, -0.01026606559753418, -0.009601593017578125, -0.00893712043762207, -0.008272647857666016, -0.007608175277709961, -0.006943702697753906, -0.0062792301177978516, -0.005614757537841797, -0.004950284957885742, -0.0042858123779296875, -0.003621339797973633, -0.002956867218017578, -0.0022923946380615234, -0.0016279220581054688, -0.0009634494781494141, -0.0002989768981933594, 0.0003654956817626953, 0.00102996826171875, 0.0016944408416748047, 0.0023589134216308594, 0.003023386001586914, 0.0036878585815429688, 0.0043523311614990234, 0.005016803741455078, 0.005681276321411133, 0.0063457489013671875, 0.007010221481323242, 0.007674694061279297, 0.008339166641235352, 0.009003639221191406, 0.009668111801147461, 0.010332584381103516, 0.01099705696105957, 0.011661529541015625, 0.01232600212097168, 0.012990474700927734, 0.013654947280883789, 0.014319419860839844, 0.014983892440795898, 0.015648365020751953, 0.016312837600708008, 0.016977310180664062, 0.017641782760620117, 0.018306255340576172, 0.018970727920532227, 0.01963520050048828, 0.020299673080444336, 0.02096414566040039, 0.021628618240356445, 0.0222930908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 7.0, 24.0, 24.0, 30.0, 47.0, 51.0, 54.0, 87.0, 71.0, 110.0, 104.0, 77.0, 88.0, 63.0, 39.0, 30.0, 32.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4901161193847656e-05, -1.4456920325756073e-05, -1.401267945766449e-05, -1.3568438589572906e-05, -1.3124197721481323e-05, -1.267995685338974e-05, -1.2235715985298157e-05, -1.1791475117206573e-05, -1.134723424911499e-05, -1.0902993381023407e-05, -1.0458752512931824e-05, -1.001451164484024e-05, -9.570270776748657e-06, -9.126029908657074e-06, -8.68178904056549e-06, -8.237548172473907e-06, -7.793307304382324e-06, -7.349066436290741e-06, -6.904825568199158e-06, -6.4605847001075745e-06, -6.016343832015991e-06, -5.572102963924408e-06, -5.127862095832825e-06, -4.6836212277412415e-06, -4.239380359649658e-06, -3.795139491558075e-06, -3.3508986234664917e-06, -2.9066577553749084e-06, -2.462416887283325e-06, -2.018176019191742e-06, -1.5739351511001587e-06, -1.1296942830085754e-06, -6.854534149169922e-07, -2.4121254682540894e-07, 2.0302832126617432e-07, 6.472691893577576e-07, 1.0915100574493408e-06, 1.535750925540924e-06, 1.9799917936325073e-06, 2.4242326617240906e-06, 2.868473529815674e-06, 3.312714397907257e-06, 3.7569552659988403e-06, 4.201196134090424e-06, 4.645437002182007e-06, 5.08967787027359e-06, 5.533918738365173e-06, 5.978159606456757e-06, 6.42240047454834e-06, 6.866641342639923e-06, 7.310882210731506e-06, 7.75512307882309e-06, 8.199363946914673e-06, 8.643604815006256e-06, 9.08784568309784e-06, 9.532086551189423e-06, 9.976327419281006e-06, 1.0420568287372589e-05, 1.0864809155464172e-05, 1.1309050023555756e-05, 1.1753290891647339e-05, 1.2197531759738922e-05, 1.2641772627830505e-05, 1.3086013495922089e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 13.0, 17.0, 28.0, 35.0, 59.0, 74.0, 113.0, 124.0, 215.0, 379.0, 704.0, 1193.0, 2470.0, 5791.0, 14656.0, 41681.0, 126174.0, 318484.0, 330538.0, 134083.0, 44462.0, 15665.0, 6068.0, 2500.0, 1239.0, 610.0, 376.0, 236.0, 154.0, 109.0, 87.0, 49.0, 36.0, 34.0, 25.0, 13.0, 10.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0158538818359375, -0.015342950820922852, -0.014832019805908203, -0.014321088790893555, -0.013810157775878906, -0.013299226760864258, -0.01278829574584961, -0.012277364730834961, -0.011766433715820312, -0.011255502700805664, -0.010744571685791016, -0.010233640670776367, -0.009722709655761719, -0.00921177864074707, -0.008700847625732422, -0.008189916610717773, -0.007678985595703125, -0.0071680545806884766, -0.006657123565673828, -0.00614619255065918, -0.005635261535644531, -0.005124330520629883, -0.004613399505615234, -0.004102468490600586, -0.0035915374755859375, -0.003080606460571289, -0.0025696754455566406, -0.002058744430541992, -0.0015478134155273438, -0.0010368824005126953, -0.0005259513854980469, -1.5020370483398438e-05, 0.00049591064453125, 0.0010068416595458984, 0.0015177726745605469, 0.0020287036895751953, 0.0025396347045898438, 0.003050565719604492, 0.0035614967346191406, 0.004072427749633789, 0.0045833587646484375, 0.005094289779663086, 0.005605220794677734, 0.006116151809692383, 0.006627082824707031, 0.00713801383972168, 0.007648944854736328, 0.008159875869750977, 0.008670806884765625, 0.009181737899780273, 0.009692668914794922, 0.01020359992980957, 0.010714530944824219, 0.011225461959838867, 0.011736392974853516, 0.012247323989868164, 0.012758255004882812, 0.013269186019897461, 0.01378011703491211, 0.014291048049926758, 0.014801979064941406, 0.015312910079956055, 0.015823841094970703, 0.01633477210998535, 0.016845703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 11.0, 11.0, 10.0, 12.0, 8.0, 19.0, 30.0, 25.0, 31.0, 29.0, 38.0, 62.0, 52.0, 49.0, 67.0, 57.0, 44.0, 52.0, 46.0, 50.0, 37.0, 32.0, 39.0, 31.0, 22.0, 27.0, 19.0, 16.0, 11.0, 9.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0048065185546875, -0.004659771919250488, -0.0045130252838134766, -0.004366278648376465, -0.004219532012939453, -0.004072785377502441, -0.00392603874206543, -0.003779292106628418, -0.0036325454711914062, -0.0034857988357543945, -0.003339052200317383, -0.003192305564880371, -0.0030455589294433594, -0.0028988122940063477, -0.002752065658569336, -0.0026053190231323242, -0.0024585723876953125, -0.0023118257522583008, -0.002165079116821289, -0.0020183324813842773, -0.0018715858459472656, -0.001724839210510254, -0.0015780925750732422, -0.0014313459396362305, -0.0012845993041992188, -0.001137852668762207, -0.0009911060333251953, -0.0008443593978881836, -0.0006976127624511719, -0.0005508661270141602, -0.00040411949157714844, -0.0002573728561401367, -0.000110626220703125, 3.612041473388672e-05, 0.00018286705017089844, 0.00032961368560791016, 0.0004763603210449219, 0.0006231069564819336, 0.0007698535919189453, 0.000916600227355957, 0.0010633468627929688, 0.0012100934982299805, 0.0013568401336669922, 0.001503586769104004, 0.0016503334045410156, 0.0017970800399780273, 0.001943826675415039, 0.0020905733108520508, 0.0022373199462890625, 0.0023840665817260742, 0.002530813217163086, 0.0026775598526000977, 0.0028243064880371094, 0.002971053123474121, 0.003117799758911133, 0.0032645463943481445, 0.0034112930297851562, 0.003558039665222168, 0.0037047863006591797, 0.0038515329360961914, 0.003998279571533203, 0.004145026206970215, 0.0042917728424072266, 0.004438519477844238, 0.00458526611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 17.0, 25.0, 52.0, 150.0, 210.0, 250.0, 166.0, 75.0, 28.0, 14.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1758981943130493, -1.1465601921081543, -1.1172221899032593, -1.0878841876983643, -1.0585461854934692, -1.0292081832885742, -0.9998701810836792, -0.9705321788787842, -0.9411941766738892, -0.9118561744689941, -0.8825181722640991, -0.8531801700592041, -0.8238421678543091, -0.7945041656494141, -0.765166163444519, -0.735828161239624, -0.706490159034729, -0.677152156829834, -0.647814154624939, -0.618476152420044, -0.5891381502151489, -0.5598001480102539, -0.5304621458053589, -0.5011241436004639, -0.47178614139556885, -0.44244813919067383, -0.4131101369857788, -0.3837721347808838, -0.35443413257598877, -0.32509613037109375, -0.29575812816619873, -0.2664201259613037, -0.23708206415176392, -0.2077440619468689, -0.17840605974197388, -0.14906805753707886, -0.11973005533218384, -0.09039205312728882, -0.0610540509223938, -0.03171604871749878, -0.0023780465126037598, 0.02695995569229126, 0.05629795789718628, 0.0856359601020813, 0.11497396230697632, 0.14431196451187134, 0.17364996671676636, 0.20298796892166138, 0.2323259711265564, 0.2616639733314514, 0.29100197553634644, 0.32033997774124146, 0.3496779799461365, 0.3790159821510315, 0.4083539843559265, 0.43769198656082153, 0.46702998876571655, 0.4963679909706116, 0.5257059931755066, 0.5550439953804016, 0.5843819975852966, 0.6137199997901917, 0.6430580019950867, 0.6723960041999817, 0.7017340064048767]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 9.0, 17.0, 19.0, 22.0, 25.0, 39.0, 38.0, 33.0, 59.0, 54.0, 62.0, 50.0, 60.0, 70.0, 61.0, 58.0, 52.0, 45.0, 36.0, 35.0, 31.0, 21.0, 23.0, 14.0, 7.0, 11.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2743450701236725, -0.26477813720703125, -0.2552111744880676, -0.2456442266702652, -0.23607727885246277, -0.22651033103466034, -0.2169433832168579, -0.20737643539905548, -0.19780948758125305, -0.18824253976345062, -0.1786755919456482, -0.16910864412784576, -0.15954169631004333, -0.1499747484922409, -0.14040780067443848, -0.13084085285663605, -0.12127390503883362, -0.11170695722103119, -0.10214000940322876, -0.09257306158542633, -0.0830061137676239, -0.07343916594982147, -0.06387221813201904, -0.054305270314216614, -0.044738322496414185, -0.035171374678611755, -0.025604426860809326, -0.016037479043006897, -0.006470531225204468, 0.0030964165925979614, 0.01266336441040039, 0.02223031222820282, 0.03179726004600525, 0.04136420786380768, 0.05093115568161011, 0.06049810349941254, 0.07006505131721497, 0.0796319991350174, 0.08919894695281982, 0.09876589477062225, 0.10833284258842468, 0.11789979040622711, 0.12746673822402954, 0.13703368604183197, 0.1466006338596344, 0.15616758167743683, 0.16573452949523926, 0.1753014773130417, 0.18486842513084412, 0.19443537294864655, 0.20400232076644897, 0.2135692685842514, 0.22313621640205383, 0.23270316421985626, 0.2422701120376587, 0.2518370747566223, 0.26140400767326355, 0.2709709405899048, 0.2805379033088684, 0.29010486602783203, 0.29967179894447327, 0.3092387318611145, 0.3188056945800781, 0.32837265729904175, 0.337939590215683]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 15.0, 11.0, 24.0, 38.0, 51.0, 81.0, 124.0, 193.0, 291.0, 556.0, 933.0, 1680.0, 3223.0, 6451.0, 13813.0, 32101.0, 91108.0, 333532.0, 387404.0, 109035.0, 37242.0, 15515.0, 7074.0, 3539.0, 1894.0, 1030.0, 597.0, 366.0, 230.0, 132.0, 88.0, 48.0, 36.0, 30.0, 19.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.290771484375, -0.2822380065917969, -0.27370452880859375, -0.2651710510253906, -0.2566375732421875, -0.24810409545898438, -0.23957061767578125, -0.23103713989257812, -0.222503662109375, -0.21397018432617188, -0.20543670654296875, -0.19690322875976562, -0.1883697509765625, -0.17983627319335938, -0.17130279541015625, -0.16276931762695312, -0.15423583984375, -0.14570236206054688, -0.13716888427734375, -0.12863540649414062, -0.1201019287109375, -0.11156845092773438, -0.10303497314453125, -0.09450149536132812, -0.085968017578125, -0.07743453979492188, -0.06890106201171875, -0.060367584228515625, -0.0518341064453125, -0.043300628662109375, -0.03476715087890625, -0.026233673095703125, -0.0177001953125, -0.009166717529296875, -0.00063323974609375, 0.007900238037109375, 0.0164337158203125, 0.024967193603515625, 0.03350067138671875, 0.042034149169921875, 0.050567626953125, 0.059101104736328125, 0.06763458251953125, 0.07616806030273438, 0.0847015380859375, 0.09323501586914062, 0.10176849365234375, 0.11030197143554688, 0.11883544921875, 0.12736892700195312, 0.13590240478515625, 0.14443588256835938, 0.1529693603515625, 0.16150283813476562, 0.17003631591796875, 0.17856979370117188, 0.187103271484375, 0.19563674926757812, 0.20417022705078125, 0.21270370483398438, 0.2212371826171875, 0.22977066040039062, 0.23830413818359375, 0.24683761596679688, 0.25537109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 14.0, 12.0, 15.0, 30.0, 30.0, 36.0, 47.0, 45.0, 59.0, 42.0, 45.0, 67.0, 59.0, 71.0, 52.0, 58.0, 50.0, 44.0, 43.0, 29.0, 28.0, 16.0, 13.0, 15.0, 13.0, 6.0, 8.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4587249755859375, -0.440399169921875, -0.4220733642578125, -0.40374755859375, -0.3854217529296875, -0.367095947265625, -0.3487701416015625, -0.3304443359375, -0.3121185302734375, -0.293792724609375, -0.2754669189453125, -0.25714111328125, -0.2388153076171875, -0.220489501953125, -0.2021636962890625, -0.183837890625, -0.1655120849609375, -0.147186279296875, -0.1288604736328125, -0.11053466796875, -0.0922088623046875, -0.073883056640625, -0.0555572509765625, -0.0372314453125, -0.0189056396484375, -0.000579833984375, 0.0177459716796875, 0.03607177734375, 0.0543975830078125, 0.072723388671875, 0.0910491943359375, 0.109375, 0.1277008056640625, 0.146026611328125, 0.1643524169921875, 0.18267822265625, 0.2010040283203125, 0.219329833984375, 0.2376556396484375, 0.2559814453125, 0.2743072509765625, 0.292633056640625, 0.3109588623046875, 0.32928466796875, 0.3476104736328125, 0.365936279296875, 0.3842620849609375, 0.402587890625, 0.4209136962890625, 0.439239501953125, 0.4575653076171875, 0.47589111328125, 0.4942169189453125, 0.512542724609375, 0.5308685302734375, 0.5491943359375, 0.5675201416015625, 0.585845947265625, 0.6041717529296875, 0.62249755859375, 0.6408233642578125, 0.659149169921875, 0.6774749755859375, 0.69580078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 5.0, 9.0, 7.0, 9.0, 19.0, 27.0, 36.0, 53.0, 76.0, 125.0, 252.0, 655.0, 2635.0, 14666.0, 194610.0, 781092.0, 46200.0, 5882.0, 1252.0, 425.0, 162.0, 101.0, 71.0, 32.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 7.0, 6.0, 7.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56201171875, -0.5421218872070312, -0.5222320556640625, -0.5023422241210938, -0.482452392578125, -0.46256256103515625, -0.4426727294921875, -0.42278289794921875, -0.40289306640625, -0.38300323486328125, -0.3631134033203125, -0.34322357177734375, -0.323333740234375, -0.30344390869140625, -0.2835540771484375, -0.26366424560546875, -0.2437744140625, -0.22388458251953125, -0.2039947509765625, -0.18410491943359375, -0.164215087890625, -0.14432525634765625, -0.1244354248046875, -0.10454559326171875, -0.08465576171875, -0.06476593017578125, -0.0448760986328125, -0.02498626708984375, -0.005096435546875, 0.01479339599609375, 0.0346832275390625, 0.05457305908203125, 0.074462890625, 0.09435272216796875, 0.1142425537109375, 0.13413238525390625, 0.154022216796875, 0.17391204833984375, 0.1938018798828125, 0.21369171142578125, 0.23358154296875, 0.25347137451171875, 0.2733612060546875, 0.29325103759765625, 0.313140869140625, 0.33303070068359375, 0.3529205322265625, 0.37281036376953125, 0.3927001953125, 0.41259002685546875, 0.4324798583984375, 0.45236968994140625, 0.472259521484375, 0.49214935302734375, 0.5120391845703125, 0.5319290161132812, 0.55181884765625, 0.5717086791992188, 0.5915985107421875, 0.6114883422851562, 0.631378173828125, 0.6512680053710938, 0.6711578369140625, 0.6910476684570312, 0.7109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 4.0, 10.0, 11.0, 13.0, 16.0, 7.0, 22.0, 35.0, 26.0, 28.0, 27.0, 36.0, 30.0, 42.0, 48.0, 57.0, 61.0, 52.0, 30.0, 39.0, 44.0, 48.0, 37.0, 28.0, 46.0, 36.0, 31.0, 28.0, 22.0, 9.0, 16.0, 13.0, 13.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49755859375, -0.480010986328125, -0.46246337890625, -0.444915771484375, -0.4273681640625, -0.409820556640625, -0.39227294921875, -0.374725341796875, -0.357177734375, -0.339630126953125, -0.32208251953125, -0.304534912109375, -0.2869873046875, -0.269439697265625, -0.25189208984375, -0.234344482421875, -0.216796875, -0.199249267578125, -0.18170166015625, -0.164154052734375, -0.1466064453125, -0.129058837890625, -0.11151123046875, -0.093963623046875, -0.076416015625, -0.058868408203125, -0.04132080078125, -0.023773193359375, -0.0062255859375, 0.011322021484375, 0.02886962890625, 0.046417236328125, 0.06396484375, 0.081512451171875, 0.09906005859375, 0.116607666015625, 0.1341552734375, 0.151702880859375, 0.16925048828125, 0.186798095703125, 0.204345703125, 0.221893310546875, 0.23944091796875, 0.256988525390625, 0.2745361328125, 0.292083740234375, 0.30963134765625, 0.327178955078125, 0.3447265625, 0.362274169921875, 0.37982177734375, 0.397369384765625, 0.4149169921875, 0.432464599609375, 0.45001220703125, 0.467559814453125, 0.485107421875, 0.502655029296875, 0.52020263671875, 0.537750244140625, 0.5552978515625, 0.572845458984375, 0.59039306640625, 0.607940673828125, 0.62548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 14.0, 30.0, 40.0, 67.0, 124.0, 227.0, 408.0, 841.0, 1775.0, 4500.0, 18337.0, 298281.0, 681067.0, 32402.0, 5999.0, 2313.0, 1038.0, 476.0, 255.0, 129.0, 81.0, 57.0, 28.0, 12.0, 16.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24354171752929688, -0.23488616943359375, -0.22623062133789062, -0.2175750732421875, -0.20891952514648438, -0.20026397705078125, -0.19160842895507812, -0.182952880859375, -0.17429733276367188, -0.16564178466796875, -0.15698623657226562, -0.1483306884765625, -0.13967514038085938, -0.13101959228515625, -0.12236404418945312, -0.11370849609375, -0.10505294799804688, -0.09639739990234375, -0.08774185180664062, -0.0790863037109375, -0.07043075561523438, -0.06177520751953125, -0.053119659423828125, -0.044464111328125, -0.035808563232421875, -0.02715301513671875, -0.018497467041015625, -0.0098419189453125, -0.001186370849609375, 0.00746917724609375, 0.016124725341796875, 0.0247802734375, 0.033435821533203125, 0.04209136962890625, 0.050746917724609375, 0.0594024658203125, 0.06805801391601562, 0.07671356201171875, 0.08536911010742188, 0.094024658203125, 0.10268020629882812, 0.11133575439453125, 0.11999130249023438, 0.1286468505859375, 0.13730239868164062, 0.14595794677734375, 0.15461349487304688, 0.16326904296875, 0.17192459106445312, 0.18058013916015625, 0.18923568725585938, 0.1978912353515625, 0.20654678344726562, 0.21520233154296875, 0.22385787963867188, 0.232513427734375, 0.24116897583007812, 0.24982452392578125, 0.2584800720214844, 0.2671356201171875, 0.2757911682128906, 0.28444671630859375, 0.2931022644042969, 0.3017578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 16.0, 22.0, 49.0, 70.0, 132.0, 196.0, 206.0, 140.0, 59.0, 34.0, 24.0, 22.0, 5.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.725290298461914e-05, -3.576651215553284e-05, -3.428012132644653e-05, -3.279373049736023e-05, -3.1307339668273926e-05, -2.9820948839187622e-05, -2.833455801010132e-05, -2.6848167181015015e-05, -2.536177635192871e-05, -2.3875385522842407e-05, -2.2388994693756104e-05, -2.09026038646698e-05, -1.9416213035583496e-05, -1.7929822206497192e-05, -1.644343137741089e-05, -1.4957040548324585e-05, -1.3470649719238281e-05, -1.1984258890151978e-05, -1.0497868061065674e-05, -9.01147723197937e-06, -7.525086402893066e-06, -6.038695573806763e-06, -4.552304744720459e-06, -3.0659139156341553e-06, -1.5795230865478516e-06, -9.313225746154785e-08, 1.3932585716247559e-06, 2.8796494007110596e-06, 4.366040229797363e-06, 5.852431058883667e-06, 7.338821887969971e-06, 8.825212717056274e-06, 1.0311603546142578e-05, 1.1797994375228882e-05, 1.3284385204315186e-05, 1.477077603340149e-05, 1.6257166862487793e-05, 1.7743557691574097e-05, 1.92299485206604e-05, 2.0716339349746704e-05, 2.2202730178833008e-05, 2.368912100791931e-05, 2.5175511837005615e-05, 2.666190266609192e-05, 2.8148293495178223e-05, 2.9634684324264526e-05, 3.112107515335083e-05, 3.2607465982437134e-05, 3.409385681152344e-05, 3.558024764060974e-05, 3.7066638469696045e-05, 3.855302929878235e-05, 4.003942012786865e-05, 4.1525810956954956e-05, 4.301220178604126e-05, 4.4498592615127563e-05, 4.598498344421387e-05, 4.747137427330017e-05, 4.8957765102386475e-05, 5.044415593147278e-05, 5.193054676055908e-05, 5.3416937589645386e-05, 5.490332841873169e-05, 5.638971924781799e-05, 5.78761100769043e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 20.0, 30.0, 41.0, 64.0, 167.0, 456.0, 1443.0, 5423.0, 50558.0, 927910.0, 54436.0, 5712.0, 1406.0, 460.0, 185.0, 81.0, 43.0, 30.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388427734375, -0.3764801025390625, -0.364532470703125, -0.3525848388671875, -0.34063720703125, -0.3286895751953125, -0.316741943359375, -0.3047943115234375, -0.2928466796875, -0.2808990478515625, -0.268951416015625, -0.2570037841796875, -0.24505615234375, -0.2331085205078125, -0.221160888671875, -0.2092132568359375, -0.197265625, -0.1853179931640625, -0.173370361328125, -0.1614227294921875, -0.14947509765625, -0.1375274658203125, -0.125579833984375, -0.1136322021484375, -0.1016845703125, -0.0897369384765625, -0.077789306640625, -0.0658416748046875, -0.05389404296875, -0.0419464111328125, -0.029998779296875, -0.0180511474609375, -0.006103515625, 0.0058441162109375, 0.017791748046875, 0.0297393798828125, 0.04168701171875, 0.0536346435546875, 0.065582275390625, 0.0775299072265625, 0.0894775390625, 0.1014251708984375, 0.113372802734375, 0.1253204345703125, 0.13726806640625, 0.1492156982421875, 0.161163330078125, 0.1731109619140625, 0.18505859375, 0.1970062255859375, 0.208953857421875, 0.2209014892578125, 0.23284912109375, 0.2447967529296875, 0.256744384765625, 0.2686920166015625, 0.2806396484375, 0.2925872802734375, 0.304534912109375, 0.3164825439453125, 0.32843017578125, 0.3403778076171875, 0.352325439453125, 0.3642730712890625, 0.376220703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 12.0, 6.0, 16.0, 24.0, 28.0, 45.0, 51.0, 104.0, 130.0, 161.0, 113.0, 107.0, 68.0, 30.0, 33.0, 16.0, 16.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0799560546875, -0.0770425796508789, -0.07412910461425781, -0.07121562957763672, -0.06830215454101562, -0.06538867950439453, -0.06247520446777344, -0.059561729431152344, -0.05664825439453125, -0.053734779357910156, -0.05082130432128906, -0.04790782928466797, -0.044994354248046875, -0.04208087921142578, -0.03916740417480469, -0.036253929138183594, -0.0333404541015625, -0.030426979064941406, -0.027513504028320312, -0.02460002899169922, -0.021686553955078125, -0.01877307891845703, -0.015859603881835938, -0.012946128845214844, -0.01003265380859375, -0.007119178771972656, -0.0042057037353515625, -0.0012922286987304688, 0.001621246337890625, 0.004534721374511719, 0.0074481964111328125, 0.010361671447753906, 0.013275146484375, 0.016188621520996094, 0.019102096557617188, 0.02201557159423828, 0.024929046630859375, 0.02784252166748047, 0.030755996704101562, 0.033669471740722656, 0.03658294677734375, 0.039496421813964844, 0.04240989685058594, 0.04532337188720703, 0.048236846923828125, 0.05115032196044922, 0.05406379699707031, 0.056977272033691406, 0.0598907470703125, 0.0628042221069336, 0.06571769714355469, 0.06863117218017578, 0.07154464721679688, 0.07445812225341797, 0.07737159729003906, 0.08028507232666016, 0.08319854736328125, 0.08611202239990234, 0.08902549743652344, 0.09193897247314453, 0.09485244750976562, 0.09776592254638672, 0.10067939758300781, 0.1035928726196289, 0.10650634765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 5.0, 19.0, 29.0, 46.0, 113.0, 148.0, 223.0, 180.0, 116.0, 56.0, 35.0, 18.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302221775054932, -0.48031696677207947, -0.43041178584098816, -0.38050657510757446, -0.33060139417648315, -0.28069618344306946, -0.23079097270965576, -0.18088579177856445, -0.13098058104515076, -0.08107538521289825, -0.031170181930065155, 0.018735021352767944, 0.06864021718502045, 0.11854541301727295, 0.16845062375068665, 0.21835580468177795, 0.26826101541519165, 0.31816622614860535, 0.36807140707969666, 0.41797661781311035, 0.46788179874420166, 0.517786979675293, 0.567692220211029, 0.6175974011421204, 0.6675026416778564, 0.7174078226089478, 0.7673130631446838, 0.8172182440757751, 0.8671234250068665, 0.9170286655426025, 0.9669338464736938, 1.0168390274047852, 1.0667442083358765, 1.1166493892669678, 1.166554570198059, 1.2164597511291504, 1.2663650512695312, 1.3162702322006226, 1.3661754131317139, 1.4160805940628052, 1.4659857749938965, 1.5158909559249878, 1.565796136856079, 1.61570143699646, 1.6656066179275513, 1.7155117988586426, 1.7654169797897339, 1.8153221607208252, 1.865227460861206, 1.9151326417922974, 1.9650378227233887, 2.0149431228637695, 2.0648481845855713, 2.114753484725952, 2.164658546447754, 2.2145638465881348, 2.2644689083099365, 2.3143742084503174, 2.364279270172119, 2.4141845703125, 2.4640896320343018, 2.5139949321746826, 2.5638999938964844, 2.6138052940368652, 2.663710594177246]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 5.0, 6.0, 11.0, 10.0, 14.0, 9.0, 9.0, 23.0, 18.0, 19.0, 21.0, 19.0, 20.0, 24.0, 24.0, 28.0, 23.0, 34.0, 28.0, 36.0, 35.0, 33.0, 43.0, 35.0, 34.0, 44.0, 34.0, 24.0, 32.0, 41.0, 29.0, 30.0, 21.0, 20.0, 22.0, 24.0, 14.0, 19.0, 9.0, 14.0, 10.0, 2.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0], "bins": [-0.7506343722343445, -0.7271214127540588, -0.7036084532737732, -0.6800954937934875, -0.6565825939178467, -0.633069634437561, -0.6095566749572754, -0.5860437154769897, -0.5625307559967041, -0.5390177965164185, -0.5155048370361328, -0.49199190735816956, -0.4684789478778839, -0.44496598839759827, -0.421453058719635, -0.39794009923934937, -0.3744271397590637, -0.3509141802787781, -0.32740122079849243, -0.3038882911205292, -0.28037533164024353, -0.2568623721599579, -0.23334942758083344, -0.20983648300170898, -0.18632352352142334, -0.1628105640411377, -0.13929761946201324, -0.1157846674323082, -0.09227171540260315, -0.0687587633728981, -0.045245811343193054, -0.021732866764068604, 0.001780092716217041, 0.02529304474592209, 0.048805996775627136, 0.07231894880533218, 0.09583190083503723, 0.11934485286474228, 0.14285780489444733, 0.16637074947357178, 0.18988370895385742, 0.21339666843414307, 0.23690961301326752, 0.26042255759239197, 0.2839355170726776, 0.30744847655296326, 0.3309614062309265, 0.35447436571121216, 0.3779873251914978, 0.40150028467178345, 0.4250132441520691, 0.44852617383003235, 0.472039133310318, 0.49555209279060364, 0.5190650224685669, 0.5425779819488525, 0.5660909414291382, 0.5896039009094238, 0.6131168603897095, 0.6366298198699951, 0.6601427793502808, 0.6836556792259216, 0.7071686387062073, 0.7306815981864929, 0.7541945576667786]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 10.0, 24.0, 46.0, 99.0, 217.0, 536.0, 1611.0, 7012.0, 98068.0, 3906889.0, 169328.0, 7977.0, 1532.0, 487.0, 174.0, 92.0, 53.0, 24.0, 19.0, 16.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.887542724609375, -0.84637451171875, -0.805206298828125, -0.7640380859375, -0.722869873046875, -0.68170166015625, -0.640533447265625, -0.599365234375, -0.558197021484375, -0.51702880859375, -0.475860595703125, -0.4346923828125, -0.393524169921875, -0.35235595703125, -0.311187744140625, -0.27001953125, -0.228851318359375, -0.18768310546875, -0.146514892578125, -0.1053466796875, -0.064178466796875, -0.02301025390625, 0.018157958984375, 0.059326171875, 0.100494384765625, 0.14166259765625, 0.182830810546875, 0.2239990234375, 0.265167236328125, 0.30633544921875, 0.347503662109375, 0.388671875, 0.429840087890625, 0.47100830078125, 0.512176513671875, 0.5533447265625, 0.594512939453125, 0.63568115234375, 0.676849365234375, 0.718017578125, 0.759185791015625, 0.80035400390625, 0.841522216796875, 0.8826904296875, 0.923858642578125, 0.96502685546875, 1.006195068359375, 1.04736328125, 1.088531494140625, 1.12969970703125, 1.170867919921875, 1.2120361328125, 1.253204345703125, 1.29437255859375, 1.335540771484375, 1.376708984375, 1.417877197265625, 1.45904541015625, 1.500213623046875, 1.5413818359375, 1.582550048828125, 1.62371826171875, 1.664886474609375, 1.7060546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 18.0, 16.0, 25.0, 44.0, 30.0, 61.0, 58.0, 76.0, 77.0, 83.0, 105.0, 81.0, 72.0, 65.0, 43.0, 40.0, 27.0, 16.0, 18.0, 12.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.3507843017578125, -0.333892822265625, -0.3170013427734375, -0.30010986328125, -0.2832183837890625, -0.266326904296875, -0.2494354248046875, -0.2325439453125, -0.2156524658203125, -0.198760986328125, -0.1818695068359375, -0.16497802734375, -0.1480865478515625, -0.131195068359375, -0.1143035888671875, -0.097412109375, -0.0805206298828125, -0.063629150390625, -0.0467376708984375, -0.02984619140625, -0.0129547119140625, 0.003936767578125, 0.0208282470703125, 0.0377197265625, 0.0546112060546875, 0.071502685546875, 0.0883941650390625, 0.10528564453125, 0.1221771240234375, 0.139068603515625, 0.1559600830078125, 0.1728515625, 0.1897430419921875, 0.206634521484375, 0.2235260009765625, 0.24041748046875, 0.2573089599609375, 0.274200439453125, 0.2910919189453125, 0.3079833984375, 0.3248748779296875, 0.341766357421875, 0.3586578369140625, 0.37554931640625, 0.3924407958984375, 0.409332275390625, 0.4262237548828125, 0.443115234375, 0.4600067138671875, 0.476898193359375, 0.4937896728515625, 0.51068115234375, 0.5275726318359375, 0.544464111328125, 0.5613555908203125, 0.5782470703125, 0.5951385498046875, 0.612030029296875, 0.6289215087890625, 0.64581298828125, 0.6627044677734375, 0.679595947265625, 0.6964874267578125, 0.71337890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 13.0, 20.0, 35.0, 43.0, 68.0, 150.0, 305.0, 745.0, 2057.0, 7603.0, 58638.0, 3135952.0, 949897.0, 30979.0, 4959.0, 1526.0, 655.0, 290.0, 134.0, 76.0, 45.0, 28.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7245025634765625, -0.697540283203125, -0.6705780029296875, -0.64361572265625, -0.6166534423828125, -0.589691162109375, -0.5627288818359375, -0.5357666015625, -0.5088043212890625, -0.481842041015625, -0.4548797607421875, -0.42791748046875, -0.4009552001953125, -0.373992919921875, -0.3470306396484375, -0.320068359375, -0.2931060791015625, -0.266143798828125, -0.2391815185546875, -0.21221923828125, -0.1852569580078125, -0.158294677734375, -0.1313323974609375, -0.1043701171875, -0.0774078369140625, -0.050445556640625, -0.0234832763671875, 0.00347900390625, 0.0304412841796875, 0.057403564453125, 0.0843658447265625, 0.111328125, 0.1382904052734375, 0.165252685546875, 0.1922149658203125, 0.21917724609375, 0.2461395263671875, 0.273101806640625, 0.3000640869140625, 0.3270263671875, 0.3539886474609375, 0.380950927734375, 0.4079132080078125, 0.43487548828125, 0.4618377685546875, 0.488800048828125, 0.5157623291015625, 0.542724609375, 0.5696868896484375, 0.596649169921875, 0.6236114501953125, 0.65057373046875, 0.6775360107421875, 0.704498291015625, 0.7314605712890625, 0.7584228515625, 0.7853851318359375, 0.812347412109375, 0.8393096923828125, 0.86627197265625, 0.8932342529296875, 0.920196533203125, 0.9471588134765625, 0.97412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 11.0, 15.0, 21.0, 33.0, 42.0, 67.0, 107.0, 174.0, 274.0, 458.0, 679.0, 791.0, 499.0, 334.0, 182.0, 107.0, 72.0, 60.0, 36.0, 30.0, 15.0, 7.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18670654296875, -0.181396484375, -0.17608642578125, -0.1707763671875, -0.16546630859375, -0.16015625, -0.15484619140625, -0.1495361328125, -0.14422607421875, -0.138916015625, -0.13360595703125, -0.1282958984375, -0.12298583984375, -0.11767578125, -0.11236572265625, -0.1070556640625, -0.10174560546875, -0.096435546875, -0.09112548828125, -0.0858154296875, -0.08050537109375, -0.0751953125, -0.06988525390625, -0.0645751953125, -0.05926513671875, -0.053955078125, -0.04864501953125, -0.0433349609375, -0.03802490234375, -0.03271484375, -0.02740478515625, -0.0220947265625, -0.01678466796875, -0.011474609375, -0.00616455078125, -0.0008544921875, 0.00445556640625, 0.009765625, 0.01507568359375, 0.0203857421875, 0.02569580078125, 0.031005859375, 0.03631591796875, 0.0416259765625, 0.04693603515625, 0.05224609375, 0.05755615234375, 0.0628662109375, 0.06817626953125, 0.073486328125, 0.07879638671875, 0.0841064453125, 0.08941650390625, 0.0947265625, 0.10003662109375, 0.1053466796875, 0.11065673828125, 0.115966796875, 0.12127685546875, 0.1265869140625, 0.13189697265625, 0.13720703125, 0.14251708984375, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 6.0, 4.0, 12.0, 15.0, 17.0, 17.0, 48.0, 94.0, 87.0, 120.0, 116.0, 123.0, 96.0, 88.0, 62.0, 38.0, 23.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6215534806251526, -0.5973003506660461, -0.5730472207069397, -0.548794150352478, -0.5245410203933716, -0.5002878904342651, -0.4760347604751587, -0.45178163051605225, -0.4275285303592682, -0.40327540040016174, -0.3790223002433777, -0.35476917028427124, -0.3305160403251648, -0.30626294016838074, -0.2820098102092743, -0.25775671005249023, -0.2335035800933838, -0.20925046503543854, -0.1849973499774933, -0.16074422001838684, -0.1364911049604416, -0.11223798990249634, -0.08798485994338989, -0.06373174488544464, -0.03947862982749939, -0.01522551104426384, 0.00902760773897171, 0.03328073024749756, 0.05753384530544281, 0.08178696036338806, 0.1060400903224945, 0.13029320538043976, 0.154546320438385, 0.17879943549633026, 0.2030525505542755, 0.22730568051338196, 0.251558780670166, 0.27581191062927246, 0.3000650405883789, 0.32431817054748535, 0.3485712707042694, 0.37282440066337585, 0.3970775008201599, 0.42133063077926636, 0.4455837607383728, 0.46983686089515686, 0.4940899908542633, 0.5183430910110474, 0.5425962209701538, 0.5668493509292603, 0.5911024808883667, 0.6153556108474731, 0.6396086812019348, 0.6638618111610413, 0.6881149411201477, 0.7123680710792542, 0.7366211414337158, 0.7608742713928223, 0.7851274013519287, 0.8093805313110352, 0.8336336016654968, 0.8578867316246033, 0.8821398615837097, 0.9063929915428162, 0.9306461215019226]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 5.0, 11.0, 15.0, 17.0, 12.0, 16.0, 17.0, 20.0, 32.0, 31.0, 35.0, 22.0, 32.0, 41.0, 28.0, 35.0, 44.0, 44.0, 41.0, 42.0, 32.0, 49.0, 39.0, 44.0, 34.0, 27.0, 28.0, 18.0, 28.0, 19.0, 19.0, 18.0, 13.0, 12.0, 11.0, 9.0, 11.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.3360586166381836, -0.3264901638031006, -0.3169217109680176, -0.30735328793525696, -0.29778483510017395, -0.28821638226509094, -0.27864792943000793, -0.2690794765949249, -0.2595110535621643, -0.2499426007270813, -0.24037416279315948, -0.23080570995807648, -0.22123727202415466, -0.21166881918907166, -0.20210036635398865, -0.19253191351890564, -0.18296346068382263, -0.17339500784873962, -0.1638265699148178, -0.1542581170797348, -0.144689679145813, -0.13512122631072998, -0.12555277347564697, -0.11598432809114456, -0.10641588270664215, -0.09684743732213974, -0.08727899193763733, -0.07771053910255432, -0.06814209371805191, -0.0585736483335495, -0.04900519922375679, -0.03943675011396408, -0.02986830472946167, -0.02029985748231411, -0.01073141023516655, -0.0011629629880189896, 0.00840548425912857, 0.01797392964363098, 0.02754237875342369, 0.0371108278632164, 0.04667927324771881, 0.05624771863222122, 0.06581616401672363, 0.07538461685180664, 0.08495306223630905, 0.09452150762081146, 0.10408996045589447, 0.11365840584039688, 0.12322685122489929, 0.1327953040599823, 0.1423637419939041, 0.15193219482898712, 0.16150063276290894, 0.17106908559799194, 0.18063753843307495, 0.19020599126815796, 0.19977442920207977, 0.20934288203716278, 0.2189113199710846, 0.2284797728061676, 0.2380482256412506, 0.24761666357517242, 0.25718510150909424, 0.26675355434417725, 0.27632200717926025]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 9.0, 13.0, 21.0, 34.0, 23.0, 42.0, 66.0, 110.0, 158.0, 291.0, 608.0, 1482.0, 3967.0, 12130.0, 41339.0, 160637.0, 441022.0, 281229.0, 74517.0, 20375.0, 6348.0, 2282.0, 859.0, 402.0, 210.0, 97.0, 68.0, 56.0, 30.0, 25.0, 20.0, 14.0, 18.0, 8.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0694580078125, -0.06703948974609375, -0.0646209716796875, -0.06220245361328125, -0.059783935546875, -0.05736541748046875, -0.0549468994140625, -0.05252838134765625, -0.05010986328125, -0.04769134521484375, -0.0452728271484375, -0.04285430908203125, -0.040435791015625, -0.03801727294921875, -0.0355987548828125, -0.03318023681640625, -0.03076171875, -0.02834320068359375, -0.0259246826171875, -0.02350616455078125, -0.021087646484375, -0.01866912841796875, -0.0162506103515625, -0.01383209228515625, -0.01141357421875, -0.00899505615234375, -0.0065765380859375, -0.00415802001953125, -0.001739501953125, 0.00067901611328125, 0.0030975341796875, 0.00551605224609375, 0.0079345703125, 0.01035308837890625, 0.0127716064453125, 0.01519012451171875, 0.017608642578125, 0.02002716064453125, 0.0224456787109375, 0.02486419677734375, 0.02728271484375, 0.02970123291015625, 0.0321197509765625, 0.03453826904296875, 0.036956787109375, 0.03937530517578125, 0.0417938232421875, 0.04421234130859375, 0.046630859375, 0.04904937744140625, 0.0514678955078125, 0.05388641357421875, 0.056304931640625, 0.05872344970703125, 0.0611419677734375, 0.06356048583984375, 0.06597900390625, 0.06839752197265625, 0.0708160400390625, 0.07323455810546875, 0.075653076171875, 0.07807159423828125, 0.0804901123046875, 0.08290863037109375, 0.0853271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 11.0, 14.0, 27.0, 33.0, 32.0, 42.0, 67.0, 58.0, 68.0, 85.0, 82.0, 90.0, 70.0, 60.0, 49.0, 51.0, 39.0, 32.0, 19.0, 24.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426513671875, -0.41339874267578125, -0.4002838134765625, -0.38716888427734375, -0.374053955078125, -0.36093902587890625, -0.3478240966796875, -0.33470916748046875, -0.32159423828125, -0.30847930908203125, -0.2953643798828125, -0.28224945068359375, -0.269134521484375, -0.25601959228515625, -0.2429046630859375, -0.22978973388671875, -0.2166748046875, -0.20355987548828125, -0.1904449462890625, -0.17733001708984375, -0.164215087890625, -0.15110015869140625, -0.1379852294921875, -0.12487030029296875, -0.11175537109375, -0.09864044189453125, -0.0855255126953125, -0.07241058349609375, -0.059295654296875, -0.04618072509765625, -0.0330657958984375, -0.01995086669921875, -0.0068359375, 0.00627899169921875, 0.0193939208984375, 0.03250885009765625, 0.045623779296875, 0.05873870849609375, 0.0718536376953125, 0.08496856689453125, 0.09808349609375, 0.11119842529296875, 0.1243133544921875, 0.13742828369140625, 0.150543212890625, 0.16365814208984375, 0.1767730712890625, 0.18988800048828125, 0.2030029296875, 0.21611785888671875, 0.2292327880859375, 0.24234771728515625, 0.255462646484375, 0.26857757568359375, 0.2816925048828125, 0.29480743408203125, 0.30792236328125, 0.32103729248046875, 0.3341522216796875, 0.34726715087890625, 0.360382080078125, 0.37349700927734375, 0.3866119384765625, 0.39972686767578125, 0.412841796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 29.0, 29.0, 41.0, 78.0, 107.0, 151.0, 247.0, 452.0, 826.0, 1691.0, 3410.0, 7459.0, 17551.0, 45987.0, 126785.0, 293994.0, 315727.0, 145012.0, 52643.0, 20143.0, 8303.0, 3757.0, 1831.0, 924.0, 510.0, 295.0, 163.0, 124.0, 70.0, 45.0, 35.0, 28.0, 14.0, 17.0, 13.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040252685546875, -0.03858041763305664, -0.03690814971923828, -0.03523588180541992, -0.03356361389160156, -0.0318913459777832, -0.030219078063964844, -0.028546810150146484, -0.026874542236328125, -0.025202274322509766, -0.023530006408691406, -0.021857738494873047, -0.020185470581054688, -0.018513202667236328, -0.01684093475341797, -0.01516866683959961, -0.01349639892578125, -0.01182413101196289, -0.010151863098144531, -0.008479595184326172, -0.0068073272705078125, -0.005135059356689453, -0.0034627914428710938, -0.0017905235290527344, -0.000118255615234375, 0.0015540122985839844, 0.0032262802124023438, 0.004898548126220703, 0.0065708160400390625, 0.008243083953857422, 0.009915351867675781, 0.01158761978149414, 0.0132598876953125, 0.01493215560913086, 0.01660442352294922, 0.018276691436767578, 0.019948959350585938, 0.021621227264404297, 0.023293495178222656, 0.024965763092041016, 0.026638031005859375, 0.028310298919677734, 0.029982566833496094, 0.03165483474731445, 0.03332710266113281, 0.03499937057495117, 0.03667163848876953, 0.03834390640258789, 0.04001617431640625, 0.04168844223022461, 0.04336071014404297, 0.04503297805786133, 0.04670524597167969, 0.04837751388549805, 0.050049781799316406, 0.051722049713134766, 0.053394317626953125, 0.055066585540771484, 0.056738853454589844, 0.0584111213684082, 0.06008338928222656, 0.06175565719604492, 0.06342792510986328, 0.06510019302368164, 0.0667724609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 11.0, 20.0, 18.0, 21.0, 9.0, 23.0, 20.0, 28.0, 23.0, 27.0, 22.0, 28.0, 28.0, 38.0, 36.0, 43.0, 42.0, 37.0, 36.0, 48.0, 39.0, 42.0, 30.0, 28.0, 42.0, 34.0, 23.0, 25.0, 30.0, 21.0, 14.0, 14.0, 19.0, 13.0, 6.0, 7.0, 5.0, 8.0, 4.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.453369140625, -0.4403266906738281, -0.42728424072265625, -0.4142417907714844, -0.4011993408203125, -0.3881568908691406, -0.37511444091796875, -0.3620719909667969, -0.349029541015625, -0.3359870910644531, -0.32294464111328125, -0.3099021911621094, -0.2968597412109375, -0.2838172912597656, -0.27077484130859375, -0.2577323913574219, -0.24468994140625, -0.23164749145507812, -0.21860504150390625, -0.20556259155273438, -0.1925201416015625, -0.17947769165039062, -0.16643524169921875, -0.15339279174804688, -0.140350341796875, -0.12730789184570312, -0.11426544189453125, -0.10122299194335938, -0.0881805419921875, -0.07513809204101562, -0.06209564208984375, -0.049053192138671875, -0.0360107421875, -0.022968292236328125, -0.00992584228515625, 0.003116607666015625, 0.0161590576171875, 0.029201507568359375, 0.04224395751953125, 0.055286407470703125, 0.068328857421875, 0.08137130737304688, 0.09441375732421875, 0.10745620727539062, 0.1204986572265625, 0.13354110717773438, 0.14658355712890625, 0.15962600708007812, 0.17266845703125, 0.18571090698242188, 0.19875335693359375, 0.21179580688476562, 0.2248382568359375, 0.23788070678710938, 0.25092315673828125, 0.2639656066894531, 0.277008056640625, 0.2900505065917969, 0.30309295654296875, 0.3161354064941406, 0.3291778564453125, 0.3422203063964844, 0.35526275634765625, 0.3683052062988281, 0.38134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 22.0, 15.0, 18.0, 33.0, 47.0, 111.0, 173.0, 287.0, 483.0, 858.0, 1803.0, 3996.0, 10684.0, 35453.0, 156670.0, 484103.0, 268392.0, 58833.0, 15783.0, 5573.0, 2418.0, 1203.0, 633.0, 343.0, 203.0, 131.0, 89.0, 46.0, 45.0, 27.0, 23.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02655029296875, -0.025826454162597656, -0.025102615356445312, -0.02437877655029297, -0.023654937744140625, -0.02293109893798828, -0.022207260131835938, -0.021483421325683594, -0.02075958251953125, -0.020035743713378906, -0.019311904907226562, -0.01858806610107422, -0.017864227294921875, -0.01714038848876953, -0.016416549682617188, -0.015692710876464844, -0.0149688720703125, -0.014245033264160156, -0.013521194458007812, -0.012797355651855469, -0.012073516845703125, -0.011349678039550781, -0.010625839233398438, -0.009902000427246094, -0.00917816162109375, -0.008454322814941406, -0.0077304840087890625, -0.007006645202636719, -0.006282806396484375, -0.005558967590332031, -0.0048351287841796875, -0.004111289978027344, -0.003387451171875, -0.0026636123657226562, -0.0019397735595703125, -0.0012159347534179688, -0.000492095947265625, 0.00023174285888671875, 0.0009555816650390625, 0.0016794204711914062, 0.00240325927734375, 0.0031270980834960938, 0.0038509368896484375, 0.004574775695800781, 0.005298614501953125, 0.006022453308105469, 0.0067462921142578125, 0.007470130920410156, 0.0081939697265625, 0.008917808532714844, 0.009641647338867188, 0.010365486145019531, 0.011089324951171875, 0.011813163757324219, 0.012537002563476562, 0.013260841369628906, 0.01398468017578125, 0.014708518981933594, 0.015432357788085938, 0.01615619659423828, 0.016880035400390625, 0.01760387420654297, 0.018327713012695312, 0.019051551818847656, 0.019775390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 19.0, 15.0, 28.0, 37.0, 48.0, 51.0, 86.0, 80.0, 104.0, 107.0, 81.0, 88.0, 62.0, 41.0, 45.0, 23.0, 22.0, 16.0, 3.0, 15.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4066696166992188e-05, -1.3568438589572906e-05, -1.3070181012153625e-05, -1.2571923434734344e-05, -1.2073665857315063e-05, -1.1575408279895782e-05, -1.1077150702476501e-05, -1.057889312505722e-05, -1.008063554763794e-05, -9.582377970218658e-06, -9.084120392799377e-06, -8.585862815380096e-06, -8.087605237960815e-06, -7.5893476605415344e-06, -7.091090083122253e-06, -6.592832505702972e-06, -6.094574928283691e-06, -5.59631735086441e-06, -5.098059773445129e-06, -4.599802196025848e-06, -4.101544618606567e-06, -3.6032870411872864e-06, -3.1050294637680054e-06, -2.6067718863487244e-06, -2.1085143089294434e-06, -1.6102567315101624e-06, -1.1119991540908813e-06, -6.137415766716003e-07, -1.1548399925231934e-07, 3.8277357816696167e-07, 8.810311555862427e-07, 1.3792887330055237e-06, 1.8775463104248047e-06, 2.3758038878440857e-06, 2.8740614652633667e-06, 3.3723190426826477e-06, 3.870576620101929e-06, 4.36883419752121e-06, 4.867091774940491e-06, 5.365349352359772e-06, 5.863606929779053e-06, 6.361864507198334e-06, 6.860122084617615e-06, 7.358379662036896e-06, 7.856637239456177e-06, 8.354894816875458e-06, 8.853152394294739e-06, 9.35140997171402e-06, 9.8496675491333e-06, 1.0347925126552582e-05, 1.0846182703971863e-05, 1.1344440281391144e-05, 1.1842697858810425e-05, 1.2340955436229706e-05, 1.2839213013648987e-05, 1.3337470591068268e-05, 1.3835728168487549e-05, 1.433398574590683e-05, 1.483224332332611e-05, 1.5330500900745392e-05, 1.5828758478164673e-05, 1.6327016055583954e-05, 1.6825273633003235e-05, 1.7323531210422516e-05, 1.7821788787841797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 20.0, 29.0, 45.0, 67.0, 132.0, 185.0, 345.0, 722.0, 1556.0, 4466.0, 15375.0, 69882.0, 326642.0, 463226.0, 128542.0, 26243.0, 6783.0, 2200.0, 896.0, 465.0, 237.0, 163.0, 86.0, 55.0, 42.0, 27.0, 17.0, 17.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02264404296875, -0.021868228912353516, -0.02109241485595703, -0.020316600799560547, -0.019540786743164062, -0.018764972686767578, -0.017989158630371094, -0.01721334457397461, -0.016437530517578125, -0.01566171646118164, -0.014885902404785156, -0.014110088348388672, -0.013334274291992188, -0.012558460235595703, -0.011782646179199219, -0.011006832122802734, -0.01023101806640625, -0.009455204010009766, -0.008679389953613281, -0.007903575897216797, -0.0071277618408203125, -0.006351947784423828, -0.005576133728027344, -0.004800319671630859, -0.004024505615234375, -0.0032486915588378906, -0.0024728775024414062, -0.0016970634460449219, -0.0009212493896484375, -0.00014543533325195312, 0.0006303787231445312, 0.0014061927795410156, 0.0021820068359375, 0.0029578208923339844, 0.0037336349487304688, 0.004509449005126953, 0.0052852630615234375, 0.006061077117919922, 0.006836891174316406, 0.007612705230712891, 0.008388519287109375, 0.00916433334350586, 0.009940147399902344, 0.010715961456298828, 0.011491775512695312, 0.012267589569091797, 0.013043403625488281, 0.013819217681884766, 0.01459503173828125, 0.015370845794677734, 0.01614665985107422, 0.016922473907470703, 0.017698287963867188, 0.018474102020263672, 0.019249916076660156, 0.02002573013305664, 0.020801544189453125, 0.02157735824584961, 0.022353172302246094, 0.023128986358642578, 0.023904800415039062, 0.024680614471435547, 0.02545642852783203, 0.026232242584228516, 0.027008056640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 6.0, 10.0, 17.0, 21.0, 22.0, 39.0, 55.0, 56.0, 70.0, 73.0, 94.0, 92.0, 79.0, 91.0, 76.0, 42.0, 54.0, 26.0, 19.0, 12.0, 15.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0092620849609375, -0.00902026891708374, -0.00877845287322998, -0.00853663682937622, -0.008294820785522461, -0.008053004741668701, -0.007811188697814941, -0.007569372653961182, -0.007327556610107422, -0.007085740566253662, -0.006843924522399902, -0.006602108478546143, -0.006360292434692383, -0.006118476390838623, -0.005876660346984863, -0.0056348443031311035, -0.005393028259277344, -0.005151212215423584, -0.004909396171569824, -0.0046675801277160645, -0.004425764083862305, -0.004183948040008545, -0.003942131996154785, -0.0037003159523010254, -0.0034584999084472656, -0.003216683864593506, -0.002974867820739746, -0.0027330517768859863, -0.0024912357330322266, -0.002249419689178467, -0.002007603645324707, -0.0017657876014709473, -0.0015239715576171875, -0.0012821555137634277, -0.001040339469909668, -0.0007985234260559082, -0.0005567073822021484, -0.00031489133834838867, -7.30752944946289e-05, 0.00016874074935913086, 0.0004105567932128906, 0.0006523728370666504, 0.0008941888809204102, 0.00113600492477417, 0.0013778209686279297, 0.0016196370124816895, 0.0018614530563354492, 0.002103269100189209, 0.0023450851440429688, 0.0025869011878967285, 0.0028287172317504883, 0.003070533275604248, 0.003312349319458008, 0.0035541653633117676, 0.0037959814071655273, 0.004037797451019287, 0.004279613494873047, 0.004521429538726807, 0.004763245582580566, 0.005005061626434326, 0.005246877670288086, 0.005488693714141846, 0.0057305097579956055, 0.005972325801849365, 0.006214141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 29.0, 40.0, 115.0, 229.0, 241.0, 200.0, 81.0, 33.0, 20.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7753782272338867, -0.7435557842254639, -0.7117332816123962, -0.6799108386039734, -0.6480883359909058, -0.6162658929824829, -0.5844434499740601, -0.5526210069656372, -0.5207985043525696, -0.48897603154182434, -0.4571535587310791, -0.42533111572265625, -0.393508642911911, -0.36168617010116577, -0.3298637270927429, -0.2980412542819977, -0.26621878147125244, -0.2343963086605072, -0.20257385075092316, -0.1707513928413391, -0.13892892003059387, -0.10710644721984863, -0.07528398931026459, -0.04346153140068054, -0.011639058589935303, 0.02018340677022934, 0.05200587213039398, 0.08382833749055862, 0.11565080285072327, 0.1474732756614685, 0.17929573357105255, 0.2111181914806366, 0.24294066429138184, 0.2747631371021271, 0.3065856099128723, 0.33840805292129517, 0.3702305257320404, 0.40205299854278564, 0.4338754415512085, 0.46569791436195374, 0.497520387172699, 0.5293428301811218, 0.5611653327941895, 0.5929877758026123, 0.6248102188110352, 0.6566327214241028, 0.6884551644325256, 0.7202776670455933, 0.7521001100540161, 0.783922553062439, 0.8157450556755066, 0.8475674986839294, 0.8793900012969971, 0.9112124443054199, 0.9430348873138428, 0.9748573303222656, 1.0066797733306885, 1.0385022163391113, 1.0703246593475342, 1.1021472215652466, 1.1339696645736694, 1.1657921075820923, 1.1976145505905151, 1.229436993598938, 1.2612595558166504]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 5.0, 5.0, 9.0, 8.0, 22.0, 15.0, 17.0, 21.0, 21.0, 25.0, 45.0, 24.0, 34.0, 33.0, 44.0, 40.0, 48.0, 44.0, 44.0, 46.0, 45.0, 45.0, 45.0, 51.0, 34.0, 25.0, 29.0, 22.0, 24.0, 24.0, 21.0, 13.0, 13.0, 6.0, 9.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.2497846633195877, -0.2425040602684021, -0.2352234423160553, -0.2279428392648697, -0.2206622213125229, -0.21338161826133728, -0.20610100030899048, -0.19882039725780487, -0.19153979420661926, -0.18425919115543365, -0.17697857320308685, -0.16969797015190125, -0.16241735219955444, -0.15513674914836884, -0.14785614609718323, -0.14057552814483643, -0.13329491019248962, -0.12601430714130402, -0.11873368918895721, -0.1114530861377716, -0.1041724681854248, -0.0968918651342392, -0.08961125463247299, -0.08233064413070679, -0.07505003362894058, -0.06776942312717438, -0.06048881262540817, -0.053208205848932266, -0.04592759534716606, -0.03864698484539986, -0.03136637806892395, -0.024085767567157745, -0.016805142164230347, -0.009524532593786716, -0.0022439230233430862, 0.005036685615777969, 0.012317296117544174, 0.01959790661931038, 0.026878513395786285, 0.03415912389755249, 0.041439734399318695, 0.0487203449010849, 0.056000955402851105, 0.06328156590461731, 0.07056216895580292, 0.07784278690814972, 0.08512338995933533, 0.09240400046110153, 0.09968461096286774, 0.10696522146463394, 0.11424583196640015, 0.12152643501758575, 0.12880705296993256, 0.13608765602111816, 0.14336827397346497, 0.15064887702465057, 0.15792948007583618, 0.1652100831270218, 0.1724907010793686, 0.1797713041305542, 0.187051922082901, 0.1943325251340866, 0.20161312818527222, 0.20889374613761902, 0.21617436408996582]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 13.0, 16.0, 16.0, 28.0, 39.0, 75.0, 92.0, 134.0, 242.0, 362.0, 577.0, 1018.0, 1968.0, 3805.0, 9002.0, 30185.0, 224484.0, 679510.0, 70076.0, 15213.0, 5574.0, 2665.0, 1366.0, 830.0, 449.0, 283.0, 163.0, 101.0, 72.0, 61.0, 29.0, 32.0, 22.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.363525390625, -0.35065460205078125, -0.3377838134765625, -0.32491302490234375, -0.312042236328125, -0.29917144775390625, -0.2863006591796875, -0.27342987060546875, -0.26055908203125, -0.24768829345703125, -0.2348175048828125, -0.22194671630859375, -0.209075927734375, -0.19620513916015625, -0.1833343505859375, -0.17046356201171875, -0.1575927734375, -0.14472198486328125, -0.1318511962890625, -0.11898040771484375, -0.106109619140625, -0.09323883056640625, -0.0803680419921875, -0.06749725341796875, -0.05462646484375, -0.04175567626953125, -0.0288848876953125, -0.01601409912109375, -0.003143310546875, 0.00972747802734375, 0.0225982666015625, 0.03546905517578125, 0.04833984375, 0.06121063232421875, 0.0740814208984375, 0.08695220947265625, 0.099822998046875, 0.11269378662109375, 0.1255645751953125, 0.13843536376953125, 0.15130615234375, 0.16417694091796875, 0.1770477294921875, 0.18991851806640625, 0.202789306640625, 0.21566009521484375, 0.2285308837890625, 0.24140167236328125, 0.2542724609375, 0.26714324951171875, 0.2800140380859375, 0.29288482666015625, 0.305755615234375, 0.31862640380859375, 0.3314971923828125, 0.34436798095703125, 0.35723876953125, 0.37010955810546875, 0.3829803466796875, 0.39585113525390625, 0.408721923828125, 0.42159271240234375, 0.4344635009765625, 0.44733428955078125, 0.460205078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 10.0, 12.0, 10.0, 19.0, 15.0, 17.0, 21.0, 34.0, 27.0, 36.0, 40.0, 51.0, 39.0, 42.0, 37.0, 43.0, 48.0, 57.0, 41.0, 40.0, 51.0, 39.0, 48.0, 27.0, 13.0, 31.0, 25.0, 22.0, 19.0, 12.0, 14.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.40883636474609375, -0.3943328857421875, -0.37982940673828125, -0.365325927734375, -0.35082244873046875, -0.3363189697265625, -0.32181549072265625, -0.30731201171875, -0.29280853271484375, -0.2783050537109375, -0.26380157470703125, -0.249298095703125, -0.23479461669921875, -0.2202911376953125, -0.20578765869140625, -0.1912841796875, -0.17678070068359375, -0.1622772216796875, -0.14777374267578125, -0.133270263671875, -0.11876678466796875, -0.1042633056640625, -0.08975982666015625, -0.07525634765625, -0.06075286865234375, -0.0462493896484375, -0.03174591064453125, -0.017242431640625, -0.00273895263671875, 0.0117645263671875, 0.02626800537109375, 0.040771484375, 0.05527496337890625, 0.0697784423828125, 0.08428192138671875, 0.098785400390625, 0.11328887939453125, 0.1277923583984375, 0.14229583740234375, 0.15679931640625, 0.17130279541015625, 0.1858062744140625, 0.20030975341796875, 0.214813232421875, 0.22931671142578125, 0.2438201904296875, 0.25832366943359375, 0.2728271484375, 0.28733062744140625, 0.3018341064453125, 0.31633758544921875, 0.330841064453125, 0.34534454345703125, 0.3598480224609375, 0.37435150146484375, 0.38885498046875, 0.40335845947265625, 0.4178619384765625, 0.43236541748046875, 0.446868896484375, 0.46137237548828125, 0.4758758544921875, 0.49037933349609375, 0.5048828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 10.0, 20.0, 30.0, 36.0, 78.0, 115.0, 277.0, 739.0, 2146.0, 9324.0, 193624.0, 818968.0, 18261.0, 3216.0, 963.0, 368.0, 144.0, 84.0, 51.0, 24.0, 16.0, 9.0, 5.0, 4.0, 7.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.635162353515625, -0.61260986328125, -0.590057373046875, -0.5675048828125, -0.544952392578125, -0.52239990234375, -0.499847412109375, -0.477294921875, -0.454742431640625, -0.43218994140625, -0.409637451171875, -0.3870849609375, -0.364532470703125, -0.34197998046875, -0.319427490234375, -0.296875, -0.274322509765625, -0.25177001953125, -0.229217529296875, -0.2066650390625, -0.184112548828125, -0.16156005859375, -0.139007568359375, -0.116455078125, -0.093902587890625, -0.07135009765625, -0.048797607421875, -0.0262451171875, -0.003692626953125, 0.01885986328125, 0.041412353515625, 0.06396484375, 0.086517333984375, 0.10906982421875, 0.131622314453125, 0.1541748046875, 0.176727294921875, 0.19927978515625, 0.221832275390625, 0.244384765625, 0.266937255859375, 0.28948974609375, 0.312042236328125, 0.3345947265625, 0.357147216796875, 0.37969970703125, 0.402252197265625, 0.4248046875, 0.447357177734375, 0.46990966796875, 0.492462158203125, 0.5150146484375, 0.537567138671875, 0.56011962890625, 0.582672119140625, 0.605224609375, 0.627777099609375, 0.65032958984375, 0.672882080078125, 0.6954345703125, 0.717987060546875, 0.74053955078125, 0.763092041015625, 0.78564453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 9.0, 9.0, 12.0, 9.0, 13.0, 25.0, 31.0, 21.0, 23.0, 28.0, 41.0, 40.0, 36.0, 41.0, 49.0, 51.0, 43.0, 51.0, 54.0, 50.0, 44.0, 43.0, 32.0, 30.0, 35.0, 37.0, 19.0, 20.0, 11.0, 15.0, 14.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5160980224609375, -0.498016357421875, -0.4799346923828125, -0.46185302734375, -0.4437713623046875, -0.425689697265625, -0.4076080322265625, -0.3895263671875, -0.3714447021484375, -0.353363037109375, -0.3352813720703125, -0.31719970703125, -0.2991180419921875, -0.281036376953125, -0.2629547119140625, -0.244873046875, -0.2267913818359375, -0.208709716796875, -0.1906280517578125, -0.17254638671875, -0.1544647216796875, -0.136383056640625, -0.1183013916015625, -0.1002197265625, -0.0821380615234375, -0.064056396484375, -0.0459747314453125, -0.02789306640625, -0.0098114013671875, 0.008270263671875, 0.0263519287109375, 0.04443359375, 0.0625152587890625, 0.080596923828125, 0.0986785888671875, 0.11676025390625, 0.1348419189453125, 0.152923583984375, 0.1710052490234375, 0.1890869140625, 0.2071685791015625, 0.225250244140625, 0.2433319091796875, 0.26141357421875, 0.2794952392578125, 0.297576904296875, 0.3156585693359375, 0.333740234375, 0.3518218994140625, 0.369903564453125, 0.3879852294921875, 0.40606689453125, 0.4241485595703125, 0.442230224609375, 0.4603118896484375, 0.4783935546875, 0.4964752197265625, 0.514556884765625, 0.5326385498046875, 0.55072021484375, 0.5688018798828125, 0.586883544921875, 0.6049652099609375, 0.623046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 11.0, 15.0, 39.0, 62.0, 178.0, 572.0, 2915.0, 51029.0, 971190.0, 20024.0, 1833.0, 388.0, 149.0, 58.0, 31.0, 15.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352294921875, -0.3384132385253906, -0.32453155517578125, -0.3106498718261719, -0.2967681884765625, -0.2828865051269531, -0.26900482177734375, -0.2551231384277344, -0.241241455078125, -0.22735977172851562, -0.21347808837890625, -0.19959640502929688, -0.1857147216796875, -0.17183303833007812, -0.15795135498046875, -0.14406967163085938, -0.13018798828125, -0.11630630493164062, -0.10242462158203125, -0.08854293823242188, -0.0746612548828125, -0.060779571533203125, -0.04689788818359375, -0.033016204833984375, -0.019134521484375, -0.005252838134765625, 0.00862884521484375, 0.022510528564453125, 0.0363922119140625, 0.050273895263671875, 0.06415557861328125, 0.07803726196289062, 0.0919189453125, 0.10580062866210938, 0.11968231201171875, 0.13356399536132812, 0.1474456787109375, 0.16132736206054688, 0.17520904541015625, 0.18909072875976562, 0.202972412109375, 0.21685409545898438, 0.23073577880859375, 0.24461746215820312, 0.2584991455078125, 0.2723808288574219, 0.28626251220703125, 0.3001441955566406, 0.31402587890625, 0.3279075622558594, 0.34178924560546875, 0.3556709289550781, 0.3695526123046875, 0.3834342956542969, 0.39731597900390625, 0.4111976623535156, 0.425079345703125, 0.4389610290527344, 0.45284271240234375, 0.4667243957519531, 0.4806060791015625, 0.4944877624511719, 0.5083694458007812, 0.5222511291503906, 0.5361328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 15.0, 9.0, 23.0, 20.0, 47.0, 57.0, 87.0, 154.0, 180.0, 142.0, 82.0, 59.0, 49.0, 17.0, 13.0, 12.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.810971975326538e-05, -3.711879253387451e-05, -3.612786531448364e-05, -3.5136938095092773e-05, -3.4146010875701904e-05, -3.3155083656311035e-05, -3.2164156436920166e-05, -3.11732292175293e-05, -3.0182301998138428e-05, -2.919137477874756e-05, -2.820044755935669e-05, -2.720952033996582e-05, -2.621859312057495e-05, -2.5227665901184082e-05, -2.4236738681793213e-05, -2.3245811462402344e-05, -2.2254884243011475e-05, -2.1263957023620605e-05, -2.0273029804229736e-05, -1.9282102584838867e-05, -1.8291175365447998e-05, -1.730024814605713e-05, -1.630932092666626e-05, -1.531839370727539e-05, -1.4327466487884521e-05, -1.3336539268493652e-05, -1.2345612049102783e-05, -1.1354684829711914e-05, -1.0363757610321045e-05, -9.372830390930176e-06, -8.381903171539307e-06, -7.3909759521484375e-06, -6.400048732757568e-06, -5.409121513366699e-06, -4.41819429397583e-06, -3.427267074584961e-06, -2.436339855194092e-06, -1.4454126358032227e-06, -4.544854164123535e-07, 5.364418029785156e-07, 1.5273690223693848e-06, 2.518296241760254e-06, 3.509223461151123e-06, 4.500150680541992e-06, 5.491077899932861e-06, 6.4820051193237305e-06, 7.4729323387146e-06, 8.463859558105469e-06, 9.454786777496338e-06, 1.0445713996887207e-05, 1.1436641216278076e-05, 1.2427568435668945e-05, 1.3418495655059814e-05, 1.4409422874450684e-05, 1.5400350093841553e-05, 1.6391277313232422e-05, 1.738220453262329e-05, 1.837313175201416e-05, 1.936405897140503e-05, 2.03549861907959e-05, 2.1345913410186768e-05, 2.2336840629577637e-05, 2.3327767848968506e-05, 2.4318695068359375e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 15.0, 14.0, 26.0, 43.0, 96.0, 205.0, 469.0, 1301.0, 4921.0, 61194.0, 943611.0, 31176.0, 3633.0, 1057.0, 402.0, 154.0, 81.0, 47.0, 25.0, 16.0, 10.0, 13.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.52001953125, -0.5071487426757812, -0.4942779541015625, -0.48140716552734375, -0.468536376953125, -0.45566558837890625, -0.4427947998046875, -0.42992401123046875, -0.41705322265625, -0.40418243408203125, -0.3913116455078125, -0.37844085693359375, -0.365570068359375, -0.35269927978515625, -0.3398284912109375, -0.32695770263671875, -0.3140869140625, -0.30121612548828125, -0.2883453369140625, -0.27547454833984375, -0.262603759765625, -0.24973297119140625, -0.2368621826171875, -0.22399139404296875, -0.21112060546875, -0.19824981689453125, -0.1853790283203125, -0.17250823974609375, -0.159637451171875, -0.14676666259765625, -0.1338958740234375, -0.12102508544921875, -0.108154296875, -0.09528350830078125, -0.0824127197265625, -0.06954193115234375, -0.056671142578125, -0.04380035400390625, -0.0309295654296875, -0.01805877685546875, -0.00518798828125, 0.00768280029296875, 0.0205535888671875, 0.03342437744140625, 0.046295166015625, 0.05916595458984375, 0.0720367431640625, 0.08490753173828125, 0.0977783203125, 0.11064910888671875, 0.1235198974609375, 0.13639068603515625, 0.149261474609375, 0.16213226318359375, 0.1750030517578125, 0.18787384033203125, 0.20074462890625, 0.21361541748046875, 0.2264862060546875, 0.23935699462890625, 0.252227783203125, 0.26509857177734375, 0.2779693603515625, 0.29084014892578125, 0.3037109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 16.0, 13.0, 27.0, 19.0, 38.0, 62.0, 100.0, 232.0, 201.0, 93.0, 49.0, 37.0, 27.0, 24.0, 12.0, 9.0, 5.0, 3.0, 8.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07695960998535156, -0.07359695434570312, -0.07023429870605469, -0.06687164306640625, -0.06350898742675781, -0.060146331787109375, -0.05678367614746094, -0.0534210205078125, -0.05005836486816406, -0.046695709228515625, -0.04333305358886719, -0.03997039794921875, -0.03660774230957031, -0.033245086669921875, -0.029882431030273438, -0.026519775390625, -0.023157119750976562, -0.019794464111328125, -0.016431808471679688, -0.01306915283203125, -0.009706497192382812, -0.006343841552734375, -0.0029811859130859375, 0.0003814697265625, 0.0037441253662109375, 0.007106781005859375, 0.010469436645507812, 0.01383209228515625, 0.017194747924804688, 0.020557403564453125, 0.023920059204101562, 0.02728271484375, 0.030645370483398438, 0.034008026123046875, 0.03737068176269531, 0.04073333740234375, 0.04409599304199219, 0.047458648681640625, 0.05082130432128906, 0.0541839599609375, 0.05754661560058594, 0.060909271240234375, 0.06427192687988281, 0.06763458251953125, 0.07099723815917969, 0.07435989379882812, 0.07772254943847656, 0.081085205078125, 0.08444786071777344, 0.08781051635742188, 0.09117317199707031, 0.09453582763671875, 0.09789848327636719, 0.10126113891601562, 0.10462379455566406, 0.1079864501953125, 0.11134910583496094, 0.11471176147460938, 0.11807441711425781, 0.12143707275390625, 0.12479972839355469, 0.12816238403320312, 0.13152503967285156, 0.1348876953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 11.0, 29.0, 51.0, 165.0, 292.0, 253.0, 121.0, 38.0, 25.0, 13.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.731217861175537, -1.661611795425415, -1.592005729675293, -1.522399663925171, -1.4527935981750488, -1.3831875324249268, -1.3135814666748047, -1.2439754009246826, -1.1743693351745605, -1.1047632694244385, -1.0351572036743164, -0.9655511379241943, -0.8959450721740723, -0.8263390064239502, -0.7567330002784729, -0.6871269345283508, -0.6175209283828735, -0.5479148626327515, -0.4783087968826294, -0.4087027609348297, -0.33909669518470764, -0.26949062943458557, -0.1998845934867859, -0.13027852773666382, -0.06067246198654175, 0.008933596312999725, 0.0785396546125412, 0.14814570546150208, 0.21775177121162415, 0.2873578369617462, 0.3569638729095459, 0.42656993865966797, 0.49617600440979004, 0.5657820701599121, 0.6353881359100342, 0.7049942016601562, 0.7746002674102783, 0.8442063331604004, 0.9138123393058777, 0.9834184050559998, 1.0530245304107666, 1.1226305961608887, 1.1922366619110107, 1.2618427276611328, 1.3314487934112549, 1.401054859161377, 1.470660924911499, 1.540266990661621, 1.6098729372024536, 1.6794790029525757, 1.7490850687026978, 1.8186911344528198, 1.888297200202942, 1.957903265953064, 2.0275092124938965, 2.0971152782440186, 2.1667213439941406, 2.2363274097442627, 2.3059334754943848, 2.375539541244507, 2.445145606994629, 2.514751672744751, 2.584357738494873, 2.653963804244995, 2.723569869995117]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 14.0, 16.0, 12.0, 18.0, 20.0, 17.0, 20.0, 34.0, 30.0, 32.0, 21.0, 50.0, 26.0, 22.0, 45.0, 44.0, 37.0, 40.0, 36.0, 38.0, 42.0, 37.0, 26.0, 35.0, 29.0, 30.0, 28.0, 15.0, 23.0, 22.0, 16.0, 13.0, 13.0, 12.0, 11.0, 7.0, 5.0, 4.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8226771354675293, -0.7981719374656677, -0.7736666798591614, -0.7491614818572998, -0.7246562242507935, -0.7001510262489319, -0.6756458282470703, -0.651140570640564, -0.6266353726387024, -0.6021301746368408, -0.5776249170303345, -0.5531197190284729, -0.5286145210266113, -0.504109263420105, -0.4796040654182434, -0.45509883761405945, -0.4305936098098755, -0.40608838200569153, -0.38158315420150757, -0.357077956199646, -0.33257272839546204, -0.3080675005912781, -0.2835623025894165, -0.25905707478523254, -0.23455184698104858, -0.21004661917686462, -0.18554140627384186, -0.1610361933708191, -0.13653096556663513, -0.11202574521303177, -0.0875205248594284, -0.06301531195640564, -0.038510143756866455, -0.014004923403263092, 0.010500296950340271, 0.035005517303943634, 0.059510737657547, 0.08401595801115036, 0.10852117836475372, 0.1330263912677765, 0.15753161907196045, 0.1820368468761444, 0.20654205977916718, 0.23104727268218994, 0.2555525004863739, 0.28005772829055786, 0.30456292629241943, 0.3290681540966034, 0.35357338190078735, 0.3780786097049713, 0.4025838375091553, 0.42708903551101685, 0.4515942633152008, 0.47609949111938477, 0.5006046891212463, 0.5251098871231079, 0.5496151447296143, 0.5741203427314758, 0.5986256003379822, 0.6231307983398438, 0.6476360559463501, 0.6721412539482117, 0.6966464519500732, 0.7211517095565796, 0.7456569075584412]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 18.0, 20.0, 53.0, 74.0, 177.0, 309.0, 835.0, 2211.0, 8258.0, 65724.0, 3036684.0, 1043191.0, 29026.0, 5113.0, 1485.0, 569.0, 227.0, 117.0, 59.0, 37.0, 17.0, 10.0, 13.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8955078125, -0.8664779663085938, -0.8374481201171875, -0.8084182739257812, -0.779388427734375, -0.7503585815429688, -0.7213287353515625, -0.6922988891601562, -0.66326904296875, -0.6342391967773438, -0.6052093505859375, -0.5761795043945312, -0.547149658203125, -0.5181198120117188, -0.4890899658203125, -0.46006011962890625, -0.4310302734375, -0.40200042724609375, -0.3729705810546875, -0.34394073486328125, -0.314910888671875, -0.28588104248046875, -0.2568511962890625, -0.22782135009765625, -0.19879150390625, -0.16976165771484375, -0.1407318115234375, -0.11170196533203125, -0.082672119140625, -0.05364227294921875, -0.0246124267578125, 0.00441741943359375, 0.033447265625, 0.06247711181640625, 0.0915069580078125, 0.12053680419921875, 0.149566650390625, 0.17859649658203125, 0.2076263427734375, 0.23665618896484375, 0.26568603515625, 0.29471588134765625, 0.3237457275390625, 0.35277557373046875, 0.381805419921875, 0.41083526611328125, 0.4398651123046875, 0.46889495849609375, 0.4979248046875, 0.5269546508789062, 0.5559844970703125, 0.5850143432617188, 0.614044189453125, 0.6430740356445312, 0.6721038818359375, 0.7011337280273438, 0.73016357421875, 0.7591934204101562, 0.7882232666015625, 0.8172531127929688, 0.846282958984375, 0.8753128051757812, 0.9043426513671875, 0.9333724975585938, 0.96240234375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 13.0, 20.0, 25.0, 23.0, 29.0, 30.0, 35.0, 30.0, 38.0, 41.0, 59.0, 53.0, 46.0, 45.0, 53.0, 43.0, 54.0, 41.0, 38.0, 41.0, 36.0, 29.0, 26.0, 25.0, 12.0, 15.0, 12.0, 7.0, 6.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.2570304870605469, -0.24819183349609375, -0.23935317993164062, -0.2305145263671875, -0.22167587280273438, -0.21283721923828125, -0.20399856567382812, -0.195159912109375, -0.18632125854492188, -0.17748260498046875, -0.16864395141601562, -0.1598052978515625, -0.15096664428710938, -0.14212799072265625, -0.13328933715820312, -0.12445068359375, -0.11561203002929688, -0.10677337646484375, -0.09793472290039062, -0.0890960693359375, -0.08025741577148438, -0.07141876220703125, -0.06258010864257812, -0.053741455078125, -0.044902801513671875, -0.03606414794921875, -0.027225494384765625, -0.0183868408203125, -0.009548187255859375, -0.00070953369140625, 0.008129119873046875, 0.0169677734375, 0.025806427001953125, 0.03464508056640625, 0.043483734130859375, 0.0523223876953125, 0.061161041259765625, 0.06999969482421875, 0.07883834838867188, 0.087677001953125, 0.09651565551757812, 0.10535430908203125, 0.11419296264648438, 0.1230316162109375, 0.13187026977539062, 0.14070892333984375, 0.14954757690429688, 0.15838623046875, 0.16722488403320312, 0.17606353759765625, 0.18490219116210938, 0.1937408447265625, 0.20257949829101562, 0.21141815185546875, 0.22025680541992188, 0.229095458984375, 0.23793411254882812, 0.24677276611328125, 0.2556114196777344, 0.2644500732421875, 0.2732887268066406, 0.28212738037109375, 0.2909660339355469, 0.2998046875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 7.0, 6.0, 15.0, 15.0, 22.0, 34.0, 46.0, 51.0, 89.0, 125.0, 271.0, 390.0, 857.0, 2170.0, 6318.0, 28099.0, 278861.0, 3612183.0, 229796.0, 25331.0, 5907.0, 1929.0, 755.0, 423.0, 200.0, 120.0, 78.0, 47.0, 39.0, 19.0, 16.0, 18.0, 7.0, 7.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.71728515625, -0.6981430053710938, -0.6790008544921875, -0.6598587036132812, -0.640716552734375, -0.6215744018554688, -0.6024322509765625, -0.5832901000976562, -0.56414794921875, -0.5450057983398438, -0.5258636474609375, -0.5067214965820312, -0.487579345703125, -0.46843719482421875, -0.4492950439453125, -0.43015289306640625, -0.4110107421875, -0.39186859130859375, -0.3727264404296875, -0.35358428955078125, -0.334442138671875, -0.31529998779296875, -0.2961578369140625, -0.27701568603515625, -0.25787353515625, -0.23873138427734375, -0.2195892333984375, -0.20044708251953125, -0.181304931640625, -0.16216278076171875, -0.1430206298828125, -0.12387847900390625, -0.104736328125, -0.08559417724609375, -0.0664520263671875, -0.04730987548828125, -0.028167724609375, -0.00902557373046875, 0.0101165771484375, 0.02925872802734375, 0.04840087890625, 0.06754302978515625, 0.0866851806640625, 0.10582733154296875, 0.124969482421875, 0.14411163330078125, 0.1632537841796875, 0.18239593505859375, 0.2015380859375, 0.22068023681640625, 0.2398223876953125, 0.25896453857421875, 0.278106689453125, 0.29724884033203125, 0.3163909912109375, 0.33553314208984375, 0.35467529296875, 0.37381744384765625, 0.3929595947265625, 0.41210174560546875, 0.431243896484375, 0.45038604736328125, 0.4695281982421875, 0.48867034912109375, 0.5078125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 14.0, 21.0, 35.0, 53.0, 73.0, 103.0, 207.0, 395.0, 661.0, 879.0, 663.0, 364.0, 203.0, 139.0, 67.0, 50.0, 31.0, 30.0, 13.0, 17.0, 6.0, 5.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.1727313995361328, -0.16724014282226562, -0.16174888610839844, -0.15625762939453125, -0.15076637268066406, -0.14527511596679688, -0.1397838592529297, -0.1342926025390625, -0.1288013458251953, -0.12331008911132812, -0.11781883239746094, -0.11232757568359375, -0.10683631896972656, -0.10134506225585938, -0.09585380554199219, -0.090362548828125, -0.08487129211425781, -0.07938003540039062, -0.07388877868652344, -0.06839752197265625, -0.06290626525878906, -0.057415008544921875, -0.05192375183105469, -0.0464324951171875, -0.04094123840332031, -0.035449981689453125, -0.029958724975585938, -0.02446746826171875, -0.018976211547851562, -0.013484954833984375, -0.007993698120117188, -0.00250244140625, 0.0029888153076171875, 0.008480072021484375, 0.013971328735351562, 0.01946258544921875, 0.024953842163085938, 0.030445098876953125, 0.03593635559082031, 0.0414276123046875, 0.04691886901855469, 0.052410125732421875, 0.05790138244628906, 0.06339263916015625, 0.06888389587402344, 0.07437515258789062, 0.07986640930175781, 0.085357666015625, 0.09084892272949219, 0.09634017944335938, 0.10183143615722656, 0.10732269287109375, 0.11281394958496094, 0.11830520629882812, 0.12379646301269531, 0.1292877197265625, 0.1347789764404297, 0.14027023315429688, 0.14576148986816406, 0.15125274658203125, 0.15674400329589844, 0.16223526000976562, 0.1677265167236328, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 10.0, 11.0, 15.0, 16.0, 25.0, 37.0, 53.0, 81.0, 98.0, 99.0, 145.0, 105.0, 120.0, 57.0, 43.0, 32.0, 20.0, 14.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5308326482772827, -0.5080342292785645, -0.4852357804775238, -0.46243736147880554, -0.4396389126777649, -0.41684049367904663, -0.39404207468032837, -0.3712436556816101, -0.34844520688056946, -0.3256467878818512, -0.30284833908081055, -0.2800499200820923, -0.257251501083374, -0.23445305228233337, -0.2116546332836151, -0.18885619938373566, -0.1660577654838562, -0.14325933158397675, -0.12046090513467789, -0.09766247868537903, -0.07486404478549957, -0.05206561088562012, -0.029267191886901855, -0.0064687579870224, 0.016329675912857056, 0.03912810608744621, 0.06192653626203537, 0.08472496271133423, 0.10752339661121368, 0.13032183051109314, 0.1531202495098114, 0.17591868340969086, 0.1987171173095703, 0.22151555120944977, 0.24431398510932922, 0.2671124041080475, 0.28991085290908813, 0.3127092719078064, 0.33550769090652466, 0.3583061099052429, 0.38110455870628357, 0.40390297770500183, 0.4267014265060425, 0.44949984550476074, 0.472298264503479, 0.49509671330451965, 0.5178951025009155, 0.5406935811042786, 0.5634920001029968, 0.5862904191017151, 0.6090888381004333, 0.6318873167037964, 0.6546857357025146, 0.6774841547012329, 0.7002825736999512, 0.7230809926986694, 0.7458794116973877, 0.768677830696106, 0.7914762496948242, 0.8142746686935425, 0.8370731472969055, 0.8598715662956238, 0.882669985294342, 0.9054684042930603, 0.9282668828964233]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 12.0, 12.0, 13.0, 26.0, 23.0, 24.0, 33.0, 30.0, 46.0, 32.0, 38.0, 30.0, 30.0, 37.0, 37.0, 39.0, 46.0, 48.0, 41.0, 36.0, 42.0, 42.0, 34.0, 25.0, 26.0, 33.0, 23.0, 23.0, 20.0, 19.0, 10.0, 13.0, 10.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31847622990608215, -0.30862683057785034, -0.29877740144729614, -0.28892800211906433, -0.2790786027908325, -0.2692291736602783, -0.2593797743320465, -0.2495303601026535, -0.2396809458732605, -0.2298315316438675, -0.2199821174144745, -0.21013271808624268, -0.20028330385684967, -0.19043388962745667, -0.18058449029922485, -0.17073507606983185, -0.16088566184043884, -0.15103624761104584, -0.14118683338165283, -0.13133743405342102, -0.12148801982402802, -0.11163860559463501, -0.1017891988158226, -0.09193979203701019, -0.08209037780761719, -0.07224096357822418, -0.062391556799411774, -0.05254214629530907, -0.04269273579120636, -0.03284332528710365, -0.022993914783000946, -0.013144508004188538, -0.00329512357711792, 0.006554286926984787, 0.016403697431087494, 0.0262531079351902, 0.03610251843929291, 0.045951928943395615, 0.05580133944749832, 0.06565074622631073, 0.07550016045570374, 0.08534957468509674, 0.09519898146390915, 0.10504838824272156, 0.11489780247211456, 0.12474721670150757, 0.13459661602973938, 0.14444603025913239, 0.1542954444885254, 0.1641448587179184, 0.1739942729473114, 0.1838436722755432, 0.19369308650493622, 0.20354250073432922, 0.21339190006256104, 0.22324131429195404, 0.23309072852134705, 0.24294014275074005, 0.25278955698013306, 0.26263895630836487, 0.2724883556365967, 0.2823377847671509, 0.2921871840953827, 0.3020365834236145, 0.3118860125541687]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 0.0, 3.0, 10.0, 14.0, 31.0, 46.0, 138.0, 345.0, 923.0, 2830.0, 10380.0, 119000.0, 827631.0, 74976.0, 8535.0, 2364.0, 786.0, 275.0, 132.0, 51.0, 27.0, 17.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16079139709472656, -0.15446853637695312, -0.1481456756591797, -0.14182281494140625, -0.1354999542236328, -0.12917709350585938, -0.12285423278808594, -0.1165313720703125, -0.11020851135253906, -0.10388565063476562, -0.09756278991699219, -0.09123992919921875, -0.08491706848144531, -0.07859420776367188, -0.07227134704589844, -0.065948486328125, -0.05962562561035156, -0.053302764892578125, -0.04697990417480469, -0.04065704345703125, -0.03433418273925781, -0.028011322021484375, -0.021688461303710938, -0.0153656005859375, -0.009042739868164062, -0.002719879150390625, 0.0036029815673828125, 0.00992584228515625, 0.016248703002929688, 0.022571563720703125, 0.028894424438476562, 0.03521728515625, 0.04154014587402344, 0.047863006591796875, 0.05418586730957031, 0.06050872802734375, 0.06683158874511719, 0.07315444946289062, 0.07947731018066406, 0.0858001708984375, 0.09212303161621094, 0.09844589233398438, 0.10476875305175781, 0.11109161376953125, 0.11741447448730469, 0.12373733520507812, 0.13006019592285156, 0.136383056640625, 0.14270591735839844, 0.14902877807617188, 0.1553516387939453, 0.16167449951171875, 0.1679973602294922, 0.17432022094726562, 0.18064308166503906, 0.1869659423828125, 0.19328880310058594, 0.19961166381835938, 0.2059345245361328, 0.21225738525390625, 0.2185802459716797, 0.22490310668945312, 0.23122596740722656, 0.237548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 2.0, 7.0, 14.0, 15.0, 17.0, 23.0, 28.0, 39.0, 38.0, 35.0, 42.0, 54.0, 28.0, 49.0, 53.0, 43.0, 59.0, 52.0, 57.0, 48.0, 38.0, 36.0, 43.0, 23.0, 31.0, 21.0, 28.0, 20.0, 11.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2832679748535156, -0.27527618408203125, -0.2672843933105469, -0.2592926025390625, -0.2513008117675781, -0.24330902099609375, -0.23531723022460938, -0.227325439453125, -0.21933364868164062, -0.21134185791015625, -0.20335006713867188, -0.1953582763671875, -0.18736648559570312, -0.17937469482421875, -0.17138290405273438, -0.16339111328125, -0.15539932250976562, -0.14740753173828125, -0.13941574096679688, -0.1314239501953125, -0.12343215942382812, -0.11544036865234375, -0.10744857788085938, -0.099456787109375, -0.09146499633789062, -0.08347320556640625, -0.07548141479492188, -0.0674896240234375, -0.059497833251953125, -0.05150604248046875, -0.043514251708984375, -0.0355224609375, -0.027530670166015625, -0.01953887939453125, -0.011547088623046875, -0.0035552978515625, 0.004436492919921875, 0.01242828369140625, 0.020420074462890625, 0.028411865234375, 0.036403656005859375, 0.04439544677734375, 0.052387237548828125, 0.0603790283203125, 0.06837081909179688, 0.07636260986328125, 0.08435440063476562, 0.09234619140625, 0.10033798217773438, 0.10832977294921875, 0.11632156372070312, 0.1243133544921875, 0.13230514526367188, 0.14029693603515625, 0.14828872680664062, 0.156280517578125, 0.16427230834960938, 0.17226409912109375, 0.18025588989257812, 0.1882476806640625, 0.19623947143554688, 0.20423126220703125, 0.21222305297851562, 0.22021484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 12.0, 10.0, 16.0, 26.0, 43.0, 72.0, 133.0, 225.0, 441.0, 862.0, 1917.0, 4857.0, 15250.0, 74528.0, 496114.0, 380762.0, 53749.0, 12138.0, 3971.0, 1680.0, 762.0, 397.0, 218.0, 134.0, 93.0, 52.0, 26.0, 20.0, 15.0, 11.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10253620147705078, -0.09942054748535156, -0.09630489349365234, -0.09318923950195312, -0.0900735855102539, -0.08695793151855469, -0.08384227752685547, -0.08072662353515625, -0.07761096954345703, -0.07449531555175781, -0.0713796615600586, -0.06826400756835938, -0.06514835357666016, -0.06203269958496094, -0.05891704559326172, -0.0558013916015625, -0.05268573760986328, -0.04957008361816406, -0.046454429626464844, -0.043338775634765625, -0.040223121643066406, -0.03710746765136719, -0.03399181365966797, -0.03087615966796875, -0.02776050567626953, -0.024644851684570312, -0.021529197692871094, -0.018413543701171875, -0.015297889709472656, -0.012182235717773438, -0.009066581726074219, -0.005950927734375, -0.0028352737426757812, 0.0002803802490234375, 0.0033960342407226562, 0.006511688232421875, 0.009627342224121094, 0.012742996215820312, 0.01585865020751953, 0.01897430419921875, 0.02208995819091797, 0.025205612182617188, 0.028321266174316406, 0.031436920166015625, 0.034552574157714844, 0.03766822814941406, 0.04078388214111328, 0.0438995361328125, 0.04701519012451172, 0.05013084411621094, 0.053246498107910156, 0.056362152099609375, 0.059477806091308594, 0.06259346008300781, 0.06570911407470703, 0.06882476806640625, 0.07194042205810547, 0.07505607604980469, 0.0781717300415039, 0.08128738403320312, 0.08440303802490234, 0.08751869201660156, 0.09063434600830078, 0.09375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 12.0, 10.0, 15.0, 18.0, 29.0, 32.0, 28.0, 38.0, 42.0, 42.0, 32.0, 60.0, 53.0, 58.0, 71.0, 58.0, 42.0, 49.0, 40.0, 34.0, 30.0, 27.0, 24.0, 28.0, 19.0, 25.0, 15.0, 13.0, 4.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453125, -0.4381866455078125, -0.423248291015625, -0.4083099365234375, -0.39337158203125, -0.3784332275390625, -0.363494873046875, -0.3485565185546875, -0.3336181640625, -0.3186798095703125, -0.303741455078125, -0.2888031005859375, -0.27386474609375, -0.2589263916015625, -0.243988037109375, -0.2290496826171875, -0.214111328125, -0.1991729736328125, -0.184234619140625, -0.1692962646484375, -0.15435791015625, -0.1394195556640625, -0.124481201171875, -0.1095428466796875, -0.0946044921875, -0.0796661376953125, -0.064727783203125, -0.0497894287109375, -0.03485107421875, -0.0199127197265625, -0.004974365234375, 0.0099639892578125, 0.02490234375, 0.0398406982421875, 0.054779052734375, 0.0697174072265625, 0.08465576171875, 0.0995941162109375, 0.114532470703125, 0.1294708251953125, 0.1444091796875, 0.1593475341796875, 0.174285888671875, 0.1892242431640625, 0.20416259765625, 0.2191009521484375, 0.234039306640625, 0.2489776611328125, 0.263916015625, 0.2788543701171875, 0.293792724609375, 0.3087310791015625, 0.32366943359375, 0.3386077880859375, 0.353546142578125, 0.3684844970703125, 0.3834228515625, 0.3983612060546875, 0.413299560546875, 0.4282379150390625, 0.44317626953125, 0.4581146240234375, 0.473052978515625, 0.4879913330078125, 0.5029296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 14.0, 15.0, 24.0, 35.0, 48.0, 78.0, 105.0, 172.0, 252.0, 410.0, 748.0, 1427.0, 2772.0, 6212.0, 16022.0, 53096.0, 221021.0, 488824.0, 185438.0, 45874.0, 14584.0, 5701.0, 2522.0, 1355.0, 693.0, 416.0, 250.0, 128.0, 93.0, 66.0, 37.0, 30.0, 28.0, 18.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.022613525390625, -0.021956920623779297, -0.021300315856933594, -0.02064371109008789, -0.019987106323242188, -0.019330501556396484, -0.01867389678955078, -0.018017292022705078, -0.017360687255859375, -0.016704082489013672, -0.01604747772216797, -0.015390872955322266, -0.014734268188476562, -0.01407766342163086, -0.013421058654785156, -0.012764453887939453, -0.01210784912109375, -0.011451244354248047, -0.010794639587402344, -0.01013803482055664, -0.009481430053710938, -0.008824825286865234, -0.008168220520019531, -0.007511615753173828, -0.006855010986328125, -0.006198406219482422, -0.005541801452636719, -0.004885196685791016, -0.0042285919189453125, -0.0035719871520996094, -0.0029153823852539062, -0.002258777618408203, -0.0016021728515625, -0.0009455680847167969, -0.00028896331787109375, 0.0003676414489746094, 0.0010242462158203125, 0.0016808509826660156, 0.0023374557495117188, 0.002994060516357422, 0.003650665283203125, 0.004307270050048828, 0.004963874816894531, 0.005620479583740234, 0.0062770843505859375, 0.006933689117431641, 0.007590293884277344, 0.008246898651123047, 0.00890350341796875, 0.009560108184814453, 0.010216712951660156, 0.01087331771850586, 0.011529922485351562, 0.012186527252197266, 0.012843132019042969, 0.013499736785888672, 0.014156341552734375, 0.014812946319580078, 0.015469551086425781, 0.016126155853271484, 0.016782760620117188, 0.01743936538696289, 0.018095970153808594, 0.018752574920654297, 0.0194091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 12.0, 14.0, 11.0, 23.0, 26.0, 27.0, 29.0, 37.0, 43.0, 64.0, 55.0, 60.0, 78.0, 67.0, 81.0, 57.0, 56.0, 45.0, 46.0, 23.0, 28.0, 23.0, 14.0, 9.0, 15.0, 4.0, 12.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0462477803230286e-05, -1.0136514902114868e-05, -9.81055200099945e-06, -9.484589099884033e-06, -9.158626198768616e-06, -8.832663297653198e-06, -8.50670039653778e-06, -8.180737495422363e-06, -7.854774594306946e-06, -7.528811693191528e-06, -7.202848792076111e-06, -6.876885890960693e-06, -6.550922989845276e-06, -6.224960088729858e-06, -5.898997187614441e-06, -5.5730342864990234e-06, -5.247071385383606e-06, -4.9211084842681885e-06, -4.595145583152771e-06, -4.2691826820373535e-06, -3.943219780921936e-06, -3.6172568798065186e-06, -3.291293978691101e-06, -2.9653310775756836e-06, -2.639368176460266e-06, -2.3134052753448486e-06, -1.987442374229431e-06, -1.6614794731140137e-06, -1.3355165719985962e-06, -1.0095536708831787e-06, -6.835907697677612e-07, -3.5762786865234375e-07, -3.166496753692627e-08, 2.942979335784912e-07, 6.202608346939087e-07, 9.462237358093262e-07, 1.2721866369247437e-06, 1.5981495380401611e-06, 1.9241124391555786e-06, 2.250075340270996e-06, 2.5760382413864136e-06, 2.902001142501831e-06, 3.2279640436172485e-06, 3.553926944732666e-06, 3.8798898458480835e-06, 4.205852746963501e-06, 4.5318156480789185e-06, 4.857778549194336e-06, 5.183741450309753e-06, 5.509704351425171e-06, 5.835667252540588e-06, 6.161630153656006e-06, 6.487593054771423e-06, 6.813555955886841e-06, 7.139518857002258e-06, 7.465481758117676e-06, 7.791444659233093e-06, 8.11740756034851e-06, 8.443370461463928e-06, 8.769333362579346e-06, 9.095296263694763e-06, 9.42125916481018e-06, 9.747222065925598e-06, 1.0073184967041016e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 11.0, 13.0, 12.0, 27.0, 32.0, 57.0, 83.0, 126.0, 208.0, 355.0, 588.0, 1178.0, 2445.0, 6165.0, 17354.0, 59239.0, 222912.0, 442147.0, 211720.0, 56557.0, 16501.0, 5819.0, 2368.0, 1145.0, 576.0, 313.0, 219.0, 131.0, 78.0, 59.0, 24.0, 22.0, 13.0, 14.0, 5.0, 4.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.016899585723876953, -0.016236305236816406, -0.01557302474975586, -0.014909744262695312, -0.014246463775634766, -0.013583183288574219, -0.012919902801513672, -0.012256622314453125, -0.011593341827392578, -0.010930061340332031, -0.010266780853271484, -0.009603500366210938, -0.00894021987915039, -0.008276939392089844, -0.007613658905029297, -0.00695037841796875, -0.006287097930908203, -0.005623817443847656, -0.004960536956787109, -0.0042972564697265625, -0.0036339759826660156, -0.0029706954956054688, -0.002307415008544922, -0.001644134521484375, -0.0009808540344238281, -0.00031757354736328125, 0.0003457069396972656, 0.0010089874267578125, 0.0016722679138183594, 0.0023355484008789062, 0.002998828887939453, 0.003662109375, 0.004325389862060547, 0.004988670349121094, 0.005651950836181641, 0.0063152313232421875, 0.006978511810302734, 0.007641792297363281, 0.008305072784423828, 0.008968353271484375, 0.009631633758544922, 0.010294914245605469, 0.010958194732666016, 0.011621475219726562, 0.01228475570678711, 0.012948036193847656, 0.013611316680908203, 0.01427459716796875, 0.014937877655029297, 0.015601158142089844, 0.01626443862915039, 0.016927719116210938, 0.017590999603271484, 0.01825428009033203, 0.018917560577392578, 0.019580841064453125, 0.020244121551513672, 0.02090740203857422, 0.021570682525634766, 0.022233963012695312, 0.02289724349975586, 0.023560523986816406, 0.024223804473876953, 0.0248870849609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 12.0, 15.0, 19.0, 19.0, 29.0, 31.0, 42.0, 48.0, 49.0, 65.0, 80.0, 70.0, 59.0, 59.0, 51.0, 58.0, 60.0, 34.0, 28.0, 28.0, 28.0, 13.0, 22.0, 5.0, 8.0, 6.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.007099151611328125, -0.006922602653503418, -0.006746053695678711, -0.006569504737854004, -0.006392955780029297, -0.00621640682220459, -0.006039857864379883, -0.005863308906555176, -0.005686759948730469, -0.005510210990905762, -0.005333662033081055, -0.005157113075256348, -0.004980564117431641, -0.004804015159606934, -0.0046274662017822266, -0.0044509172439575195, -0.0042743682861328125, -0.0040978193283081055, -0.0039212703704833984, -0.0037447214126586914, -0.0035681724548339844, -0.0033916234970092773, -0.0032150745391845703, -0.0030385255813598633, -0.0028619766235351562, -0.0026854276657104492, -0.002508878707885742, -0.002332329750061035, -0.002155780792236328, -0.001979231834411621, -0.001802682876586914, -0.001626133918762207, -0.0014495849609375, -0.001273036003112793, -0.001096487045288086, -0.0009199380874633789, -0.0007433891296386719, -0.0005668401718139648, -0.0003902912139892578, -0.00021374225616455078, -3.719329833984375e-05, 0.00013935565948486328, 0.0003159046173095703, 0.0004924535751342773, 0.0006690025329589844, 0.0008455514907836914, 0.0010221004486083984, 0.0011986494064331055, 0.0013751983642578125, 0.0015517473220825195, 0.0017282962799072266, 0.0019048452377319336, 0.0020813941955566406, 0.0022579431533813477, 0.0024344921112060547, 0.0026110410690307617, 0.0027875900268554688, 0.0029641389846801758, 0.003140687942504883, 0.00331723690032959, 0.003493785858154297, 0.003670334815979004, 0.003846883773803711, 0.004023432731628418, 0.004199981689453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 12.0, 27.0, 46.0, 105.0, 211.0, 270.0, 179.0, 91.0, 40.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5026878714561462, -0.4737480580806732, -0.4448082447052002, -0.4158684015274048, -0.38692858815193176, -0.35798877477645874, -0.32904893159866333, -0.3001091182231903, -0.2711693048477173, -0.24222949147224426, -0.21328966319561005, -0.18434983491897583, -0.1554100215435028, -0.12647020816802979, -0.09753037989139557, -0.06859055161476135, -0.03965073823928833, -0.01071091741323471, 0.01822890341281891, 0.04716872423887253, 0.07610854506492615, 0.10504835844039917, 0.1339881867170334, 0.1629280149936676, 0.19186782836914062, 0.22080764174461365, 0.24974747002124786, 0.2786872982978821, 0.3076271116733551, 0.3365669250488281, 0.36550676822662354, 0.39444658160209656, 0.4233863353729248, 0.4523261487483978, 0.48126596212387085, 0.5102058053016663, 0.5391455888748169, 0.5680854320526123, 0.5970252752304077, 0.6259651184082031, 0.6549049019813538, 0.6838447451591492, 0.7127845287322998, 0.7417243719100952, 0.7706642150878906, 0.7996039986610413, 0.8285438418388367, 0.8574836254119873, 0.8864234685897827, 0.9153633117675781, 0.9443030953407288, 0.9732429385185242, 1.0021827220916748, 1.0311225652694702, 1.0600624084472656, 1.089002251625061, 1.1179420948028564, 1.1468819379806519, 1.1758217811584473, 1.2047615051269531, 1.2337013483047485, 1.262641191482544, 1.2915810346603394, 1.3205208778381348, 1.3494606018066406]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 1.0, 16.0, 8.0, 15.0, 15.0, 25.0, 24.0, 42.0, 33.0, 56.0, 42.0, 44.0, 36.0, 54.0, 37.0, 57.0, 62.0, 63.0, 40.0, 55.0, 42.0, 36.0, 34.0, 32.0, 29.0, 28.0, 21.0, 14.0, 9.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29349470138549805, -0.28555718064308167, -0.2776196599006653, -0.2696821391582489, -0.2617446184158325, -0.25380709767341614, -0.24586959183216095, -0.23793207108974457, -0.22999455034732819, -0.2220570296049118, -0.21411950886249542, -0.20618198812007904, -0.19824448227882385, -0.19030696153640747, -0.1823694407939911, -0.1744319200515747, -0.16649439930915833, -0.15855687856674194, -0.15061935782432556, -0.14268183708190918, -0.1347443163394928, -0.12680679559707642, -0.11886928975582123, -0.11093176901340485, -0.10299424827098846, -0.09505672752857208, -0.0871192067861557, -0.07918169349431992, -0.07124417275190353, -0.06330665200948715, -0.05536913499236107, -0.047431617975234985, -0.039494067430496216, -0.031556546688079834, -0.02361902967095375, -0.015681510791182518, -0.007743991911411285, 0.00019352883100509644, 0.00813104584813118, 0.016068562865257263, 0.024006083607673645, 0.03194360435009003, 0.03988112136721611, 0.047818638384342194, 0.055756159126758575, 0.06369367986917496, 0.07163119316101074, 0.07956871390342712, 0.0875062346458435, 0.09544375538825989, 0.10338127613067627, 0.11131878942251205, 0.11925631016492844, 0.12719383835792542, 0.1351313441991806, 0.14306886494159698, 0.15100638568401337, 0.15894390642642975, 0.16688142716884613, 0.1748189479112625, 0.1827564537525177, 0.19069397449493408, 0.19863149523735046, 0.20656901597976685, 0.21450653672218323]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 8.0, 12.0, 16.0, 34.0, 46.0, 71.0, 118.0, 219.0, 419.0, 787.0, 1548.0, 3218.0, 7573.0, 19814.0, 61345.0, 723252.0, 172201.0, 35335.0, 12534.0, 5225.0, 2288.0, 1176.0, 535.0, 296.0, 176.0, 103.0, 58.0, 38.0, 14.0, 18.0, 12.0, 8.0, 7.0, 3.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29596710205078125, -0.2860260009765625, -0.27608489990234375, -0.266143798828125, -0.25620269775390625, -0.2462615966796875, -0.23632049560546875, -0.22637939453125, -0.21643829345703125, -0.2064971923828125, -0.19655609130859375, -0.186614990234375, -0.17667388916015625, -0.1667327880859375, -0.15679168701171875, -0.1468505859375, -0.13690948486328125, -0.1269683837890625, -0.11702728271484375, -0.107086181640625, -0.09714508056640625, -0.0872039794921875, -0.07726287841796875, -0.06732177734375, -0.05738067626953125, -0.0474395751953125, -0.03749847412109375, -0.027557373046875, -0.01761627197265625, -0.0076751708984375, 0.00226593017578125, 0.01220703125, 0.02214813232421875, 0.0320892333984375, 0.04203033447265625, 0.051971435546875, 0.06191253662109375, 0.0718536376953125, 0.08179473876953125, 0.09173583984375, 0.10167694091796875, 0.1116180419921875, 0.12155914306640625, 0.131500244140625, 0.14144134521484375, 0.1513824462890625, 0.16132354736328125, 0.1712646484375, 0.18120574951171875, 0.1911468505859375, 0.20108795166015625, 0.211029052734375, 0.22097015380859375, 0.2309112548828125, 0.24085235595703125, 0.25079345703125, 0.26073455810546875, 0.2706756591796875, 0.28061676025390625, 0.290557861328125, 0.30049896240234375, 0.3104400634765625, 0.32038116455078125, 0.330322265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 11.0, 12.0, 14.0, 24.0, 29.0, 43.0, 41.0, 64.0, 59.0, 52.0, 72.0, 61.0, 113.0, 63.0, 60.0, 64.0, 52.0, 41.0, 39.0, 31.0, 21.0, 16.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6651153564453125, -0.642730712890625, -0.6203460693359375, -0.59796142578125, -0.5755767822265625, -0.553192138671875, -0.5308074951171875, -0.5084228515625, -0.4860382080078125, -0.463653564453125, -0.4412689208984375, -0.41888427734375, -0.3964996337890625, -0.374114990234375, -0.3517303466796875, -0.329345703125, -0.3069610595703125, -0.284576416015625, -0.2621917724609375, -0.23980712890625, -0.2174224853515625, -0.195037841796875, -0.1726531982421875, -0.1502685546875, -0.1278839111328125, -0.105499267578125, -0.0831146240234375, -0.06072998046875, -0.0383453369140625, -0.015960693359375, 0.0064239501953125, 0.02880859375, 0.0511932373046875, 0.073577880859375, 0.0959625244140625, 0.11834716796875, 0.1407318115234375, 0.163116455078125, 0.1855010986328125, 0.2078857421875, 0.2302703857421875, 0.252655029296875, 0.2750396728515625, 0.29742431640625, 0.3198089599609375, 0.342193603515625, 0.3645782470703125, 0.386962890625, 0.4093475341796875, 0.431732177734375, 0.4541168212890625, 0.47650146484375, 0.4988861083984375, 0.521270751953125, 0.5436553955078125, 0.5660400390625, 0.5884246826171875, 0.610809326171875, 0.6331939697265625, 0.65557861328125, 0.6779632568359375, 0.700347900390625, 0.7227325439453125, 0.7451171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 8.0, 16.0, 6.0, 15.0, 21.0, 21.0, 18.0, 27.0, 53.0, 47.0, 79.0, 94.0, 153.0, 418.0, 2624.0, 40775.0, 963344.0, 37367.0, 2453.0, 460.0, 137.0, 90.0, 83.0, 53.0, 41.0, 40.0, 28.0, 22.0, 9.0, 6.0, 12.0, 6.0, 11.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7556228637695312, -0.7299957275390625, -0.7043685913085938, -0.678741455078125, -0.6531143188476562, -0.6274871826171875, -0.6018600463867188, -0.57623291015625, -0.5506057739257812, -0.5249786376953125, -0.49935150146484375, -0.473724365234375, -0.44809722900390625, -0.4224700927734375, -0.39684295654296875, -0.3712158203125, -0.34558868408203125, -0.3199615478515625, -0.29433441162109375, -0.268707275390625, -0.24308013916015625, -0.2174530029296875, -0.19182586669921875, -0.16619873046875, -0.14057159423828125, -0.1149444580078125, -0.08931732177734375, -0.063690185546875, -0.03806304931640625, -0.0124359130859375, 0.01319122314453125, 0.038818359375, 0.06444549560546875, 0.0900726318359375, 0.11569976806640625, 0.141326904296875, 0.16695404052734375, 0.1925811767578125, 0.21820831298828125, 0.24383544921875, 0.26946258544921875, 0.2950897216796875, 0.32071685791015625, 0.346343994140625, 0.37197113037109375, 0.3975982666015625, 0.42322540283203125, 0.4488525390625, 0.47447967529296875, 0.5001068115234375, 0.5257339477539062, 0.551361083984375, 0.5769882202148438, 0.6026153564453125, 0.6282424926757812, 0.65386962890625, 0.6794967651367188, 0.7051239013671875, 0.7307510375976562, 0.756378173828125, 0.7820053100585938, 0.8076324462890625, 0.8332595825195312, 0.85888671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 9.0, 16.0, 11.0, 20.0, 25.0, 28.0, 33.0, 26.0, 50.0, 45.0, 41.0, 59.0, 44.0, 36.0, 59.0, 59.0, 64.0, 53.0, 38.0, 40.0, 34.0, 29.0, 29.0, 24.0, 25.0, 19.0, 13.0, 16.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6376953125, -0.618560791015625, -0.59942626953125, -0.580291748046875, -0.5611572265625, -0.542022705078125, -0.52288818359375, -0.503753662109375, -0.484619140625, -0.465484619140625, -0.44635009765625, -0.427215576171875, -0.4080810546875, -0.388946533203125, -0.36981201171875, -0.350677490234375, -0.33154296875, -0.312408447265625, -0.29327392578125, -0.274139404296875, -0.2550048828125, -0.235870361328125, -0.21673583984375, -0.197601318359375, -0.178466796875, -0.159332275390625, -0.14019775390625, -0.121063232421875, -0.1019287109375, -0.082794189453125, -0.06365966796875, -0.044525146484375, -0.025390625, -0.006256103515625, 0.01287841796875, 0.032012939453125, 0.0511474609375, 0.070281982421875, 0.08941650390625, 0.108551025390625, 0.127685546875, 0.146820068359375, 0.16595458984375, 0.185089111328125, 0.2042236328125, 0.223358154296875, 0.24249267578125, 0.261627197265625, 0.28076171875, 0.299896240234375, 0.31903076171875, 0.338165283203125, 0.3572998046875, 0.376434326171875, 0.39556884765625, 0.414703369140625, 0.433837890625, 0.452972412109375, 0.47210693359375, 0.491241455078125, 0.5103759765625, 0.529510498046875, 0.54864501953125, 0.567779541015625, 0.5869140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 11.0, 20.0, 14.0, 17.0, 26.0, 49.0, 90.0, 178.0, 325.0, 776.0, 2071.0, 7648.0, 83154.0, 915758.0, 31207.0, 4498.0, 1379.0, 650.0, 293.0, 142.0, 86.0, 50.0, 41.0, 15.0, 12.0, 14.0, 4.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.3470268249511719, -0.33882904052734375, -0.3306312561035156, -0.3224334716796875, -0.3142356872558594, -0.30603790283203125, -0.2978401184082031, -0.289642333984375, -0.2814445495605469, -0.27324676513671875, -0.2650489807128906, -0.2568511962890625, -0.24865341186523438, -0.24045562744140625, -0.23225784301757812, -0.22406005859375, -0.21586227416992188, -0.20766448974609375, -0.19946670532226562, -0.1912689208984375, -0.18307113647460938, -0.17487335205078125, -0.16667556762695312, -0.158477783203125, -0.15027999877929688, -0.14208221435546875, -0.13388442993164062, -0.1256866455078125, -0.11748886108398438, -0.10929107666015625, -0.10109329223632812, -0.0928955078125, -0.08469772338867188, -0.07649993896484375, -0.06830215454101562, -0.0601043701171875, -0.051906585693359375, -0.04370880126953125, -0.035511016845703125, -0.027313232421875, -0.019115447998046875, -0.01091766357421875, -0.002719879150390625, 0.0054779052734375, 0.013675689697265625, 0.02187347412109375, 0.030071258544921875, 0.03826904296875, 0.046466827392578125, 0.05466461181640625, 0.06286239624023438, 0.0710601806640625, 0.07925796508789062, 0.08745574951171875, 0.09565353393554688, 0.103851318359375, 0.11204910278320312, 0.12024688720703125, 0.12844467163085938, 0.1366424560546875, 0.14484024047851562, 0.15303802490234375, 0.16123580932617188, 0.16943359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 13.0, 14.0, 20.0, 35.0, 48.0, 148.0, 517.0, 81.0, 48.0, 32.0, 16.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860494613647461e-05, -6.705615669488907e-05, -6.550736725330353e-05, -6.395857781171799e-05, -6.240978837013245e-05, -6.0860998928546906e-05, -5.9312209486961365e-05, -5.7763420045375824e-05, -5.621463060379028e-05, -5.466584116220474e-05, -5.31170517206192e-05, -5.156826227903366e-05, -5.001947283744812e-05, -4.847068339586258e-05, -4.692189395427704e-05, -4.53731045126915e-05, -4.382431507110596e-05, -4.2275525629520416e-05, -4.0726736187934875e-05, -3.9177946746349335e-05, -3.7629157304763794e-05, -3.608036786317825e-05, -3.453157842159271e-05, -3.298278898000717e-05, -3.143399953842163e-05, -2.988521009683609e-05, -2.833642065525055e-05, -2.678763121366501e-05, -2.5238841772079468e-05, -2.3690052330493927e-05, -2.2141262888908386e-05, -2.0592473447322845e-05, -1.9043684005737305e-05, -1.7494894564151764e-05, -1.5946105122566223e-05, -1.4397315680980682e-05, -1.2848526239395142e-05, -1.12997367978096e-05, -9.75094735622406e-06, -8.20215791463852e-06, -6.6533684730529785e-06, -5.104579031467438e-06, -3.555789589881897e-06, -2.007000148296356e-06, -4.5821070671081543e-07, 1.0905787348747253e-06, 2.639368176460266e-06, 4.188157618045807e-06, 5.736947059631348e-06, 7.2857365012168884e-06, 8.83452594280243e-06, 1.038331538438797e-05, 1.193210482597351e-05, 1.3480894267559052e-05, 1.5029683709144592e-05, 1.6578473150730133e-05, 1.8127262592315674e-05, 1.9676052033901215e-05, 2.1224841475486755e-05, 2.2773630917072296e-05, 2.4322420358657837e-05, 2.5871209800243378e-05, 2.741999924182892e-05, 2.896878868341446e-05, 3.0517578125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 18.0, 32.0, 93.0, 163.0, 265.0, 519.0, 1166.0, 4470.0, 90519.0, 932297.0, 15328.0, 2086.0, 763.0, 373.0, 201.0, 100.0, 57.0, 33.0, 20.0, 8.0, 4.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.322265625, -0.3104400634765625, -0.298614501953125, -0.2867889404296875, -0.27496337890625, -0.2631378173828125, -0.251312255859375, -0.2394866943359375, -0.2276611328125, -0.2158355712890625, -0.204010009765625, -0.1921844482421875, -0.18035888671875, -0.1685333251953125, -0.156707763671875, -0.1448822021484375, -0.133056640625, -0.1212310791015625, -0.109405517578125, -0.0975799560546875, -0.08575439453125, -0.0739288330078125, -0.062103271484375, -0.0502777099609375, -0.0384521484375, -0.0266265869140625, -0.014801025390625, -0.0029754638671875, 0.00885009765625, 0.0206756591796875, 0.032501220703125, 0.0443267822265625, 0.05615234375, 0.0679779052734375, 0.079803466796875, 0.0916290283203125, 0.10345458984375, 0.1152801513671875, 0.127105712890625, 0.1389312744140625, 0.1507568359375, 0.1625823974609375, 0.174407958984375, 0.1862335205078125, 0.19805908203125, 0.2098846435546875, 0.221710205078125, 0.2335357666015625, 0.245361328125, 0.2571868896484375, 0.269012451171875, 0.2808380126953125, 0.29266357421875, 0.3044891357421875, 0.316314697265625, 0.3281402587890625, 0.3399658203125, 0.3517913818359375, 0.363616943359375, 0.3754425048828125, 0.38726806640625, 0.3990936279296875, 0.410919189453125, 0.4227447509765625, 0.4345703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 16.0, 30.0, 52.0, 69.0, 361.0, 289.0, 65.0, 39.0, 24.0, 18.0, 14.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14690303802490234, -0.1429271697998047, -0.13895130157470703, -0.13497543334960938, -0.13099956512451172, -0.12702369689941406, -0.1230478286743164, -0.11907196044921875, -0.1150960922241211, -0.11112022399902344, -0.10714435577392578, -0.10316848754882812, -0.09919261932373047, -0.09521675109863281, -0.09124088287353516, -0.0872650146484375, -0.08328914642333984, -0.07931327819824219, -0.07533740997314453, -0.07136154174804688, -0.06738567352294922, -0.06340980529785156, -0.059433937072753906, -0.05545806884765625, -0.051482200622558594, -0.04750633239746094, -0.04353046417236328, -0.039554595947265625, -0.03557872772216797, -0.03160285949707031, -0.027626991271972656, -0.023651123046875, -0.019675254821777344, -0.015699386596679688, -0.011723518371582031, -0.007747650146484375, -0.0037717819213867188, 0.0002040863037109375, 0.004179954528808594, 0.00815582275390625, 0.012131690979003906, 0.016107559204101562, 0.02008342742919922, 0.024059295654296875, 0.02803516387939453, 0.03201103210449219, 0.035986900329589844, 0.0399627685546875, 0.043938636779785156, 0.04791450500488281, 0.05189037322998047, 0.055866241455078125, 0.05984210968017578, 0.06381797790527344, 0.0677938461303711, 0.07176971435546875, 0.0757455825805664, 0.07972145080566406, 0.08369731903076172, 0.08767318725585938, 0.09164905548095703, 0.09562492370605469, 0.09960079193115234, 0.10357666015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 9.0, 23.0, 65.0, 188.0, 355.0, 262.0, 77.0, 23.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4813905656337738, -0.3963336944580078, -0.31127679347991943, -0.22621992230415344, -0.14116302132606506, -0.056106120347976685, 0.02895072102546692, 0.1140076220035553, 0.19906452298164368, 0.28412139415740967, 0.36917829513549805, 0.45423516631126404, 0.5392920970916748, 0.6243489980697632, 0.709405779838562, 0.7944626808166504, 0.8795195817947388, 0.9645764827728271, 1.0496333837509155, 1.134690284729004, 1.2197470664978027, 1.3048040866851807, 1.3898608684539795, 1.4749177694320679, 1.5599746704101562, 1.6450315713882446, 1.730088472366333, 1.8151452541351318, 1.9002022743225098, 1.9852590560913086, 2.0703158378601074, 2.1553728580474854, 2.2404298782348633, 2.325486660003662, 2.41054368019104, 2.495600461959839, 2.580657482147217, 2.6657142639160156, 2.7507710456848145, 2.8358280658721924, 2.9208850860595703, 3.005941867828369, 3.090998888015747, 3.176055669784546, 3.261112689971924, 3.3461694717407227, 3.4312262535095215, 3.5162832736968994, 3.6013400554656982, 3.686396837234497, 3.771453857421875, 3.856510639190674, 3.9415676593780518, 4.02662467956543, 4.1116814613342285, 4.196738243103027, 4.281795024871826, 4.366851806640625, 4.451908588409424, 4.536965847015381, 4.62202262878418, 4.7070794105529785, 4.792136192321777, 4.877193450927734, 4.962250232696533]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 4.0, 2.0, 12.0, 16.0, 10.0, 10.0, 19.0, 11.0, 25.0, 20.0, 26.0, 23.0, 23.0, 35.0, 38.0, 42.0, 38.0, 47.0, 30.0, 51.0, 36.0, 40.0, 38.0, 45.0, 39.0, 38.0, 30.0, 47.0, 36.0, 26.0, 23.0, 18.0, 11.0, 19.0, 8.0, 14.0, 11.0, 10.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8738496899604797, -0.8473448157310486, -0.8208399415016174, -0.7943350672721863, -0.7678301930427551, -0.741325318813324, -0.7148204445838928, -0.6883155703544617, -0.6618106961250305, -0.6353058218955994, -0.6088009476661682, -0.5822960734367371, -0.5557911992073059, -0.5292863249778748, -0.5027814507484436, -0.47627657651901245, -0.4497717320919037, -0.42326685786247253, -0.3967619836330414, -0.37025710940361023, -0.3437522351741791, -0.3172473907470703, -0.29074251651763916, -0.264237642288208, -0.23773275315761566, -0.2112278789281845, -0.18472300469875336, -0.1582181453704834, -0.13171327114105225, -0.1052083969116211, -0.07870352268218994, -0.05219864845275879, -0.025693774223327637, 0.0008110981434583664, 0.02731597051024437, 0.05382084101438522, 0.08032571524381638, 0.10683058202266693, 0.13333545625209808, 0.15984033048152924, 0.1863452047109604, 0.21285007894039154, 0.2393549531698227, 0.26585981249809265, 0.2923646867275238, 0.31886956095695496, 0.3453744351863861, 0.37187930941581726, 0.3983841836452484, 0.42488905787467957, 0.4513939321041107, 0.47789880633354187, 0.5044036507606506, 0.5309085249900818, 0.5574133992195129, 0.5839182734489441, 0.6104231476783752, 0.6369280219078064, 0.6634328961372375, 0.6899377703666687, 0.7164426445960999, 0.742947518825531, 0.7694523930549622, 0.7959572672843933, 0.8224621415138245]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 17.0, 23.0, 23.0, 30.0, 50.0, 56.0, 146.0, 251.0, 452.0, 1401.0, 4552.0, 21710.0, 419023.0, 3617665.0, 112161.0, 12039.0, 2807.0, 978.0, 386.0, 178.0, 97.0, 71.0, 51.0, 24.0, 21.0, 18.0, 6.0, 6.0, 3.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7046051025390625, -0.676788330078125, -0.6489715576171875, -0.62115478515625, -0.5933380126953125, -0.565521240234375, -0.5377044677734375, -0.5098876953125, -0.4820709228515625, -0.454254150390625, -0.4264373779296875, -0.39862060546875, -0.3708038330078125, -0.342987060546875, -0.3151702880859375, -0.287353515625, -0.2595367431640625, -0.231719970703125, -0.2039031982421875, -0.17608642578125, -0.1482696533203125, -0.120452880859375, -0.0926361083984375, -0.0648193359375, -0.0370025634765625, -0.009185791015625, 0.0186309814453125, 0.04644775390625, 0.0742645263671875, 0.102081298828125, 0.1298980712890625, 0.15771484375, 0.1855316162109375, 0.213348388671875, 0.2411651611328125, 0.26898193359375, 0.2967987060546875, 0.324615478515625, 0.3524322509765625, 0.3802490234375, 0.4080657958984375, 0.435882568359375, 0.4636993408203125, 0.49151611328125, 0.5193328857421875, 0.547149658203125, 0.5749664306640625, 0.602783203125, 0.6305999755859375, 0.658416748046875, 0.6862335205078125, 0.71405029296875, 0.7418670654296875, 0.769683837890625, 0.7975006103515625, 0.8253173828125, 0.8531341552734375, 0.880950927734375, 0.9087677001953125, 0.93658447265625, 0.9644012451171875, 0.992218017578125, 1.0200347900390625, 1.0478515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 7.0, 21.0, 15.0, 12.0, 21.0, 19.0, 36.0, 25.0, 44.0, 39.0, 47.0, 48.0, 40.0, 51.0, 60.0, 59.0, 57.0, 51.0, 50.0, 36.0, 37.0, 41.0, 33.0, 29.0, 23.0, 9.0, 20.0, 12.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.2958564758300781, -0.28702545166015625, -0.2781944274902344, -0.2693634033203125, -0.2605323791503906, -0.25170135498046875, -0.24287033081054688, -0.234039306640625, -0.22520828247070312, -0.21637725830078125, -0.20754623413085938, -0.1987152099609375, -0.18988418579101562, -0.18105316162109375, -0.17222213745117188, -0.16339111328125, -0.15456008911132812, -0.14572906494140625, -0.13689804077148438, -0.1280670166015625, -0.11923599243164062, -0.11040496826171875, -0.10157394409179688, -0.092742919921875, -0.08391189575195312, -0.07508087158203125, -0.06624984741210938, -0.0574188232421875, -0.048587799072265625, -0.03975677490234375, -0.030925750732421875, -0.0220947265625, -0.013263702392578125, -0.00443267822265625, 0.004398345947265625, 0.0132293701171875, 0.022060394287109375, 0.03089141845703125, 0.039722442626953125, 0.048553466796875, 0.057384490966796875, 0.06621551513671875, 0.07504653930664062, 0.0838775634765625, 0.09270858764648438, 0.10153961181640625, 0.11037063598632812, 0.11920166015625, 0.12803268432617188, 0.13686370849609375, 0.14569473266601562, 0.1545257568359375, 0.16335678100585938, 0.17218780517578125, 0.18101882934570312, 0.189849853515625, 0.19868087768554688, 0.20751190185546875, 0.21634292602539062, 0.2251739501953125, 0.23400497436523438, 0.24283599853515625, 0.2516670227050781, 0.260498046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 11.0, 23.0, 31.0, 50.0, 133.0, 313.0, 871.0, 3555.0, 42983.0, 3934223.0, 202189.0, 7672.0, 1428.0, 445.0, 167.0, 76.0, 51.0, 15.0, 16.0, 8.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2099609375, -1.1705322265625, -1.131103515625, -1.0916748046875, -1.05224609375, -1.0128173828125, -0.973388671875, -0.9339599609375, -0.89453125, -0.8551025390625, -0.815673828125, -0.7762451171875, -0.73681640625, -0.6973876953125, -0.657958984375, -0.6185302734375, -0.5791015625, -0.5396728515625, -0.500244140625, -0.4608154296875, -0.42138671875, -0.3819580078125, -0.342529296875, -0.3031005859375, -0.263671875, -0.2242431640625, -0.184814453125, -0.1453857421875, -0.10595703125, -0.0665283203125, -0.027099609375, 0.0123291015625, 0.0517578125, 0.0911865234375, 0.130615234375, 0.1700439453125, 0.20947265625, 0.2489013671875, 0.288330078125, 0.3277587890625, 0.3671875, 0.4066162109375, 0.446044921875, 0.4854736328125, 0.52490234375, 0.5643310546875, 0.603759765625, 0.6431884765625, 0.6826171875, 0.7220458984375, 0.761474609375, 0.8009033203125, 0.84033203125, 0.8797607421875, 0.919189453125, 0.9586181640625, 0.998046875, 1.0374755859375, 1.076904296875, 1.1163330078125, 1.15576171875, 1.1951904296875, 1.234619140625, 1.2740478515625, 1.3134765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 41.0, 53.0, 94.0, 173.0, 363.0, 841.0, 1210.0, 676.0, 274.0, 139.0, 63.0, 45.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.32614707946777344, -0.3180656433105469, -0.3099842071533203, -0.30190277099609375, -0.2938213348388672, -0.2857398986816406, -0.27765846252441406, -0.2695770263671875, -0.26149559020996094, -0.2534141540527344, -0.2453327178955078, -0.23725128173828125, -0.2291698455810547, -0.22108840942382812, -0.21300697326660156, -0.204925537109375, -0.19684410095214844, -0.18876266479492188, -0.1806812286376953, -0.17259979248046875, -0.1645183563232422, -0.15643692016601562, -0.14835548400878906, -0.1402740478515625, -0.13219261169433594, -0.12411117553710938, -0.11602973937988281, -0.10794830322265625, -0.09986686706542969, -0.09178543090820312, -0.08370399475097656, -0.07562255859375, -0.06754112243652344, -0.059459686279296875, -0.05137825012207031, -0.04329681396484375, -0.03521537780761719, -0.027133941650390625, -0.019052505493164062, -0.0109710693359375, -0.0028896331787109375, 0.005191802978515625, 0.013273239135742188, 0.02135467529296875, 0.029436111450195312, 0.037517547607421875, 0.04559898376464844, 0.053680419921875, 0.06176185607910156, 0.06984329223632812, 0.07792472839355469, 0.08600616455078125, 0.09408760070800781, 0.10216903686523438, 0.11025047302246094, 0.1183319091796875, 0.12641334533691406, 0.13449478149414062, 0.1425762176513672, 0.15065765380859375, 0.1587390899658203, 0.16682052612304688, 0.17490196228027344, 0.1829833984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 20.0, 16.0, 39.0, 43.0, 74.0, 80.0, 100.0, 121.0, 128.0, 107.0, 96.0, 54.0, 38.0, 30.0, 11.0, 16.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7881006598472595, -0.7657932639122009, -0.7434858679771423, -0.7211785316467285, -0.6988711357116699, -0.6765637397766113, -0.6542563438415527, -0.6319489479064941, -0.6096415519714355, -0.587334156036377, -0.5650267601013184, -0.5427193641662598, -0.520412027835846, -0.49810463190078735, -0.47579723596572876, -0.45348984003067017, -0.43118247389793396, -0.40887507796287537, -0.38656771183013916, -0.36426031589508057, -0.341952919960022, -0.3196455240249634, -0.2973381578922272, -0.2750307619571686, -0.2527233958244324, -0.23041601479053497, -0.20810861885547638, -0.18580123782157898, -0.16349384188652039, -0.14118646085262299, -0.11887907981872559, -0.09657168388366699, -0.0742642879486084, -0.0519568994641304, -0.029649514704942703, -0.007342129945755005, 0.014965258538722992, 0.03727264702320099, 0.05958002805709839, 0.08188742399215698, 0.10419480502605438, 0.12650218605995178, 0.14880958199501038, 0.17111696302890778, 0.19342434406280518, 0.21573173999786377, 0.23803912103176117, 0.26034653186798096, 0.28265389800071716, 0.30496129393577576, 0.32726866006851196, 0.34957605600357056, 0.37188345193862915, 0.39419084787368774, 0.41649821400642395, 0.43880560994148254, 0.46111297607421875, 0.48342037200927734, 0.5057277679443359, 0.5280351638793945, 0.5503425002098083, 0.5726498961448669, 0.5949572920799255, 0.6172646880149841, 0.6395720839500427]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 9.0, 13.0, 16.0, 15.0, 14.0, 20.0, 17.0, 20.0, 27.0, 32.0, 46.0, 27.0, 31.0, 48.0, 39.0, 57.0, 47.0, 38.0, 39.0, 44.0, 43.0, 26.0, 33.0, 29.0, 29.0, 31.0, 26.0, 21.0, 22.0, 20.0, 9.0, 19.0, 17.0, 8.0, 9.0, 5.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32736608386039734, -0.3176831007003784, -0.3080001473426819, -0.29831716418266296, -0.28863418102264404, -0.2789512276649475, -0.2692682445049286, -0.25958526134490967, -0.24990229308605194, -0.2402193248271942, -0.2305363416671753, -0.22085337340831757, -0.21117040514945984, -0.20148742198944092, -0.1918044537305832, -0.18212148547172546, -0.17243850231170654, -0.16275553405284882, -0.1530725508928299, -0.14338958263397217, -0.13370659947395325, -0.12402363121509552, -0.11434066295623779, -0.10465768724679947, -0.09497471153736115, -0.08529173582792282, -0.0756087601184845, -0.06592579185962677, -0.056242816150188446, -0.04655984044075012, -0.0368768684566021, -0.02719389647245407, -0.017510920763015747, -0.007827946916222572, 0.0018550269305706024, 0.011538000777363777, 0.021220974624156952, 0.030903950333595276, 0.0405869223177433, 0.05026989430189133, 0.05995287001132965, 0.06963584572076797, 0.0793188214302063, 0.08900178968906403, 0.09868476539850235, 0.10836774110794067, 0.1180507093667984, 0.12773367762565613, 0.13741666078567505, 0.14709962904453278, 0.1567826122045517, 0.16646558046340942, 0.17614856362342834, 0.18583153188228607, 0.1955145001411438, 0.20519748330116272, 0.21488045156002045, 0.22456341981887817, 0.2342464029788971, 0.24392937123775482, 0.25361233949661255, 0.26329532265663147, 0.2729783058166504, 0.2826612591743469, 0.29234424233436584]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 11.0, 8.0, 18.0, 20.0, 40.0, 63.0, 101.0, 258.0, 455.0, 932.0, 2073.0, 4916.0, 12592.0, 48545.0, 530922.0, 391153.0, 37620.0, 10989.0, 4365.0, 1812.0, 829.0, 369.0, 202.0, 102.0, 49.0, 29.0, 18.0, 17.0, 6.0, 6.0, 6.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983642578125, -0.19173622131347656, -0.18510818481445312, -0.1784801483154297, -0.17185211181640625, -0.1652240753173828, -0.15859603881835938, -0.15196800231933594, -0.1453399658203125, -0.13871192932128906, -0.13208389282226562, -0.1254558563232422, -0.11882781982421875, -0.11219978332519531, -0.10557174682617188, -0.09894371032714844, -0.092315673828125, -0.08568763732910156, -0.07905960083007812, -0.07243156433105469, -0.06580352783203125, -0.05917549133300781, -0.052547454833984375, -0.04591941833496094, -0.0392913818359375, -0.03266334533691406, -0.026035308837890625, -0.019407272338867188, -0.01277923583984375, -0.0061511993408203125, 0.000476837158203125, 0.0071048736572265625, 0.01373291015625, 0.020360946655273438, 0.026988983154296875, 0.03361701965332031, 0.04024505615234375, 0.04687309265136719, 0.053501129150390625, 0.06012916564941406, 0.0667572021484375, 0.07338523864746094, 0.08001327514648438, 0.08664131164550781, 0.09326934814453125, 0.09989738464355469, 0.10652542114257812, 0.11315345764160156, 0.119781494140625, 0.12640953063964844, 0.13303756713867188, 0.1396656036376953, 0.14629364013671875, 0.1529216766357422, 0.15954971313476562, 0.16617774963378906, 0.1728057861328125, 0.17943382263183594, 0.18606185913085938, 0.1926898956298828, 0.19931793212890625, 0.2059459686279297, 0.21257400512695312, 0.21920204162597656, 0.225830078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 14.0, 13.0, 17.0, 20.0, 21.0, 25.0, 25.0, 42.0, 42.0, 56.0, 36.0, 66.0, 63.0, 58.0, 55.0, 56.0, 52.0, 44.0, 50.0, 47.0, 35.0, 32.0, 25.0, 24.0, 19.0, 20.0, 8.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2749481201171875, -0.265472412109375, -0.2559967041015625, -0.24652099609375, -0.2370452880859375, -0.227569580078125, -0.2180938720703125, -0.2086181640625, -0.1991424560546875, -0.189666748046875, -0.1801910400390625, -0.17071533203125, -0.1612396240234375, -0.151763916015625, -0.1422882080078125, -0.1328125, -0.1233367919921875, -0.113861083984375, -0.1043853759765625, -0.09490966796875, -0.0854339599609375, -0.075958251953125, -0.0664825439453125, -0.0570068359375, -0.0475311279296875, -0.038055419921875, -0.0285797119140625, -0.01910400390625, -0.0096282958984375, -0.000152587890625, 0.0093231201171875, 0.018798828125, 0.0282745361328125, 0.037750244140625, 0.0472259521484375, 0.05670166015625, 0.0661773681640625, 0.075653076171875, 0.0851287841796875, 0.0946044921875, 0.1040802001953125, 0.113555908203125, 0.1230316162109375, 0.13250732421875, 0.1419830322265625, 0.151458740234375, 0.1609344482421875, 0.17041015625, 0.1798858642578125, 0.189361572265625, 0.1988372802734375, 0.20831298828125, 0.2177886962890625, 0.227264404296875, 0.2367401123046875, 0.2462158203125, 0.2556915283203125, 0.265167236328125, 0.2746429443359375, 0.28411865234375, 0.2935943603515625, 0.303070068359375, 0.3125457763671875, 0.322021484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 13.0, 17.0, 18.0, 29.0, 42.0, 40.0, 81.0, 122.0, 138.0, 219.0, 339.0, 578.0, 951.0, 1671.0, 3203.0, 6877.0, 15393.0, 41863.0, 148197.0, 448736.0, 268096.0, 69813.0, 22853.0, 9428.0, 4385.0, 2244.0, 1237.0, 687.0, 418.0, 256.0, 167.0, 123.0, 91.0, 55.0, 35.0, 39.0, 31.0, 21.0, 18.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0916748046875, -0.08895587921142578, -0.08623695373535156, -0.08351802825927734, -0.08079910278320312, -0.0780801773071289, -0.07536125183105469, -0.07264232635498047, -0.06992340087890625, -0.06720447540283203, -0.06448554992675781, -0.061766624450683594, -0.059047698974609375, -0.056328773498535156, -0.05360984802246094, -0.05089092254638672, -0.0481719970703125, -0.04545307159423828, -0.04273414611816406, -0.040015220642089844, -0.037296295166015625, -0.034577369689941406, -0.03185844421386719, -0.02913951873779297, -0.02642059326171875, -0.02370166778564453, -0.020982742309570312, -0.018263816833496094, -0.015544891357421875, -0.012825965881347656, -0.010107040405273438, -0.007388114929199219, -0.004669189453125, -0.0019502639770507812, 0.0007686614990234375, 0.0034875869750976562, 0.006206512451171875, 0.008925437927246094, 0.011644363403320312, 0.014363288879394531, 0.01708221435546875, 0.01980113983154297, 0.022520065307617188, 0.025238990783691406, 0.027957916259765625, 0.030676841735839844, 0.03339576721191406, 0.03611469268798828, 0.0388336181640625, 0.04155254364013672, 0.04427146911621094, 0.046990394592285156, 0.049709320068359375, 0.052428245544433594, 0.05514717102050781, 0.05786609649658203, 0.06058502197265625, 0.06330394744873047, 0.06602287292480469, 0.0687417984008789, 0.07146072387695312, 0.07417964935302734, 0.07689857482910156, 0.07961750030517578, 0.08233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 11.0, 4.0, 6.0, 16.0, 14.0, 18.0, 11.0, 14.0, 17.0, 18.0, 26.0, 32.0, 24.0, 40.0, 35.0, 57.0, 48.0, 56.0, 50.0, 41.0, 45.0, 56.0, 35.0, 44.0, 39.0, 41.0, 34.0, 43.0, 21.0, 18.0, 10.0, 12.0, 13.0, 10.0, 10.0, 9.0, 2.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.49017333984375, -0.4739990234375, -0.45782470703125, -0.441650390625, -0.42547607421875, -0.4093017578125, -0.39312744140625, -0.376953125, -0.36077880859375, -0.3446044921875, -0.32843017578125, -0.312255859375, -0.29608154296875, -0.2799072265625, -0.26373291015625, -0.24755859375, -0.23138427734375, -0.2152099609375, -0.19903564453125, -0.182861328125, -0.16668701171875, -0.1505126953125, -0.13433837890625, -0.1181640625, -0.10198974609375, -0.0858154296875, -0.06964111328125, -0.053466796875, -0.03729248046875, -0.0211181640625, -0.00494384765625, 0.01123046875, 0.02740478515625, 0.0435791015625, 0.05975341796875, 0.075927734375, 0.09210205078125, 0.1082763671875, 0.12445068359375, 0.140625, 0.15679931640625, 0.1729736328125, 0.18914794921875, 0.205322265625, 0.22149658203125, 0.2376708984375, 0.25384521484375, 0.27001953125, 0.28619384765625, 0.3023681640625, 0.31854248046875, 0.334716796875, 0.35089111328125, 0.3670654296875, 0.38323974609375, 0.3994140625, 0.41558837890625, 0.4317626953125, 0.44793701171875, 0.464111328125, 0.48028564453125, 0.4964599609375, 0.51263427734375, 0.52880859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 19.0, 17.0, 37.0, 54.0, 93.0, 150.0, 320.0, 611.0, 1228.0, 3025.0, 9222.0, 44813.0, 379836.0, 523678.0, 66679.0, 12088.0, 3629.0, 1476.0, 699.0, 361.0, 191.0, 109.0, 59.0, 47.0, 26.0, 22.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.04046964645385742, -0.039282798767089844, -0.038095951080322266, -0.03690910339355469, -0.03572225570678711, -0.03453540802001953, -0.03334856033325195, -0.032161712646484375, -0.030974864959716797, -0.02978801727294922, -0.02860116958618164, -0.027414321899414062, -0.026227474212646484, -0.025040626525878906, -0.023853778839111328, -0.02266693115234375, -0.021480083465576172, -0.020293235778808594, -0.019106388092041016, -0.017919540405273438, -0.01673269271850586, -0.015545845031738281, -0.014358997344970703, -0.013172149658203125, -0.011985301971435547, -0.010798454284667969, -0.00961160659790039, -0.008424758911132812, -0.007237911224365234, -0.006051063537597656, -0.004864215850830078, -0.0036773681640625, -0.002490520477294922, -0.0013036727905273438, -0.00011682510375976562, 0.0010700225830078125, 0.0022568702697753906, 0.0034437179565429688, 0.004630565643310547, 0.005817413330078125, 0.007004261016845703, 0.008191108703613281, 0.00937795639038086, 0.010564804077148438, 0.011751651763916016, 0.012938499450683594, 0.014125347137451172, 0.01531219482421875, 0.016499042510986328, 0.017685890197753906, 0.018872737884521484, 0.020059585571289062, 0.02124643325805664, 0.02243328094482422, 0.023620128631591797, 0.024806976318359375, 0.025993824005126953, 0.02718067169189453, 0.02836751937866211, 0.029554367065429688, 0.030741214752197266, 0.031928062438964844, 0.03311491012573242, 0.0343017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 15.0, 8.0, 16.0, 34.0, 56.0, 87.0, 124.0, 138.0, 140.0, 133.0, 93.0, 52.0, 35.0, 24.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-05, -2.299528568983078e-05, -2.214871346950531e-05, -2.130214124917984e-05, -2.045556902885437e-05, -1.96089968085289e-05, -1.876242458820343e-05, -1.791585236787796e-05, -1.706928014755249e-05, -1.622270792722702e-05, -1.537613570690155e-05, -1.452956348657608e-05, -1.368299126625061e-05, -1.283641904592514e-05, -1.198984682559967e-05, -1.11432746052742e-05, -1.029670238494873e-05, -9.45013016462326e-06, -8.60355794429779e-06, -7.75698572397232e-06, -6.910413503646851e-06, -6.063841283321381e-06, -5.217269062995911e-06, -4.370696842670441e-06, -3.5241246223449707e-06, -2.6775524020195007e-06, -1.8309801816940308e-06, -9.844079613685608e-07, -1.3783574104309082e-07, 7.087364792823792e-07, 1.5553086996078491e-06, 2.401880919933319e-06, 3.248453140258789e-06, 4.095025360584259e-06, 4.941597580909729e-06, 5.788169801235199e-06, 6.634742021560669e-06, 7.481314241886139e-06, 8.327886462211609e-06, 9.174458682537079e-06, 1.0021030902862549e-05, 1.0867603123188019e-05, 1.1714175343513489e-05, 1.2560747563838959e-05, 1.3407319784164429e-05, 1.4253892004489899e-05, 1.5100464224815369e-05, 1.594703644514084e-05, 1.679360866546631e-05, 1.764018088579178e-05, 1.848675310611725e-05, 1.933332532644272e-05, 2.017989754676819e-05, 2.102646976709366e-05, 2.187304198741913e-05, 2.27196142077446e-05, 2.356618642807007e-05, 2.441275864839554e-05, 2.5259330868721008e-05, 2.6105903089046478e-05, 2.6952475309371948e-05, 2.7799047529697418e-05, 2.8645619750022888e-05, 2.9492191970348358e-05, 3.0338764190673828e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 13.0, 18.0, 22.0, 26.0, 44.0, 67.0, 146.0, 238.0, 431.0, 813.0, 1470.0, 3254.0, 8793.0, 33870.0, 169471.0, 545038.0, 223441.0, 43398.0, 10623.0, 3728.0, 1623.0, 815.0, 497.0, 280.0, 150.0, 94.0, 64.0, 36.0, 30.0, 17.0, 11.0, 8.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-0.03485107421875, -0.033843278884887695, -0.03283548355102539, -0.031827688217163086, -0.03081989288330078, -0.029812097549438477, -0.028804302215576172, -0.027796506881713867, -0.026788711547851562, -0.025780916213989258, -0.024773120880126953, -0.02376532554626465, -0.022757530212402344, -0.02174973487854004, -0.020741939544677734, -0.01973414421081543, -0.018726348876953125, -0.01771855354309082, -0.016710758209228516, -0.01570296287536621, -0.014695167541503906, -0.013687372207641602, -0.012679576873779297, -0.011671781539916992, -0.010663986206054688, -0.009656190872192383, -0.008648395538330078, -0.0076406002044677734, -0.006632804870605469, -0.005625009536743164, -0.004617214202880859, -0.0036094188690185547, -0.00260162353515625, -0.0015938282012939453, -0.0005860328674316406, 0.00042176246643066406, 0.0014295578002929688, 0.0024373531341552734, 0.003445148468017578, 0.004452943801879883, 0.0054607391357421875, 0.006468534469604492, 0.007476329803466797, 0.008484125137329102, 0.009491920471191406, 0.010499715805053711, 0.011507511138916016, 0.01251530647277832, 0.013523101806640625, 0.01453089714050293, 0.015538692474365234, 0.01654648780822754, 0.017554283142089844, 0.01856207847595215, 0.019569873809814453, 0.020577669143676758, 0.021585464477539062, 0.022593259811401367, 0.023601055145263672, 0.024608850479125977, 0.02561664581298828, 0.026624441146850586, 0.02763223648071289, 0.028640031814575195, 0.0296478271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 5.0, 8.0, 9.0, 11.0, 15.0, 19.0, 20.0, 35.0, 39.0, 56.0, 60.0, 100.0, 91.0, 76.0, 62.0, 72.0, 64.0, 60.0, 38.0, 34.0, 26.0, 25.0, 12.0, 13.0, 7.0, 9.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.01062774658203125, -0.01036381721496582, -0.01009988784790039, -0.009835958480834961, -0.009572029113769531, -0.009308099746704102, -0.009044170379638672, -0.008780241012573242, -0.008516311645507812, -0.008252382278442383, -0.007988452911376953, -0.0077245235443115234, -0.007460594177246094, -0.007196664810180664, -0.006932735443115234, -0.006668806076049805, -0.006404876708984375, -0.006140947341918945, -0.005877017974853516, -0.005613088607788086, -0.005349159240722656, -0.0050852298736572266, -0.004821300506591797, -0.004557371139526367, -0.0042934417724609375, -0.004029512405395508, -0.003765583038330078, -0.0035016536712646484, -0.0032377243041992188, -0.002973794937133789, -0.0027098655700683594, -0.0024459362030029297, -0.0021820068359375, -0.0019180774688720703, -0.0016541481018066406, -0.001390218734741211, -0.0011262893676757812, -0.0008623600006103516, -0.0005984306335449219, -0.0003345012664794922, -7.05718994140625e-05, 0.0001933574676513672, 0.0004572868347167969, 0.0007212162017822266, 0.0009851455688476562, 0.001249074935913086, 0.0015130043029785156, 0.0017769336700439453, 0.002040863037109375, 0.0023047924041748047, 0.0025687217712402344, 0.002832651138305664, 0.0030965805053710938, 0.0033605098724365234, 0.003624439239501953, 0.003888368606567383, 0.0041522979736328125, 0.004416227340698242, 0.004680156707763672, 0.0049440860748291016, 0.005208015441894531, 0.005471944808959961, 0.005735874176025391, 0.00599980354309082, 0.00626373291015625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 21.0, 25.0, 62.0, 73.0, 132.0, 177.0, 167.0, 149.0, 73.0, 64.0, 34.0, 11.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31661269068717957, -0.2956339716911316, -0.2746552526950836, -0.25367653369903564, -0.23269784450531006, -0.21171912550926208, -0.1907404065132141, -0.16976170241832733, -0.14878298342227936, -0.12780426442623138, -0.1068255603313446, -0.08584684133529663, -0.06486812978982925, -0.04388941824436188, -0.022910699248313904, -0.001931995153427124, 0.01904672384262085, 0.040025435388088226, 0.0610041506588459, 0.08198286592960358, 0.10296157747507095, 0.12394028902053833, 0.1449190080165863, 0.16589771211147308, 0.18687643110752106, 0.20785515010356903, 0.2288338541984558, 0.24981257319450378, 0.27079129219055176, 0.29176998138427734, 0.3127487301826477, 0.3337274193763733, 0.3547061085700989, 0.37568482756614685, 0.3966635465621948, 0.4176422357559204, 0.4386209547519684, 0.45959967374801636, 0.48057839274406433, 0.5015571117401123, 0.5225358009338379, 0.5435144901275635, 0.5644932389259338, 0.5854719281196594, 0.6064506769180298, 0.6274293661117554, 0.648408055305481, 0.6693868041038513, 0.6903655529022217, 0.7113442420959473, 0.7323229908943176, 0.7533016800880432, 0.7742804288864136, 0.7952591180801392, 0.8162378072738647, 0.8372165560722351, 0.8581952452659607, 0.8791739344596863, 0.9001526832580566, 0.9211313724517822, 0.9421101212501526, 0.9630888104438782, 0.9840675592422485, 1.0050462484359741, 1.0260249376296997]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 11.0, 14.0, 15.0, 22.0, 17.0, 19.0, 22.0, 32.0, 30.0, 41.0, 46.0, 57.0, 58.0, 52.0, 59.0, 53.0, 54.0, 58.0, 42.0, 40.0, 39.0, 38.0, 29.0, 29.0, 20.0, 24.0, 18.0, 10.0, 14.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25978797674179077, -0.25141122937202454, -0.2430344671010971, -0.23465770483016968, -0.22628095746040344, -0.2179042100906372, -0.20952744781970978, -0.20115068554878235, -0.1927739381790161, -0.18439719080924988, -0.17602042853832245, -0.16764366626739502, -0.15926691889762878, -0.15089017152786255, -0.14251340925693512, -0.1341366469860077, -0.12575989961624146, -0.11738314479589462, -0.10900638997554779, -0.10062963515520096, -0.09225288033485413, -0.0838761255145073, -0.07549937069416046, -0.06712261587381363, -0.0587458610534668, -0.050369106233119965, -0.04199235141277313, -0.0336155965924263, -0.025238841772079468, -0.016862086951732635, -0.008485332131385803, -0.00010857731103897095, 0.008268177509307861, 0.016644932329654694, 0.025021687150001526, 0.03339844197034836, 0.04177519679069519, 0.05015195161104202, 0.058528706431388855, 0.06690546125173569, 0.07528221607208252, 0.08365897089242935, 0.09203572571277618, 0.10041248053312302, 0.10878923535346985, 0.11716599017381668, 0.1255427449941635, 0.13391950726509094, 0.14229625463485718, 0.1506730020046234, 0.15904976427555084, 0.16742652654647827, 0.1758032739162445, 0.18418002128601074, 0.19255678355693817, 0.2009335458278656, 0.20931029319763184, 0.21768704056739807, 0.2260638028383255, 0.23444056510925293, 0.24281731247901917, 0.2511940598487854, 0.259570837020874, 0.26794758439064026, 0.2763243317604065]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 10.0, 12.0, 7.0, 29.0, 22.0, 40.0, 72.0, 107.0, 171.0, 274.0, 537.0, 1031.0, 2020.0, 4444.0, 10585.0, 29835.0, 117059.0, 681518.0, 144236.0, 34883.0, 11996.0, 4858.0, 2253.0, 1192.0, 601.0, 313.0, 159.0, 98.0, 62.0, 40.0, 28.0, 11.0, 14.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.323760986328125, -0.31109619140625, -0.298431396484375, -0.2857666015625, -0.273101806640625, -0.26043701171875, -0.247772216796875, -0.235107421875, -0.222442626953125, -0.20977783203125, -0.197113037109375, -0.1844482421875, -0.171783447265625, -0.15911865234375, -0.146453857421875, -0.1337890625, -0.121124267578125, -0.10845947265625, -0.095794677734375, -0.0831298828125, -0.070465087890625, -0.05780029296875, -0.045135498046875, -0.032470703125, -0.019805908203125, -0.00714111328125, 0.005523681640625, 0.0181884765625, 0.030853271484375, 0.04351806640625, 0.056182861328125, 0.06884765625, 0.081512451171875, 0.09417724609375, 0.106842041015625, 0.1195068359375, 0.132171630859375, 0.14483642578125, 0.157501220703125, 0.170166015625, 0.182830810546875, 0.19549560546875, 0.208160400390625, 0.2208251953125, 0.233489990234375, 0.24615478515625, 0.258819580078125, 0.271484375, 0.284149169921875, 0.29681396484375, 0.309478759765625, 0.3221435546875, 0.334808349609375, 0.34747314453125, 0.360137939453125, 0.372802734375, 0.385467529296875, 0.39813232421875, 0.410797119140625, 0.4234619140625, 0.436126708984375, 0.44879150390625, 0.461456298828125, 0.47412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 3.0, 11.0, 15.0, 26.0, 34.0, 36.0, 47.0, 56.0, 86.0, 93.0, 82.0, 82.0, 105.0, 68.0, 55.0, 56.0, 43.0, 31.0, 30.0, 14.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.47954559326171875, -0.4556732177734375, -0.43180084228515625, -0.407928466796875, -0.38405609130859375, -0.3601837158203125, -0.33631134033203125, -0.31243896484375, -0.28856658935546875, -0.2646942138671875, -0.24082183837890625, -0.216949462890625, -0.19307708740234375, -0.1692047119140625, -0.14533233642578125, -0.1214599609375, -0.09758758544921875, -0.0737152099609375, -0.04984283447265625, -0.025970458984375, -0.00209808349609375, 0.0217742919921875, 0.04564666748046875, 0.06951904296875, 0.09339141845703125, 0.1172637939453125, 0.14113616943359375, 0.165008544921875, 0.18888092041015625, 0.2127532958984375, 0.23662567138671875, 0.260498046875, 0.28437042236328125, 0.3082427978515625, 0.33211517333984375, 0.355987548828125, 0.37985992431640625, 0.4037322998046875, 0.42760467529296875, 0.45147705078125, 0.47534942626953125, 0.4992218017578125, 0.5230941772460938, 0.546966552734375, 0.5708389282226562, 0.5947113037109375, 0.6185836791992188, 0.6424560546875, 0.6663284301757812, 0.6902008056640625, 0.7140731811523438, 0.737945556640625, 0.7618179321289062, 0.7856903076171875, 0.8095626831054688, 0.83343505859375, 0.8573074340820312, 0.8811798095703125, 0.9050521850585938, 0.928924560546875, 0.9527969360351562, 0.9766693115234375, 1.0005416870117188, 1.0244140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 13.0, 10.0, 13.0, 17.0, 17.0, 25.0, 39.0, 40.0, 63.0, 93.0, 136.0, 251.0, 555.0, 1896.0, 11908.0, 184246.0, 818668.0, 25520.0, 3351.0, 826.0, 304.0, 145.0, 112.0, 74.0, 38.0, 42.0, 31.0, 28.0, 14.0, 20.0, 4.0, 10.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.762481689453125, -0.73541259765625, -0.708343505859375, -0.6812744140625, -0.654205322265625, -0.62713623046875, -0.600067138671875, -0.572998046875, -0.545928955078125, -0.51885986328125, -0.491790771484375, -0.4647216796875, -0.437652587890625, -0.41058349609375, -0.383514404296875, -0.3564453125, -0.329376220703125, -0.30230712890625, -0.275238037109375, -0.2481689453125, -0.221099853515625, -0.19403076171875, -0.166961669921875, -0.139892578125, -0.112823486328125, -0.08575439453125, -0.058685302734375, -0.0316162109375, -0.004547119140625, 0.02252197265625, 0.049591064453125, 0.07666015625, 0.103729248046875, 0.13079833984375, 0.157867431640625, 0.1849365234375, 0.212005615234375, 0.23907470703125, 0.266143798828125, 0.293212890625, 0.320281982421875, 0.34735107421875, 0.374420166015625, 0.4014892578125, 0.428558349609375, 0.45562744140625, 0.482696533203125, 0.509765625, 0.536834716796875, 0.56390380859375, 0.590972900390625, 0.6180419921875, 0.645111083984375, 0.67218017578125, 0.699249267578125, 0.726318359375, 0.753387451171875, 0.78045654296875, 0.807525634765625, 0.8345947265625, 0.861663818359375, 0.88873291015625, 0.915802001953125, 0.94287109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 7.0, 12.0, 10.0, 14.0, 19.0, 21.0, 23.0, 29.0, 36.0, 31.0, 43.0, 58.0, 47.0, 43.0, 46.0, 53.0, 50.0, 52.0, 39.0, 46.0, 47.0, 41.0, 38.0, 23.0, 26.0, 19.0, 18.0, 19.0, 13.0, 12.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.51116943359375, -0.4945068359375, -0.47784423828125, -0.461181640625, -0.44451904296875, -0.4278564453125, -0.41119384765625, -0.39453125, -0.37786865234375, -0.3612060546875, -0.34454345703125, -0.327880859375, -0.31121826171875, -0.2945556640625, -0.27789306640625, -0.26123046875, -0.24456787109375, -0.2279052734375, -0.21124267578125, -0.194580078125, -0.17791748046875, -0.1612548828125, -0.14459228515625, -0.1279296875, -0.11126708984375, -0.0946044921875, -0.07794189453125, -0.061279296875, -0.04461669921875, -0.0279541015625, -0.01129150390625, 0.00537109375, 0.02203369140625, 0.0386962890625, 0.05535888671875, 0.072021484375, 0.08868408203125, 0.1053466796875, 0.12200927734375, 0.138671875, 0.15533447265625, 0.1719970703125, 0.18865966796875, 0.205322265625, 0.22198486328125, 0.2386474609375, 0.25531005859375, 0.27197265625, 0.28863525390625, 0.3052978515625, 0.32196044921875, 0.338623046875, 0.35528564453125, 0.3719482421875, 0.38861083984375, 0.4052734375, 0.42193603515625, 0.4385986328125, 0.45526123046875, 0.471923828125, 0.48858642578125, 0.5052490234375, 0.52191162109375, 0.53857421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 27.0, 29.0, 40.0, 110.0, 185.0, 367.0, 1112.0, 4477.0, 34412.0, 875485.0, 119417.0, 9939.0, 1885.0, 528.0, 237.0, 123.0, 49.0, 42.0, 27.0, 13.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2010498046875, -0.1929149627685547, -0.18478012084960938, -0.17664527893066406, -0.16851043701171875, -0.16037559509277344, -0.15224075317382812, -0.1441059112548828, -0.1359710693359375, -0.1278362274169922, -0.11970138549804688, -0.11156654357910156, -0.10343170166015625, -0.09529685974121094, -0.08716201782226562, -0.07902717590332031, -0.070892333984375, -0.06275749206542969, -0.054622650146484375, -0.04648780822753906, -0.03835296630859375, -0.030218124389648438, -0.022083282470703125, -0.013948440551757812, -0.0058135986328125, 0.0023212432861328125, 0.010456085205078125, 0.018590927124023438, 0.02672576904296875, 0.03486061096191406, 0.042995452880859375, 0.05113029479980469, 0.05926513671875, 0.06739997863769531, 0.07553482055664062, 0.08366966247558594, 0.09180450439453125, 0.09993934631347656, 0.10807418823242188, 0.11620903015136719, 0.1243438720703125, 0.1324787139892578, 0.14061355590820312, 0.14874839782714844, 0.15688323974609375, 0.16501808166503906, 0.17315292358398438, 0.1812877655029297, 0.189422607421875, 0.1975574493408203, 0.20569229125976562, 0.21382713317871094, 0.22196197509765625, 0.23009681701660156, 0.23823165893554688, 0.2463665008544922, 0.2545013427734375, 0.2626361846923828, 0.2707710266113281, 0.27890586853027344, 0.28704071044921875, 0.29517555236816406, 0.3033103942871094, 0.3114452362060547, 0.319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 8.0, 7.0, 12.0, 25.0, 26.0, 45.0, 66.0, 140.0, 254.0, 167.0, 77.0, 42.0, 46.0, 25.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3558735847473145e-05, -2.256035804748535e-05, -2.156198024749756e-05, -2.0563602447509766e-05, -1.9565224647521973e-05, -1.856684684753418e-05, -1.7568469047546387e-05, -1.6570091247558594e-05, -1.55717134475708e-05, -1.4573335647583008e-05, -1.3574957847595215e-05, -1.2576580047607422e-05, -1.1578202247619629e-05, -1.0579824447631836e-05, -9.581446647644043e-06, -8.58306884765625e-06, -7.584691047668457e-06, -6.586313247680664e-06, -5.587935447692871e-06, -4.589557647705078e-06, -3.591179847717285e-06, -2.592802047729492e-06, -1.5944242477416992e-06, -5.960464477539062e-07, 4.023313522338867e-07, 1.4007091522216797e-06, 2.3990869522094727e-06, 3.3974647521972656e-06, 4.395842552185059e-06, 5.3942203521728516e-06, 6.3925981521606445e-06, 7.3909759521484375e-06, 8.38935375213623e-06, 9.387731552124023e-06, 1.0386109352111816e-05, 1.138448715209961e-05, 1.2382864952087402e-05, 1.3381242752075195e-05, 1.4379620552062988e-05, 1.537799835205078e-05, 1.6376376152038574e-05, 1.7374753952026367e-05, 1.837313175201416e-05, 1.9371509552001953e-05, 2.0369887351989746e-05, 2.136826515197754e-05, 2.2366642951965332e-05, 2.3365020751953125e-05, 2.4363398551940918e-05, 2.536177635192871e-05, 2.6360154151916504e-05, 2.7358531951904297e-05, 2.835690975189209e-05, 2.9355287551879883e-05, 3.0353665351867676e-05, 3.135204315185547e-05, 3.235042095184326e-05, 3.3348798751831055e-05, 3.434717655181885e-05, 3.534555435180664e-05, 3.6343932151794434e-05, 3.7342309951782227e-05, 3.834068775177002e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 16.0, 23.0, 36.0, 73.0, 100.0, 194.0, 336.0, 721.0, 1865.0, 8157.0, 85213.0, 884771.0, 57695.0, 6366.0, 1583.0, 634.0, 304.0, 186.0, 95.0, 59.0, 42.0, 23.0, 10.0, 9.0, 2.0, 10.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.3154296875, -0.3074302673339844, -0.29943084716796875, -0.2914314270019531, -0.2834320068359375, -0.2754325866699219, -0.26743316650390625, -0.2594337463378906, -0.251434326171875, -0.24343490600585938, -0.23543548583984375, -0.22743606567382812, -0.2194366455078125, -0.21143722534179688, -0.20343780517578125, -0.19543838500976562, -0.18743896484375, -0.17943954467773438, -0.17144012451171875, -0.16344070434570312, -0.1554412841796875, -0.14744186401367188, -0.13944244384765625, -0.13144302368164062, -0.123443603515625, -0.11544418334960938, -0.10744476318359375, -0.09944534301757812, -0.0914459228515625, -0.08344650268554688, -0.07544708251953125, -0.06744766235351562, -0.0594482421875, -0.051448822021484375, -0.04344940185546875, -0.035449981689453125, -0.0274505615234375, -0.019451141357421875, -0.01145172119140625, -0.003452301025390625, 0.004547119140625, 0.012546539306640625, 0.02054595947265625, 0.028545379638671875, 0.0365447998046875, 0.044544219970703125, 0.05254364013671875, 0.060543060302734375, 0.06854248046875, 0.07654190063476562, 0.08454132080078125, 0.09254074096679688, 0.1005401611328125, 0.10853958129882812, 0.11653900146484375, 0.12453842163085938, 0.132537841796875, 0.14053726196289062, 0.14853668212890625, 0.15653610229492188, 0.1645355224609375, 0.17253494262695312, 0.18053436279296875, 0.18853378295898438, 0.196533203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 2.0, 13.0, 13.0, 11.0, 9.0, 28.0, 18.0, 30.0, 35.0, 56.0, 71.0, 158.0, 193.0, 97.0, 55.0, 39.0, 27.0, 34.0, 24.0, 19.0, 14.0, 11.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045318603515625, -0.04343843460083008, -0.041558265686035156, -0.039678096771240234, -0.03779792785644531, -0.03591775894165039, -0.03403759002685547, -0.03215742111206055, -0.030277252197265625, -0.028397083282470703, -0.02651691436767578, -0.02463674545288086, -0.022756576538085938, -0.020876407623291016, -0.018996238708496094, -0.017116069793701172, -0.01523590087890625, -0.013355731964111328, -0.011475563049316406, -0.009595394134521484, -0.0077152252197265625, -0.005835056304931641, -0.003954887390136719, -0.002074718475341797, -0.000194549560546875, 0.0016856193542480469, 0.0035657882690429688, 0.005445957183837891, 0.0073261260986328125, 0.009206295013427734, 0.011086463928222656, 0.012966632843017578, 0.0148468017578125, 0.016726970672607422, 0.018607139587402344, 0.020487308502197266, 0.022367477416992188, 0.02424764633178711, 0.02612781524658203, 0.028007984161376953, 0.029888153076171875, 0.0317683219909668, 0.03364849090576172, 0.03552865982055664, 0.03740882873535156, 0.039288997650146484, 0.041169166564941406, 0.04304933547973633, 0.04492950439453125, 0.04680967330932617, 0.048689842224121094, 0.050570011138916016, 0.05245018005371094, 0.05433034896850586, 0.05621051788330078, 0.0580906867980957, 0.059970855712890625, 0.06185102462768555, 0.06373119354248047, 0.06561136245727539, 0.06749153137207031, 0.06937170028686523, 0.07125186920166016, 0.07313203811645508, 0.07501220703125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 24.0, 52.0, 161.0, 318.0, 259.0, 132.0, 35.0, 19.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35728853940963745, -0.2844151258468628, -0.21154168248176575, -0.1386682540178299, -0.06579482555389404, 0.007078588008880615, 0.07995203137397766, 0.1528254747390747, 0.22569888830184937, 0.298572301864624, 0.37144574522972107, 0.4443191885948181, 0.5171926021575928, 0.5900660157203674, 0.6629394292831421, 0.7358129024505615, 0.8086863160133362, 0.8815597295761108, 0.9544332027435303, 1.0273065567016602, 1.1001800298690796, 1.173053503036499, 1.245926856994629, 1.3188003301620483, 1.3916738033294678, 1.4645472764968872, 1.537420630455017, 1.6102941036224365, 1.6831674575805664, 1.7560409307479858, 1.8289144039154053, 1.9017877578735352, 1.9746613502502441, 2.047534704208374, 2.120408296585083, 2.193281650543213, 2.2661550045013428, 2.3390283584594727, 2.4119019508361816, 2.4847753047943115, 2.5576486587524414, 2.6305220127105713, 2.7033956050872803, 2.77626895904541, 2.84914231300354, 2.92201566696167, 2.994889259338379, 3.067762613296509, 3.1406362056732178, 3.2135095596313477, 3.2863831520080566, 3.3592565059661865, 3.4321298599243164, 3.5050034523010254, 3.5778768062591553, 3.650750160217285, 3.723623752593994, 3.796497106552124, 3.869370698928833, 3.942244052886963, 4.015117645263672, 4.087990760803223, 4.160864353179932, 4.233737945556641, 4.306611061096191]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 26.0, 19.0, 20.0, 26.0, 27.0, 28.0, 34.0, 37.0, 41.0, 39.0, 50.0, 48.0, 42.0, 48.0, 55.0, 46.0, 49.0, 50.0, 33.0, 36.0, 25.0, 28.0, 35.0, 20.0, 21.0, 11.0, 13.0, 9.0, 13.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7250390648841858, -0.6977466344833374, -0.6704542636871338, -0.6431618332862854, -0.615869402885437, -0.5885770320892334, -0.561284601688385, -0.5339921712875366, -0.506699800491333, -0.479407399892807, -0.452114999294281, -0.4248225688934326, -0.3975301682949066, -0.3702377676963806, -0.3429453372955322, -0.3156529366970062, -0.2883605360984802, -0.2610681354999542, -0.23377572000026703, -0.20648330450057983, -0.17919090390205383, -0.15189850330352783, -0.12460608780384064, -0.09731367230415344, -0.07002127170562744, -0.042728863656520844, -0.015436455607414246, 0.011855952441692352, 0.03914836049079895, 0.06644076108932495, 0.09373317658901215, 0.12102559208869934, 0.14831793308258057, 0.17561033368110657, 0.20290274918079376, 0.23019516468048096, 0.25748756527900696, 0.28477996587753296, 0.31207239627838135, 0.33936479687690735, 0.36665719747543335, 0.39394959807395935, 0.42124199867248535, 0.44853442907333374, 0.47582682967185974, 0.5031192302703857, 0.5304116606712341, 0.5577040910720825, 0.5849964618682861, 0.6122888922691345, 0.6395812630653381, 0.6668736934661865, 0.6941660642623901, 0.7214584946632385, 0.7487509250640869, 0.7760432958602905, 0.8033357262611389, 0.8306281566619873, 0.8579205274581909, 0.8852129578590393, 0.9125053882598877, 0.9397977590560913, 0.9670901894569397, 0.9943826198577881, 1.0216749906539917]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 25.0, 36.0, 85.0, 139.0, 288.0, 584.0, 1489.0, 5168.0, 28102.0, 814403.0, 3238712.0, 90786.0, 10295.0, 2447.0, 921.0, 378.0, 193.0, 90.0, 50.0, 29.0, 15.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.8034515380859375, -0.779266357421875, -0.7550811767578125, -0.73089599609375, -0.7067108154296875, -0.682525634765625, -0.6583404541015625, -0.6341552734375, -0.6099700927734375, -0.585784912109375, -0.5615997314453125, -0.53741455078125, -0.5132293701171875, -0.489044189453125, -0.4648590087890625, -0.440673828125, -0.4164886474609375, -0.392303466796875, -0.3681182861328125, -0.34393310546875, -0.3197479248046875, -0.295562744140625, -0.2713775634765625, -0.2471923828125, -0.2230072021484375, -0.198822021484375, -0.1746368408203125, -0.15045166015625, -0.1262664794921875, -0.102081298828125, -0.0778961181640625, -0.0537109375, -0.0295257568359375, -0.005340576171875, 0.0188446044921875, 0.04302978515625, 0.0672149658203125, 0.091400146484375, 0.1155853271484375, 0.1397705078125, 0.1639556884765625, 0.188140869140625, 0.2123260498046875, 0.23651123046875, 0.2606964111328125, 0.284881591796875, 0.3090667724609375, 0.333251953125, 0.3574371337890625, 0.381622314453125, 0.4058074951171875, 0.42999267578125, 0.4541778564453125, 0.478363037109375, 0.5025482177734375, 0.5267333984375, 0.5509185791015625, 0.575103759765625, 0.5992889404296875, 0.62347412109375, 0.6476593017578125, 0.671844482421875, 0.6960296630859375, 0.72021484375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 2.0, 11.0, 15.0, 14.0, 16.0, 15.0, 18.0, 26.0, 27.0, 24.0, 31.0, 44.0, 41.0, 46.0, 37.0, 50.0, 47.0, 42.0, 42.0, 41.0, 43.0, 52.0, 39.0, 30.0, 33.0, 30.0, 26.0, 25.0, 13.0, 19.0, 14.0, 16.0, 8.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.252197265625, -0.24477386474609375, -0.2373504638671875, -0.22992706298828125, -0.222503662109375, -0.21508026123046875, -0.2076568603515625, -0.20023345947265625, -0.19281005859375, -0.18538665771484375, -0.1779632568359375, -0.17053985595703125, -0.163116455078125, -0.15569305419921875, -0.1482696533203125, -0.14084625244140625, -0.1334228515625, -0.12599945068359375, -0.1185760498046875, -0.11115264892578125, -0.103729248046875, -0.09630584716796875, -0.0888824462890625, -0.08145904541015625, -0.07403564453125, -0.06661224365234375, -0.0591888427734375, -0.05176544189453125, -0.044342041015625, -0.03691864013671875, -0.0294952392578125, -0.02207183837890625, -0.0146484375, -0.00722503662109375, 0.0001983642578125, 0.00762176513671875, 0.015045166015625, 0.02246856689453125, 0.0298919677734375, 0.03731536865234375, 0.04473876953125, 0.05216217041015625, 0.0595855712890625, 0.06700897216796875, 0.074432373046875, 0.08185577392578125, 0.0892791748046875, 0.09670257568359375, 0.1041259765625, 0.11154937744140625, 0.1189727783203125, 0.12639617919921875, 0.133819580078125, 0.14124298095703125, 0.1486663818359375, 0.15608978271484375, 0.16351318359375, 0.17093658447265625, 0.1783599853515625, 0.18578338623046875, 0.193206787109375, 0.20063018798828125, 0.2080535888671875, 0.21547698974609375, 0.222900390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 11.0, 11.0, 9.0, 27.0, 44.0, 45.0, 75.0, 205.0, 503.0, 1676.0, 9685.0, 293513.0, 3848566.0, 34818.0, 3592.0, 872.0, 307.0, 153.0, 65.0, 36.0, 16.0, 14.0, 7.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.26171875, -1.2237701416015625, -1.185821533203125, -1.1478729248046875, -1.10992431640625, -1.0719757080078125, -1.034027099609375, -0.9960784912109375, -0.9581298828125, -0.9201812744140625, -0.882232666015625, -0.8442840576171875, -0.80633544921875, -0.7683868408203125, -0.730438232421875, -0.6924896240234375, -0.654541015625, -0.6165924072265625, -0.578643798828125, -0.5406951904296875, -0.50274658203125, -0.4647979736328125, -0.426849365234375, -0.3889007568359375, -0.3509521484375, -0.3130035400390625, -0.275054931640625, -0.2371063232421875, -0.19915771484375, -0.1612091064453125, -0.123260498046875, -0.0853118896484375, -0.04736328125, -0.0094146728515625, 0.028533935546875, 0.0664825439453125, 0.10443115234375, 0.1423797607421875, 0.180328369140625, 0.2182769775390625, 0.2562255859375, 0.2941741943359375, 0.332122802734375, 0.3700714111328125, 0.40802001953125, 0.4459686279296875, 0.483917236328125, 0.5218658447265625, 0.559814453125, 0.5977630615234375, 0.635711669921875, 0.6736602783203125, 0.71160888671875, 0.7495574951171875, 0.787506103515625, 0.8254547119140625, 0.8634033203125, 0.9013519287109375, 0.939300537109375, 0.9772491455078125, 1.01519775390625, 1.0531463623046875, 1.091094970703125, 1.1290435791015625, 1.1669921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 11.0, 13.0, 15.0, 28.0, 27.0, 55.0, 90.0, 142.0, 264.0, 423.0, 595.0, 759.0, 619.0, 358.0, 231.0, 134.0, 89.0, 50.0, 33.0, 39.0, 14.0, 7.0, 10.0, 8.0, 10.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14686012268066406, -0.14186477661132812, -0.1368694305419922, -0.13187408447265625, -0.1268787384033203, -0.12188339233398438, -0.11688804626464844, -0.1118927001953125, -0.10689735412597656, -0.10190200805664062, -0.09690666198730469, -0.09191131591796875, -0.08691596984863281, -0.08192062377929688, -0.07692527770996094, -0.071929931640625, -0.06693458557128906, -0.061939239501953125, -0.05694389343261719, -0.05194854736328125, -0.04695320129394531, -0.041957855224609375, -0.03696250915527344, -0.0319671630859375, -0.026971817016601562, -0.021976470947265625, -0.016981124877929688, -0.01198577880859375, -0.0069904327392578125, -0.001995086669921875, 0.0030002593994140625, 0.00799560546875, 0.012990951538085938, 0.017986297607421875, 0.022981643676757812, 0.02797698974609375, 0.03297233581542969, 0.037967681884765625, 0.04296302795410156, 0.0479583740234375, 0.05295372009277344, 0.057949066162109375, 0.06294441223144531, 0.06793975830078125, 0.07293510437011719, 0.07793045043945312, 0.08292579650878906, 0.087921142578125, 0.09291648864746094, 0.09791183471679688, 0.10290718078613281, 0.10790252685546875, 0.11289787292480469, 0.11789321899414062, 0.12288856506347656, 0.1278839111328125, 0.13287925720214844, 0.13787460327148438, 0.1428699493408203, 0.14786529541015625, 0.1528606414794922, 0.15785598754882812, 0.16285133361816406, 0.1678466796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 6.0, 11.0, 3.0, 16.0, 12.0, 22.0, 24.0, 31.0, 34.0, 36.0, 44.0, 58.0, 75.0, 65.0, 75.0, 55.0, 75.0, 59.0, 68.0, 34.0, 38.0, 31.0, 28.0, 30.0, 20.0, 10.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.5012553334236145, -0.48900681734085083, -0.47675830125808716, -0.4645098149776459, -0.4522612988948822, -0.44001278281211853, -0.42776426672935486, -0.4155157804489136, -0.4032672643661499, -0.39101874828338623, -0.37877023220062256, -0.3665217459201813, -0.3542732298374176, -0.34202471375465393, -0.32977619767189026, -0.317527711391449, -0.3052791953086853, -0.29303067922592163, -0.28078216314315796, -0.2685336768627167, -0.256285160779953, -0.24403664469718933, -0.23178812861442566, -0.21953962743282318, -0.20729109644889832, -0.19504258036613464, -0.18279407918453217, -0.1705455631017685, -0.15829706192016602, -0.14604854583740234, -0.13380002975463867, -0.1215515285730362, -0.10930302739143372, -0.09705451875925064, -0.08480601012706757, -0.0725574940443039, -0.06030898913741112, -0.04806048050522804, -0.03581196814775467, -0.023563459515571594, -0.01131495088338852, 0.0009335586801171303, 0.01318206824362278, 0.025430578738451004, 0.03767908737063408, 0.049927596002817154, 0.06217610836029053, 0.0744246169924736, 0.08667312562465668, 0.09892163425683975, 0.11117014288902283, 0.1234186589717865, 0.13566716015338898, 0.14791567623615265, 0.16016417741775513, 0.1724126935005188, 0.18466120958328247, 0.19690972566604614, 0.20915822684764862, 0.2214067429304123, 0.23365524411201477, 0.24590376019477844, 0.2581522762775421, 0.2704007625579834, 0.28264927864074707]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 16.0, 20.0, 28.0, 20.0, 20.0, 34.0, 41.0, 32.0, 36.0, 30.0, 39.0, 35.0, 45.0, 42.0, 40.0, 41.0, 40.0, 39.0, 28.0, 38.0, 26.0, 34.0, 26.0, 25.0, 18.0, 24.0, 14.0, 10.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29343488812446594, -0.28508466482162476, -0.27673447132110596, -0.26838427782058716, -0.26003405451774597, -0.2516838312149048, -0.243333637714386, -0.234983429312706, -0.226633220911026, -0.218283012509346, -0.20993280410766602, -0.20158259570598602, -0.19323238730430603, -0.18488217890262604, -0.17653197050094604, -0.16818176209926605, -0.15983155369758606, -0.15148134529590607, -0.14313113689422607, -0.13478092849254608, -0.1264307200908661, -0.1180805116891861, -0.1097303032875061, -0.10138009488582611, -0.09302988648414612, -0.08467967808246613, -0.07632946968078613, -0.06797926127910614, -0.05962905287742615, -0.051278844475746155, -0.04292863607406616, -0.03457842767238617, -0.02622818946838379, -0.017877981066703796, -0.009527772665023804, -0.001177564263343811, 0.007172644138336182, 0.015522852540016174, 0.023873060941696167, 0.03222326934337616, 0.04057347774505615, 0.048923686146736145, 0.05727389454841614, 0.06562410295009613, 0.07397431135177612, 0.08232451975345612, 0.09067472815513611, 0.0990249365568161, 0.1073751449584961, 0.11572535336017609, 0.12407556176185608, 0.13242577016353607, 0.14077597856521606, 0.14912618696689606, 0.15747639536857605, 0.16582660377025604, 0.17417681217193604, 0.18252702057361603, 0.19087722897529602, 0.199227437376976, 0.207577645778656, 0.215927854180336, 0.224278062582016, 0.23262827098369598, 0.24097847938537598]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 10.0, 7.0, 22.0, 33.0, 59.0, 86.0, 113.0, 179.0, 271.0, 411.0, 664.0, 1044.0, 1578.0, 2627.0, 4698.0, 8145.0, 16173.0, 46722.0, 231198.0, 534816.0, 137593.0, 32196.0, 12892.0, 6733.0, 3944.0, 2360.0, 1484.0, 906.0, 571.0, 343.0, 218.0, 145.0, 79.0, 80.0, 54.0, 22.0, 14.0, 17.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12066650390625, -0.11704826354980469, -0.11343002319335938, -0.10981178283691406, -0.10619354248046875, -0.10257530212402344, -0.09895706176757812, -0.09533882141113281, -0.0917205810546875, -0.08810234069824219, -0.08448410034179688, -0.08086585998535156, -0.07724761962890625, -0.07362937927246094, -0.07001113891601562, -0.06639289855957031, -0.062774658203125, -0.05915641784667969, -0.055538177490234375, -0.05191993713378906, -0.04830169677734375, -0.04468345642089844, -0.041065216064453125, -0.03744697570800781, -0.0338287353515625, -0.030210494995117188, -0.026592254638671875, -0.022974014282226562, -0.01935577392578125, -0.015737533569335938, -0.012119293212890625, -0.008501052856445312, -0.0048828125, -0.0012645721435546875, 0.002353668212890625, 0.0059719085693359375, 0.00959014892578125, 0.013208389282226562, 0.016826629638671875, 0.020444869995117188, 0.0240631103515625, 0.027681350708007812, 0.031299591064453125, 0.03491783142089844, 0.03853607177734375, 0.04215431213378906, 0.045772552490234375, 0.04939079284667969, 0.053009033203125, 0.05662727355957031, 0.060245513916015625, 0.06386375427246094, 0.06748199462890625, 0.07110023498535156, 0.07471847534179688, 0.07833671569824219, 0.0819549560546875, 0.08557319641113281, 0.08919143676757812, 0.09280967712402344, 0.09642791748046875, 0.10004615783691406, 0.10366439819335938, 0.10728263854980469, 0.11090087890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 14.0, 15.0, 13.0, 19.0, 30.0, 20.0, 38.0, 42.0, 32.0, 33.0, 33.0, 38.0, 53.0, 35.0, 42.0, 46.0, 38.0, 43.0, 50.0, 39.0, 39.0, 31.0, 35.0, 28.0, 18.0, 16.0, 17.0, 15.0, 15.0, 12.0, 7.0, 10.0, 8.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.17919921875, -0.17395401000976562, -0.16870880126953125, -0.16346359252929688, -0.1582183837890625, -0.15297317504882812, -0.14772796630859375, -0.14248275756835938, -0.137237548828125, -0.13199234008789062, -0.12674713134765625, -0.12150192260742188, -0.1162567138671875, -0.11101150512695312, -0.10576629638671875, -0.10052108764648438, -0.09527587890625, -0.09003067016601562, -0.08478546142578125, -0.07954025268554688, -0.0742950439453125, -0.06904983520507812, -0.06380462646484375, -0.058559417724609375, -0.053314208984375, -0.048069000244140625, -0.04282379150390625, -0.037578582763671875, -0.0323333740234375, -0.027088165283203125, -0.02184295654296875, -0.016597747802734375, -0.0113525390625, -0.006107330322265625, -0.00086212158203125, 0.004383087158203125, 0.0096282958984375, 0.014873504638671875, 0.02011871337890625, 0.025363922119140625, 0.030609130859375, 0.035854339599609375, 0.04109954833984375, 0.046344757080078125, 0.0515899658203125, 0.056835174560546875, 0.06208038330078125, 0.06732559204101562, 0.07257080078125, 0.07781600952148438, 0.08306121826171875, 0.08830642700195312, 0.0935516357421875, 0.09879684448242188, 0.10404205322265625, 0.10928726196289062, 0.114532470703125, 0.11977767944335938, 0.12502288818359375, 0.13026809692382812, 0.1355133056640625, 0.14075851440429688, 0.14600372314453125, 0.15124893188476562, 0.156494140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 7.0, 16.0, 35.0, 31.0, 51.0, 60.0, 113.0, 166.0, 309.0, 462.0, 793.0, 1533.0, 3271.0, 7348.0, 19212.0, 68785.0, 321895.0, 458665.0, 118339.0, 28540.0, 10060.0, 4314.0, 1988.0, 1082.0, 604.0, 310.0, 191.0, 137.0, 75.0, 40.0, 29.0, 24.0, 13.0, 10.0, 4.0, 6.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08935546875, -0.08681488037109375, -0.0842742919921875, -0.08173370361328125, -0.079193115234375, -0.07665252685546875, -0.0741119384765625, -0.07157135009765625, -0.06903076171875, -0.06649017333984375, -0.0639495849609375, -0.06140899658203125, -0.058868408203125, -0.05632781982421875, -0.0537872314453125, -0.05124664306640625, -0.0487060546875, -0.04616546630859375, -0.0436248779296875, -0.04108428955078125, -0.038543701171875, -0.03600311279296875, -0.0334625244140625, -0.03092193603515625, -0.02838134765625, -0.02584075927734375, -0.0233001708984375, -0.02075958251953125, -0.018218994140625, -0.01567840576171875, -0.0131378173828125, -0.01059722900390625, -0.008056640625, -0.00551605224609375, -0.0029754638671875, -0.00043487548828125, 0.002105712890625, 0.00464630126953125, 0.0071868896484375, 0.00972747802734375, 0.01226806640625, 0.01480865478515625, 0.0173492431640625, 0.01988983154296875, 0.022430419921875, 0.02497100830078125, 0.0275115966796875, 0.03005218505859375, 0.0325927734375, 0.03513336181640625, 0.0376739501953125, 0.04021453857421875, 0.042755126953125, 0.04529571533203125, 0.0478363037109375, 0.05037689208984375, 0.05291748046875, 0.05545806884765625, 0.0579986572265625, 0.06053924560546875, 0.063079833984375, 0.06562042236328125, 0.0681610107421875, 0.07070159912109375, 0.0732421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 15.0, 9.0, 16.0, 22.0, 17.0, 17.0, 19.0, 25.0, 21.0, 27.0, 28.0, 26.0, 40.0, 30.0, 33.0, 29.0, 41.0, 45.0, 40.0, 49.0, 40.0, 41.0, 39.0, 37.0, 35.0, 42.0, 28.0, 22.0, 21.0, 16.0, 14.0, 11.0, 12.0, 11.0, 16.0, 7.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2958984375, -0.286376953125, -0.27685546875, -0.267333984375, -0.2578125, -0.248291015625, -0.23876953125, -0.229248046875, -0.2197265625, -0.210205078125, -0.20068359375, -0.191162109375, -0.181640625, -0.172119140625, -0.16259765625, -0.153076171875, -0.1435546875, -0.134033203125, -0.12451171875, -0.114990234375, -0.10546875, -0.095947265625, -0.08642578125, -0.076904296875, -0.0673828125, -0.057861328125, -0.04833984375, -0.038818359375, -0.029296875, -0.019775390625, -0.01025390625, -0.000732421875, 0.0087890625, 0.018310546875, 0.02783203125, 0.037353515625, 0.046875, 0.056396484375, 0.06591796875, 0.075439453125, 0.0849609375, 0.094482421875, 0.10400390625, 0.113525390625, 0.123046875, 0.132568359375, 0.14208984375, 0.151611328125, 0.1611328125, 0.170654296875, 0.18017578125, 0.189697265625, 0.19921875, 0.208740234375, 0.21826171875, 0.227783203125, 0.2373046875, 0.246826171875, 0.25634765625, 0.265869140625, 0.275390625, 0.284912109375, 0.29443359375, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 6.0, 11.0, 15.0, 37.0, 66.0, 107.0, 163.0, 293.0, 562.0, 1007.0, 2300.0, 5793.0, 16660.0, 61985.0, 278616.0, 490884.0, 140168.0, 32768.0, 10007.0, 3814.0, 1602.0, 762.0, 358.0, 202.0, 132.0, 82.0, 49.0, 27.0, 20.0, 15.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0234375, -0.022608518600463867, -0.021779537200927734, -0.0209505558013916, -0.02012157440185547, -0.019292593002319336, -0.018463611602783203, -0.01763463020324707, -0.016805648803710938, -0.015976667404174805, -0.015147686004638672, -0.014318704605102539, -0.013489723205566406, -0.012660741806030273, -0.01183176040649414, -0.011002779006958008, -0.010173797607421875, -0.009344816207885742, -0.00851583480834961, -0.0076868534088134766, -0.006857872009277344, -0.006028890609741211, -0.005199909210205078, -0.004370927810668945, -0.0035419464111328125, -0.0027129650115966797, -0.0018839836120605469, -0.001055002212524414, -0.00022602081298828125, 0.0006029605865478516, 0.0014319419860839844, 0.002260923385620117, 0.00308990478515625, 0.003918886184692383, 0.004747867584228516, 0.0055768489837646484, 0.006405830383300781, 0.007234811782836914, 0.008063793182373047, 0.00889277458190918, 0.009721755981445312, 0.010550737380981445, 0.011379718780517578, 0.012208700180053711, 0.013037681579589844, 0.013866662979125977, 0.01469564437866211, 0.015524625778198242, 0.016353607177734375, 0.017182588577270508, 0.01801156997680664, 0.018840551376342773, 0.019669532775878906, 0.02049851417541504, 0.021327495574951172, 0.022156476974487305, 0.022985458374023438, 0.02381443977355957, 0.024643421173095703, 0.025472402572631836, 0.02630138397216797, 0.0271303653717041, 0.027959346771240234, 0.028788328170776367, 0.0296173095703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 4.0, 4.0, 11.0, 2.0, 10.0, 6.0, 16.0, 24.0, 24.0, 29.0, 45.0, 55.0, 61.0, 81.0, 93.0, 71.0, 76.0, 72.0, 73.0, 62.0, 35.0, 32.0, 33.0, 18.0, 9.0, 15.0, 12.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2025237083435059e-05, -1.1533498764038086e-05, -1.1041760444641113e-05, -1.055002212524414e-05, -1.0058283805847168e-05, -9.566545486450195e-06, -9.074807167053223e-06, -8.58306884765625e-06, -8.091330528259277e-06, -7.599592208862305e-06, -7.107853889465332e-06, -6.616115570068359e-06, -6.124377250671387e-06, -5.632638931274414e-06, -5.140900611877441e-06, -4.649162292480469e-06, -4.157423973083496e-06, -3.6656856536865234e-06, -3.1739473342895508e-06, -2.682209014892578e-06, -2.1904706954956055e-06, -1.6987323760986328e-06, -1.2069940567016602e-06, -7.152557373046875e-07, -2.2351741790771484e-07, 2.682209014892578e-07, 7.599592208862305e-07, 1.2516975402832031e-06, 1.7434358596801758e-06, 2.2351741790771484e-06, 2.726912498474121e-06, 3.2186508178710938e-06, 3.7103891372680664e-06, 4.202127456665039e-06, 4.693865776062012e-06, 5.185604095458984e-06, 5.677342414855957e-06, 6.16908073425293e-06, 6.660819053649902e-06, 7.152557373046875e-06, 7.644295692443848e-06, 8.13603401184082e-06, 8.627772331237793e-06, 9.119510650634766e-06, 9.611248970031738e-06, 1.0102987289428711e-05, 1.0594725608825684e-05, 1.1086463928222656e-05, 1.1578202247619629e-05, 1.2069940567016602e-05, 1.2561678886413574e-05, 1.3053417205810547e-05, 1.354515552520752e-05, 1.4036893844604492e-05, 1.4528632164001465e-05, 1.5020370483398438e-05, 1.551210880279541e-05, 1.6003847122192383e-05, 1.6495585441589355e-05, 1.6987323760986328e-05, 1.74790620803833e-05, 1.7970800399780273e-05, 1.8462538719177246e-05, 1.895427703857422e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 11.0, 10.0, 12.0, 12.0, 29.0, 29.0, 52.0, 65.0, 95.0, 138.0, 209.0, 318.0, 564.0, 882.0, 1543.0, 2682.0, 4897.0, 9906.0, 21999.0, 51450.0, 131740.0, 299048.0, 298017.0, 130078.0, 51141.0, 21825.0, 9991.0, 5013.0, 2737.0, 1530.0, 951.0, 543.0, 322.0, 227.0, 146.0, 100.0, 66.0, 45.0, 29.0, 33.0, 18.0, 18.0, 9.0, 8.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0214691162109375, -0.020818471908569336, -0.020167827606201172, -0.019517183303833008, -0.018866539001464844, -0.01821589469909668, -0.017565250396728516, -0.01691460609436035, -0.016263961791992188, -0.015613317489624023, -0.01496267318725586, -0.014312028884887695, -0.013661384582519531, -0.013010740280151367, -0.012360095977783203, -0.011709451675415039, -0.011058807373046875, -0.010408163070678711, -0.009757518768310547, -0.009106874465942383, -0.008456230163574219, -0.007805585861206055, -0.007154941558837891, -0.0065042972564697266, -0.0058536529541015625, -0.0052030086517333984, -0.004552364349365234, -0.0039017200469970703, -0.0032510757446289062, -0.002600431442260742, -0.0019497871398925781, -0.001299142837524414, -0.00064849853515625, 2.1457672119140625e-06, 0.0006527900695800781, 0.0013034343719482422, 0.0019540786743164062, 0.0026047229766845703, 0.0032553672790527344, 0.0039060115814208984, 0.0045566558837890625, 0.0052073001861572266, 0.005857944488525391, 0.006508588790893555, 0.007159233093261719, 0.007809877395629883, 0.008460521697998047, 0.009111166000366211, 0.009761810302734375, 0.010412454605102539, 0.011063098907470703, 0.011713743209838867, 0.012364387512207031, 0.013015031814575195, 0.01366567611694336, 0.014316320419311523, 0.014966964721679688, 0.015617609024047852, 0.016268253326416016, 0.01691889762878418, 0.017569541931152344, 0.018220186233520508, 0.018870830535888672, 0.019521474838256836, 0.020172119140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 14.0, 16.0, 13.0, 19.0, 32.0, 33.0, 35.0, 30.0, 43.0, 46.0, 69.0, 61.0, 58.0, 38.0, 55.0, 64.0, 57.0, 39.0, 29.0, 42.0, 27.0, 34.0, 20.0, 19.0, 8.0, 8.0, 4.0, 8.0, 5.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005176544189453125, -0.005019545555114746, -0.004862546920776367, -0.004705548286437988, -0.004548549652099609, -0.0043915510177612305, -0.0042345523834228516, -0.004077553749084473, -0.003920555114746094, -0.003763556480407715, -0.003606557846069336, -0.003449559211730957, -0.003292560577392578, -0.0031355619430541992, -0.0029785633087158203, -0.0028215646743774414, -0.0026645660400390625, -0.0025075674057006836, -0.0023505687713623047, -0.0021935701370239258, -0.002036571502685547, -0.001879572868347168, -0.001722574234008789, -0.0015655755996704102, -0.0014085769653320312, -0.0012515783309936523, -0.0010945796966552734, -0.0009375810623168945, -0.0007805824279785156, -0.0006235837936401367, -0.0004665851593017578, -0.0003095865249633789, -0.000152587890625, 4.410743713378906e-06, 0.0001614093780517578, 0.0003184080123901367, 0.0004754066467285156, 0.0006324052810668945, 0.0007894039154052734, 0.0009464025497436523, 0.0011034011840820312, 0.0012603998184204102, 0.001417398452758789, 0.001574397087097168, 0.0017313957214355469, 0.0018883943557739258, 0.0020453929901123047, 0.0022023916244506836, 0.0023593902587890625, 0.0025163888931274414, 0.0026733875274658203, 0.0028303861618041992, 0.002987384796142578, 0.003144383430480957, 0.003301382064819336, 0.003458380699157715, 0.0036153793334960938, 0.0037723779678344727, 0.0039293766021728516, 0.0040863752365112305, 0.004243373870849609, 0.004400372505187988, 0.004557371139526367, 0.004714369773864746, 0.004871368408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 8.0, 3.0, 7.0, 10.0, 19.0, 23.0, 17.0, 45.0, 56.0, 53.0, 95.0, 85.0, 97.0, 91.0, 81.0, 75.0, 71.0, 56.0, 38.0, 39.0, 15.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3764435350894928, -0.36676907539367676, -0.3570946455001831, -0.34742018580436707, -0.3377457559108734, -0.3280712962150574, -0.3183968663215637, -0.3087224066257477, -0.29904794692993164, -0.2893734872341156, -0.27969905734062195, -0.2700245976448059, -0.26035016775131226, -0.2506757080554962, -0.24100126326084137, -0.23132681846618652, -0.22165237367153168, -0.21197792887687683, -0.20230348408222198, -0.19262903928756714, -0.1829545795917511, -0.17328013479709625, -0.1636056900024414, -0.15393123030662537, -0.1442568004131317, -0.13458235561847687, -0.12490790337324142, -0.11523345857858658, -0.10555900633335114, -0.09588456153869629, -0.08621011674404144, -0.076535664498806, -0.06686121225357056, -0.05718676373362541, -0.04751231521368027, -0.03783787041902542, -0.028163421899080276, -0.018488973379135132, -0.008814528584480286, 0.0008599236607551575, 0.010534368455410004, 0.02020881697535515, 0.029883263632655144, 0.03955771028995514, 0.049232158809900284, 0.05890660732984543, 0.06858105212450027, 0.07825550436973572, 0.08792994916439056, 0.09760439395904541, 0.10727884620428085, 0.1169532909989357, 0.12662774324417114, 0.136302188038826, 0.14597663283348083, 0.15565109252929688, 0.16532552242279053, 0.17499996721744537, 0.18467441201210022, 0.19434887170791626, 0.2040233165025711, 0.21369776129722595, 0.2233722060918808, 0.23304665088653564, 0.24272111058235168]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 8.0, 14.0, 10.0, 8.0, 14.0, 20.0, 22.0, 23.0, 21.0, 35.0, 21.0, 37.0, 54.0, 41.0, 41.0, 39.0, 50.0, 57.0, 60.0, 43.0, 49.0, 35.0, 46.0, 41.0, 34.0, 22.0, 29.0, 28.0, 14.0, 15.0, 14.0, 7.0, 11.0, 4.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717919558286667, -0.16606242954730988, -0.16033290326595306, -0.15460337698459625, -0.14887385070323944, -0.14314432442188263, -0.13741478323936462, -0.1316852569580078, -0.125955730676651, -0.12022620439529419, -0.11449667811393738, -0.10876715183258057, -0.10303762555122375, -0.09730809926986694, -0.09157856553792953, -0.08584903925657272, -0.08011952042579651, -0.0743899941444397, -0.06866046786308289, -0.06293094158172607, -0.057201411575078964, -0.05147188529372215, -0.04574235528707504, -0.04001282900571823, -0.03428330272436142, -0.028553776443004608, -0.022824248299002647, -0.017094720155000687, -0.011365193873643875, -0.005635667592287064, 9.386241436004639e-05, 0.005823388695716858, 0.01155291497707367, 0.01728244125843048, 0.02301196940243244, 0.028741497546434402, 0.034471023827791214, 0.040200550109148026, 0.045930080115795135, 0.05165960639715195, 0.05738913267850876, 0.06311865895986557, 0.06884818524122238, 0.07457771897315979, 0.0803072452545166, 0.08603677153587341, 0.09176629781723022, 0.09749582409858704, 0.10322535037994385, 0.10895487666130066, 0.11468440294265747, 0.12041392922401428, 0.1261434555053711, 0.1318729817867279, 0.13760250806808472, 0.14333203434944153, 0.14906156063079834, 0.15479108691215515, 0.16052061319351196, 0.16625013947486877, 0.17197966575622559, 0.1777091920375824, 0.1834387183189392, 0.18916824460029602, 0.19489778578281403]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 11.0, 16.0, 14.0, 26.0, 34.0, 53.0, 74.0, 126.0, 162.0, 292.0, 451.0, 707.0, 1313.0, 2366.0, 4698.0, 9488.0, 20863.0, 51985.0, 175029.0, 494756.0, 188870.0, 54771.0, 21845.0, 9863.0, 4824.0, 2465.0, 1400.0, 792.0, 451.0, 266.0, 184.0, 112.0, 77.0, 54.0, 37.0, 31.0, 16.0, 10.0, 10.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.234375, -0.225860595703125, -0.21734619140625, -0.208831787109375, -0.2003173828125, -0.191802978515625, -0.18328857421875, -0.174774169921875, -0.166259765625, -0.157745361328125, -0.14923095703125, -0.140716552734375, -0.1322021484375, -0.123687744140625, -0.11517333984375, -0.106658935546875, -0.09814453125, -0.089630126953125, -0.08111572265625, -0.072601318359375, -0.0640869140625, -0.055572509765625, -0.04705810546875, -0.038543701171875, -0.030029296875, -0.021514892578125, -0.01300048828125, -0.004486083984375, 0.0040283203125, 0.012542724609375, 0.02105712890625, 0.029571533203125, 0.0380859375, 0.046600341796875, 0.05511474609375, 0.063629150390625, 0.0721435546875, 0.080657958984375, 0.08917236328125, 0.097686767578125, 0.106201171875, 0.114715576171875, 0.12322998046875, 0.131744384765625, 0.1402587890625, 0.148773193359375, 0.15728759765625, 0.165802001953125, 0.17431640625, 0.182830810546875, 0.19134521484375, 0.199859619140625, 0.2083740234375, 0.216888427734375, 0.22540283203125, 0.233917236328125, 0.242431640625, 0.250946044921875, 0.25946044921875, 0.267974853515625, 0.2764892578125, 0.285003662109375, 0.29351806640625, 0.302032470703125, 0.310546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 17.0, 15.0, 17.0, 27.0, 27.0, 21.0, 25.0, 41.0, 47.0, 50.0, 63.0, 61.0, 65.0, 59.0, 53.0, 54.0, 58.0, 47.0, 41.0, 32.0, 30.0, 34.0, 16.0, 13.0, 15.0, 13.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3564643859863281, -0.34256744384765625, -0.3286705017089844, -0.3147735595703125, -0.3008766174316406, -0.28697967529296875, -0.2730827331542969, -0.259185791015625, -0.24528884887695312, -0.23139190673828125, -0.21749496459960938, -0.2035980224609375, -0.18970108032226562, -0.17580413818359375, -0.16190719604492188, -0.14801025390625, -0.13411331176757812, -0.12021636962890625, -0.10631942749023438, -0.0924224853515625, -0.07852554321289062, -0.06462860107421875, -0.050731658935546875, -0.036834716796875, -0.022937774658203125, -0.00904083251953125, 0.004856109619140625, 0.0187530517578125, 0.032649993896484375, 0.04654693603515625, 0.060443878173828125, 0.0743408203125, 0.08823776245117188, 0.10213470458984375, 0.11603164672851562, 0.1299285888671875, 0.14382553100585938, 0.15772247314453125, 0.17161941528320312, 0.185516357421875, 0.19941329956054688, 0.21331024169921875, 0.22720718383789062, 0.2411041259765625, 0.2550010681152344, 0.26889801025390625, 0.2827949523925781, 0.29669189453125, 0.3105888366699219, 0.32448577880859375, 0.3383827209472656, 0.3522796630859375, 0.3661766052246094, 0.38007354736328125, 0.3939704895019531, 0.407867431640625, 0.4217643737792969, 0.43566131591796875, 0.4495582580566406, 0.4634552001953125, 0.4773521423339844, 0.49124908447265625, 0.5051460266113281, 0.51904296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 13.0, 20.0, 29.0, 34.0, 67.0, 117.0, 286.0, 777.0, 3118.0, 19574.0, 282712.0, 699936.0, 34872.0, 5211.0, 1061.0, 335.0, 143.0, 78.0, 51.0, 39.0, 12.0, 22.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5527191162109375, -0.530731201171875, -0.5087432861328125, -0.48675537109375, -0.4647674560546875, -0.442779541015625, -0.4207916259765625, -0.3988037109375, -0.3768157958984375, -0.354827880859375, -0.3328399658203125, -0.31085205078125, -0.2888641357421875, -0.266876220703125, -0.2448883056640625, -0.222900390625, -0.2009124755859375, -0.178924560546875, -0.1569366455078125, -0.13494873046875, -0.1129608154296875, -0.090972900390625, -0.0689849853515625, -0.0469970703125, -0.0250091552734375, -0.003021240234375, 0.0189666748046875, 0.04095458984375, 0.0629425048828125, 0.084930419921875, 0.1069183349609375, 0.12890625, 0.1508941650390625, 0.172882080078125, 0.1948699951171875, 0.21685791015625, 0.2388458251953125, 0.260833740234375, 0.2828216552734375, 0.3048095703125, 0.3267974853515625, 0.348785400390625, 0.3707733154296875, 0.39276123046875, 0.4147491455078125, 0.436737060546875, 0.4587249755859375, 0.480712890625, 0.5027008056640625, 0.524688720703125, 0.5466766357421875, 0.56866455078125, 0.5906524658203125, 0.612640380859375, 0.6346282958984375, 0.6566162109375, 0.6786041259765625, 0.700592041015625, 0.7225799560546875, 0.74456787109375, 0.7665557861328125, 0.788543701171875, 0.8105316162109375, 0.83251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 10.0, 12.0, 20.0, 26.0, 31.0, 35.0, 33.0, 58.0, 51.0, 50.0, 57.0, 64.0, 57.0, 59.0, 60.0, 61.0, 54.0, 40.0, 38.0, 30.0, 26.0, 19.0, 16.0, 18.0, 8.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62451171875, -0.6078262329101562, -0.5911407470703125, -0.5744552612304688, -0.557769775390625, -0.5410842895507812, -0.5243988037109375, -0.5077133178710938, -0.49102783203125, -0.47434234619140625, -0.4576568603515625, -0.44097137451171875, -0.424285888671875, -0.40760040283203125, -0.3909149169921875, -0.37422943115234375, -0.3575439453125, -0.34085845947265625, -0.3241729736328125, -0.30748748779296875, -0.290802001953125, -0.27411651611328125, -0.2574310302734375, -0.24074554443359375, -0.22406005859375, -0.20737457275390625, -0.1906890869140625, -0.17400360107421875, -0.157318115234375, -0.14063262939453125, -0.1239471435546875, -0.10726165771484375, -0.090576171875, -0.07389068603515625, -0.0572052001953125, -0.04051971435546875, -0.023834228515625, -0.00714874267578125, 0.0095367431640625, 0.02622222900390625, 0.04290771484375, 0.05959320068359375, 0.0762786865234375, 0.09296417236328125, 0.109649658203125, 0.12633514404296875, 0.1430206298828125, 0.15970611572265625, 0.1763916015625, 0.19307708740234375, 0.2097625732421875, 0.22644805908203125, 0.243133544921875, 0.25981903076171875, 0.2765045166015625, 0.29319000244140625, 0.30987548828125, 0.32656097412109375, 0.3432464599609375, 0.35993194580078125, 0.376617431640625, 0.39330291748046875, 0.4099884033203125, 0.42667388916015625, 0.443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 13.0, 15.0, 15.0, 19.0, 39.0, 49.0, 119.0, 169.0, 335.0, 697.0, 1479.0, 3756.0, 13766.0, 82554.0, 664613.0, 239263.0, 30762.0, 6659.0, 2238.0, 918.0, 472.0, 262.0, 111.0, 86.0, 55.0, 27.0, 16.0, 10.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.132080078125, -0.12838459014892578, -0.12468910217285156, -0.12099361419677734, -0.11729812622070312, -0.1136026382446289, -0.10990715026855469, -0.10621166229248047, -0.10251617431640625, -0.09882068634033203, -0.09512519836425781, -0.0914297103881836, -0.08773422241210938, -0.08403873443603516, -0.08034324645996094, -0.07664775848388672, -0.0729522705078125, -0.06925678253173828, -0.06556129455566406, -0.061865806579589844, -0.058170318603515625, -0.054474830627441406, -0.05077934265136719, -0.04708385467529297, -0.04338836669921875, -0.03969287872314453, -0.03599739074707031, -0.032301902770996094, -0.028606414794921875, -0.024910926818847656, -0.021215438842773438, -0.01751995086669922, -0.013824462890625, -0.010128974914550781, -0.0064334869384765625, -0.0027379989624023438, 0.000957489013671875, 0.004652976989746094, 0.008348464965820312, 0.012043952941894531, 0.01573944091796875, 0.01943492889404297, 0.023130416870117188, 0.026825904846191406, 0.030521392822265625, 0.034216880798339844, 0.03791236877441406, 0.04160785675048828, 0.0453033447265625, 0.04899883270263672, 0.05269432067871094, 0.056389808654785156, 0.060085296630859375, 0.0637807846069336, 0.06747627258300781, 0.07117176055908203, 0.07486724853515625, 0.07856273651123047, 0.08225822448730469, 0.0859537124633789, 0.08964920043945312, 0.09334468841552734, 0.09704017639160156, 0.10073566436767578, 0.10443115234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 7.0, 11.0, 6.0, 18.0, 12.0, 20.0, 23.0, 42.0, 33.0, 52.0, 63.0, 79.0, 91.0, 112.0, 87.0, 70.0, 58.0, 53.0, 38.0, 21.0, 15.0, 19.0, 11.0, 14.0, 7.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4727935194969177e-05, -1.4256685972213745e-05, -1.3785436749458313e-05, -1.3314187526702881e-05, -1.2842938303947449e-05, -1.2371689081192017e-05, -1.1900439858436584e-05, -1.1429190635681152e-05, -1.095794141292572e-05, -1.0486692190170288e-05, -1.0015442967414856e-05, -9.544193744659424e-06, -9.072944521903992e-06, -8.60169529914856e-06, -8.130446076393127e-06, -7.659196853637695e-06, -7.187947630882263e-06, -6.716698408126831e-06, -6.245449185371399e-06, -5.774199962615967e-06, -5.302950739860535e-06, -4.8317015171051025e-06, -4.36045229434967e-06, -3.889203071594238e-06, -3.417953848838806e-06, -2.946704626083374e-06, -2.475455403327942e-06, -2.0042061805725098e-06, -1.5329569578170776e-06, -1.0617077350616455e-06, -5.904585123062134e-07, -1.1920928955078125e-07, 3.520399332046509e-07, 8.23289155960083e-07, 1.2945383787155151e-06, 1.7657876014709473e-06, 2.2370368242263794e-06, 2.7082860469818115e-06, 3.1795352697372437e-06, 3.6507844924926758e-06, 4.122033715248108e-06, 4.59328293800354e-06, 5.064532160758972e-06, 5.535781383514404e-06, 6.0070306062698364e-06, 6.4782798290252686e-06, 6.949529051780701e-06, 7.420778274536133e-06, 7.892027497291565e-06, 8.363276720046997e-06, 8.83452594280243e-06, 9.305775165557861e-06, 9.777024388313293e-06, 1.0248273611068726e-05, 1.0719522833824158e-05, 1.119077205657959e-05, 1.1662021279335022e-05, 1.2133270502090454e-05, 1.2604519724845886e-05, 1.3075768947601318e-05, 1.354701817035675e-05, 1.4018267393112183e-05, 1.4489516615867615e-05, 1.4960765838623047e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 8.0, 10.0, 23.0, 36.0, 65.0, 106.0, 212.0, 467.0, 1049.0, 2643.0, 9233.0, 65880.0, 723375.0, 217917.0, 20194.0, 4427.0, 1592.0, 669.0, 293.0, 173.0, 83.0, 32.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16492080688476562, -0.15955352783203125, -0.15418624877929688, -0.1488189697265625, -0.14345169067382812, -0.13808441162109375, -0.13271713256835938, -0.127349853515625, -0.12198257446289062, -0.11661529541015625, -0.11124801635742188, -0.1058807373046875, -0.10051345825195312, -0.09514617919921875, -0.08977890014648438, -0.08441162109375, -0.07904434204101562, -0.07367706298828125, -0.06830978393554688, -0.0629425048828125, -0.057575225830078125, -0.05220794677734375, -0.046840667724609375, -0.041473388671875, -0.036106109619140625, -0.03073883056640625, -0.025371551513671875, -0.0200042724609375, -0.014636993408203125, -0.00926971435546875, -0.003902435302734375, 0.00146484375, 0.006832122802734375, 0.01219940185546875, 0.017566680908203125, 0.0229339599609375, 0.028301239013671875, 0.03366851806640625, 0.039035797119140625, 0.044403076171875, 0.049770355224609375, 0.05513763427734375, 0.060504913330078125, 0.0658721923828125, 0.07123947143554688, 0.07660675048828125, 0.08197402954101562, 0.08734130859375, 0.09270858764648438, 0.09807586669921875, 0.10344314575195312, 0.1088104248046875, 0.11417770385742188, 0.11954498291015625, 0.12491226196289062, 0.130279541015625, 0.13564682006835938, 0.14101409912109375, 0.14638137817382812, 0.1517486572265625, 0.15711593627929688, 0.16248321533203125, 0.16785049438476562, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 16.0, 18.0, 21.0, 29.0, 60.0, 86.0, 136.0, 145.0, 148.0, 93.0, 68.0, 41.0, 40.0, 26.0, 16.0, 14.0, 3.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0670166015625, -0.06490612030029297, -0.06279563903808594, -0.060685157775878906, -0.058574676513671875, -0.056464195251464844, -0.05435371398925781, -0.05224323272705078, -0.05013275146484375, -0.04802227020263672, -0.04591178894042969, -0.043801307678222656, -0.041690826416015625, -0.039580345153808594, -0.03746986389160156, -0.03535938262939453, -0.0332489013671875, -0.03113842010498047, -0.029027938842773438, -0.026917457580566406, -0.024806976318359375, -0.022696495056152344, -0.020586013793945312, -0.01847553253173828, -0.01636505126953125, -0.014254570007324219, -0.012144088745117188, -0.010033607482910156, -0.007923126220703125, -0.005812644958496094, -0.0037021636962890625, -0.0015916824340820312, 0.000518798828125, 0.0026292800903320312, 0.0047397613525390625, 0.006850242614746094, 0.008960723876953125, 0.011071205139160156, 0.013181686401367188, 0.015292167663574219, 0.01740264892578125, 0.01951313018798828, 0.021623611450195312, 0.023734092712402344, 0.025844573974609375, 0.027955055236816406, 0.030065536499023438, 0.03217601776123047, 0.0342864990234375, 0.03639698028564453, 0.03850746154785156, 0.040617942810058594, 0.042728424072265625, 0.044838905334472656, 0.04694938659667969, 0.04905986785888672, 0.05117034912109375, 0.05328083038330078, 0.05539131164550781, 0.057501792907714844, 0.059612274169921875, 0.061722755432128906, 0.06383323669433594, 0.06594371795654297, 0.06805419921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 32.0, 87.0, 176.0, 280.0, 248.0, 116.0, 54.0, 11.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8445942997932434, -0.7835565805435181, -0.7225189208984375, -0.6614812016487122, -0.6004435420036316, -0.5394058227539062, -0.4783681333065033, -0.41733044385910034, -0.3562927544116974, -0.29525506496429443, -0.23421737551689148, -0.17317967116832733, -0.11214198172092438, -0.05110427737236023, 0.009933412075042725, 0.07097110152244568, 0.13200879096984863, 0.1930464804172516, 0.25408416986465454, 0.3151218891143799, 0.37615954875946045, 0.4371972680091858, 0.49823495745658875, 0.5592726469039917, 0.6203103065490723, 0.6813480257987976, 0.7423856854438782, 0.8034234046936035, 0.8644610643386841, 0.9254987835884094, 0.9865365028381348, 1.0475741624832153, 1.1086119413375854, 1.169649600982666, 1.2306873798370361, 1.2917250394821167, 1.3527626991271973, 1.4138004779815674, 1.474838137626648, 1.5358757972717285, 1.596913456916809, 1.6579511165618896, 1.7189888954162598, 1.7800265550613403, 1.841064214706421, 1.902101993560791, 1.9631396532058716, 2.024177312850952, 2.0852150917053223, 2.1462528705596924, 2.2072904109954834, 2.2683281898498535, 2.3293659687042236, 2.3904035091400146, 2.4514412879943848, 2.512478828430176, 2.573516607284546, 2.634554386138916, 2.695591926574707, 2.756629705429077, 2.8176674842834473, 2.8787050247192383, 2.9397428035736084, 3.0007805824279785, 3.0618181228637695]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 9.0, 19.0, 10.0, 13.0, 21.0, 24.0, 24.0, 23.0, 27.0, 31.0, 29.0, 42.0, 39.0, 37.0, 38.0, 42.0, 51.0, 51.0, 48.0, 55.0, 41.0, 38.0, 44.0, 43.0, 32.0, 19.0, 29.0, 17.0, 20.0, 11.0, 15.0, 12.0, 12.0, 6.0, 3.0, 10.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6871644258499146, -0.6649504899978638, -0.6427364945411682, -0.6205225586891174, -0.5983086228370667, -0.5760946869850159, -0.5538806915283203, -0.5316667556762695, -0.5094528198242188, -0.4872388541698456, -0.4650249183177948, -0.44281095266342163, -0.42059701681137085, -0.3983830511569977, -0.3761690855026245, -0.35395514965057373, -0.33174118399620056, -0.3095272183418274, -0.2873132824897766, -0.26509931683540344, -0.24288538098335266, -0.2206714153289795, -0.19845746457576752, -0.17624351382255554, -0.15402956306934357, -0.1318156123161316, -0.10960166156291962, -0.08738770335912704, -0.06517375260591507, -0.042959801852703094, -0.020745843648910522, 0.0014681071043014526, 0.023682057857513428, 0.0458960086107254, 0.06810995936393738, 0.09032391756772995, 0.11253786832094193, 0.1347518265247345, 0.15696577727794647, 0.17917972803115845, 0.20139367878437042, 0.2236076295375824, 0.24582158029079437, 0.26803553104400635, 0.2902494966983795, 0.3124634325504303, 0.33467739820480347, 0.35689133405685425, 0.3791052997112274, 0.4013192653656006, 0.42353320121765137, 0.44574716687202454, 0.4679611027240753, 0.4901750683784485, 0.5123890042304993, 0.5346029996871948, 0.5568169355392456, 0.5790308713912964, 0.6012448668479919, 0.6234588027000427, 0.6456727385520935, 0.6678866744041443, 0.6901006698608398, 0.7123146057128906, 0.7345285415649414]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 10.0, 13.0, 12.0, 15.0, 19.0, 25.0, 40.0, 67.0, 105.0, 167.0, 346.0, 710.0, 1585.0, 3491.0, 9441.0, 34293.0, 377416.0, 3245929.0, 466798.0, 37175.0, 9898.0, 3630.0, 1558.0, 723.0, 342.0, 162.0, 98.0, 46.0, 42.0, 25.0, 21.0, 13.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5044822692871094, -0.48943328857421875, -0.4743843078613281, -0.4593353271484375, -0.4442863464355469, -0.42923736572265625, -0.4141883850097656, -0.399139404296875, -0.3840904235839844, -0.36904144287109375, -0.3539924621582031, -0.3389434814453125, -0.3238945007324219, -0.30884552001953125, -0.2937965393066406, -0.27874755859375, -0.2636985778808594, -0.24864959716796875, -0.23360061645507812, -0.2185516357421875, -0.20350265502929688, -0.18845367431640625, -0.17340469360351562, -0.158355712890625, -0.14330673217773438, -0.12825775146484375, -0.11320877075195312, -0.0981597900390625, -0.08311080932617188, -0.06806182861328125, -0.053012847900390625, -0.0379638671875, -0.022914886474609375, -0.00786590576171875, 0.007183074951171875, 0.0222320556640625, 0.037281036376953125, 0.05233001708984375, 0.06737899780273438, 0.082427978515625, 0.09747695922851562, 0.11252593994140625, 0.12757492065429688, 0.1426239013671875, 0.15767288208007812, 0.17272186279296875, 0.18777084350585938, 0.20281982421875, 0.21786880493164062, 0.23291778564453125, 0.24796676635742188, 0.2630157470703125, 0.2780647277832031, 0.29311370849609375, 0.3081626892089844, 0.323211669921875, 0.3382606506347656, 0.35330963134765625, 0.3683586120605469, 0.3834075927734375, 0.3984565734863281, 0.41350555419921875, 0.4285545349121094, 0.443603515625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 11.0, 8.0, 16.0, 16.0, 10.0, 15.0, 21.0, 29.0, 25.0, 34.0, 32.0, 29.0, 27.0, 45.0, 40.0, 48.0, 37.0, 51.0, 41.0, 56.0, 50.0, 51.0, 41.0, 41.0, 44.0, 33.0, 22.0, 21.0, 13.0, 10.0, 13.0, 18.0, 9.0, 8.0, 2.0, 6.0, 3.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.222412109375, -0.21626853942871094, -0.21012496948242188, -0.2039813995361328, -0.19783782958984375, -0.1916942596435547, -0.18555068969726562, -0.17940711975097656, -0.1732635498046875, -0.16711997985839844, -0.16097640991210938, -0.1548328399658203, -0.14868927001953125, -0.1425457000732422, -0.13640213012695312, -0.13025856018066406, -0.124114990234375, -0.11797142028808594, -0.11182785034179688, -0.10568428039550781, -0.09954071044921875, -0.09339714050292969, -0.08725357055664062, -0.08111000061035156, -0.0749664306640625, -0.06882286071777344, -0.06267929077148438, -0.05653572082519531, -0.05039215087890625, -0.04424858093261719, -0.038105010986328125, -0.03196144104003906, -0.02581787109375, -0.019674301147460938, -0.013530731201171875, -0.0073871612548828125, -0.00124359130859375, 0.0048999786376953125, 0.011043548583984375, 0.017187118530273438, 0.0233306884765625, 0.029474258422851562, 0.035617828369140625, 0.04176139831542969, 0.04790496826171875, 0.05404853820800781, 0.060192108154296875, 0.06633567810058594, 0.072479248046875, 0.07862281799316406, 0.08476638793945312, 0.09090995788574219, 0.09705352783203125, 0.10319709777832031, 0.10934066772460938, 0.11548423767089844, 0.1216278076171875, 0.12777137756347656, 0.13391494750976562, 0.1400585174560547, 0.14620208740234375, 0.1523456573486328, 0.15848922729492188, 0.16463279724121094, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 12.0, 12.0, 19.0, 40.0, 70.0, 141.0, 317.0, 989.0, 5383.0, 119756.0, 4015424.0, 47472.0, 3407.0, 726.0, 244.0, 120.0, 64.0, 42.0, 16.0, 11.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3781814575195312, -1.3413238525390625, -1.3044662475585938, -1.267608642578125, -1.2307510375976562, -1.1938934326171875, -1.1570358276367188, -1.12017822265625, -1.0833206176757812, -1.0464630126953125, -1.0096054077148438, -0.972747802734375, -0.9358901977539062, -0.8990325927734375, -0.8621749877929688, -0.8253173828125, -0.7884597778320312, -0.7516021728515625, -0.7147445678710938, -0.677886962890625, -0.6410293579101562, -0.6041717529296875, -0.5673141479492188, -0.53045654296875, -0.49359893798828125, -0.4567413330078125, -0.41988372802734375, -0.383026123046875, -0.34616851806640625, -0.3093109130859375, -0.27245330810546875, -0.235595703125, -0.19873809814453125, -0.1618804931640625, -0.12502288818359375, -0.088165283203125, -0.05130767822265625, -0.0144500732421875, 0.02240753173828125, 0.05926513671875, 0.09612274169921875, 0.1329803466796875, 0.16983795166015625, 0.206695556640625, 0.24355316162109375, 0.2804107666015625, 0.31726837158203125, 0.3541259765625, 0.39098358154296875, 0.4278411865234375, 0.46469879150390625, 0.501556396484375, 0.5384140014648438, 0.5752716064453125, 0.6121292114257812, 0.64898681640625, 0.6858444213867188, 0.7227020263671875, 0.7595596313476562, 0.796417236328125, 0.8332748413085938, 0.8701324462890625, 0.9069900512695312, 0.94384765625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 18.0, 19.0, 33.0, 67.0, 110.0, 251.0, 638.0, 1180.0, 930.0, 432.0, 170.0, 96.0, 46.0, 34.0, 19.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20533180236816406, -0.19765090942382812, -0.1899700164794922, -0.18228912353515625, -0.1746082305908203, -0.16692733764648438, -0.15924644470214844, -0.1515655517578125, -0.14388465881347656, -0.13620376586914062, -0.1285228729248047, -0.12084197998046875, -0.11316108703613281, -0.10548019409179688, -0.09779930114746094, -0.090118408203125, -0.08243751525878906, -0.07475662231445312, -0.06707572937011719, -0.05939483642578125, -0.05171394348144531, -0.044033050537109375, -0.03635215759277344, -0.0286712646484375, -0.020990371704101562, -0.013309478759765625, -0.0056285858154296875, 0.00205230712890625, 0.009733200073242188, 0.017414093017578125, 0.025094985961914062, 0.03277587890625, 0.04045677185058594, 0.048137664794921875, 0.05581855773925781, 0.06349945068359375, 0.07118034362792969, 0.07886123657226562, 0.08654212951660156, 0.0942230224609375, 0.10190391540527344, 0.10958480834960938, 0.11726570129394531, 0.12494659423828125, 0.1326274871826172, 0.14030838012695312, 0.14798927307128906, 0.155670166015625, 0.16335105895996094, 0.17103195190429688, 0.1787128448486328, 0.18639373779296875, 0.1940746307373047, 0.20175552368164062, 0.20943641662597656, 0.2171173095703125, 0.22479820251464844, 0.23247909545898438, 0.2401599884033203, 0.24784088134765625, 0.2555217742919922, 0.2632026672363281, 0.27088356018066406, 0.278564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 13.0, 16.0, 21.0, 28.0, 36.0, 47.0, 55.0, 70.0, 56.0, 77.0, 69.0, 73.0, 71.0, 49.0, 56.0, 56.0, 42.0, 34.0, 28.0, 19.0, 21.0, 10.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5387060642242432, -0.5260964632034302, -0.5134868621826172, -0.5008772611618042, -0.4882676601409912, -0.4756580591201782, -0.46304845809936523, -0.45043885707855225, -0.43782925605773926, -0.42521965503692627, -0.4126100540161133, -0.4000004529953003, -0.3873908519744873, -0.3747812509536743, -0.36217164993286133, -0.34956204891204834, -0.33695247769355774, -0.32434287667274475, -0.31173327565193176, -0.2991236746311188, -0.2865140736103058, -0.2739044725894928, -0.2612949013710022, -0.24868528544902802, -0.23607568442821503, -0.22346608340740204, -0.21085648238658905, -0.19824689626693726, -0.18563729524612427, -0.17302769422531128, -0.1604180932044983, -0.1478084921836853, -0.1351989209651947, -0.12258931994438171, -0.10997971892356873, -0.09737012535333633, -0.08476052433252335, -0.07215092331171036, -0.059541329741477966, -0.04693172872066498, -0.03432212769985199, -0.02171252854168415, -0.009102929383516312, 0.003506667912006378, 0.016116268932819366, 0.028725869953632355, 0.041335463523864746, 0.053945064544677734, 0.06655466556549072, 0.07916426658630371, 0.0917738676071167, 0.10438346117734909, 0.11699306219816208, 0.12960267066955566, 0.14221225678920746, 0.15482185781002045, 0.16743145883083344, 0.18004105985164642, 0.1926506608724594, 0.2052602469921112, 0.2178698480129242, 0.23047944903373718, 0.24308905005455017, 0.25569865107536316, 0.26830825209617615]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 10.0, 15.0, 9.0, 15.0, 14.0, 19.0, 18.0, 19.0, 33.0, 24.0, 43.0, 43.0, 42.0, 31.0, 40.0, 42.0, 55.0, 46.0, 37.0, 38.0, 29.0, 29.0, 46.0, 32.0, 35.0, 34.0, 28.0, 29.0, 19.0, 14.0, 14.0, 12.0, 12.0, 16.0, 9.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.28750863671302795, -0.27930018305778503, -0.2710916996002197, -0.2628832459449768, -0.2546747624874115, -0.24646630883216858, -0.23825784027576447, -0.23004937171936035, -0.22184090316295624, -0.21363243460655212, -0.205423966050148, -0.1972154974937439, -0.18900704383850098, -0.18079856038093567, -0.17259010672569275, -0.16438163816928864, -0.15617316961288452, -0.1479647010564804, -0.1397562325000763, -0.13154776394367218, -0.12333930283784866, -0.11513083428144455, -0.10692237317562103, -0.09871390461921692, -0.0905054360628128, -0.08229696750640869, -0.07408849895000458, -0.06588003784418106, -0.05767156928777695, -0.04946310073137283, -0.04125463590025902, -0.0330461710691452, -0.02483770251274109, -0.016629235818982124, -0.00842076912522316, -0.00021230243146419525, 0.00799616426229477, 0.016204632818698883, 0.0244130976498127, 0.032621562480926514, 0.04083003103733063, 0.04903849959373474, 0.057246964424848557, 0.06545542925596237, 0.07366389781236649, 0.0818723663687706, 0.09008082747459412, 0.09828929603099823, 0.10649776458740234, 0.11470623314380646, 0.12291470170021057, 0.13112317025661469, 0.1393316388130188, 0.14754009246826172, 0.15574856102466583, 0.16395702958106995, 0.17216549813747406, 0.18037396669387817, 0.1885824352502823, 0.1967909038066864, 0.20499935746192932, 0.21320784091949463, 0.22141629457473755, 0.22962476313114166, 0.23783323168754578]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 6.0, 15.0, 15.0, 25.0, 35.0, 43.0, 63.0, 78.0, 127.0, 169.0, 275.0, 446.0, 748.0, 1351.0, 2614.0, 4878.0, 9645.0, 22662.0, 80507.0, 429180.0, 384246.0, 71049.0, 20718.0, 9354.0, 4667.0, 2422.0, 1283.0, 695.0, 386.0, 250.0, 163.0, 126.0, 75.0, 50.0, 41.0, 28.0, 29.0, 13.0, 14.0, 14.0, 3.0, 8.0, 13.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.10528564453125, -0.10218524932861328, -0.09908485412597656, -0.09598445892333984, -0.09288406372070312, -0.0897836685180664, -0.08668327331542969, -0.08358287811279297, -0.08048248291015625, -0.07738208770751953, -0.07428169250488281, -0.0711812973022461, -0.06808090209960938, -0.06498050689697266, -0.06188011169433594, -0.05877971649169922, -0.0556793212890625, -0.05257892608642578, -0.04947853088378906, -0.046378135681152344, -0.043277740478515625, -0.040177345275878906, -0.03707695007324219, -0.03397655487060547, -0.03087615966796875, -0.02777576446533203, -0.024675369262695312, -0.021574974060058594, -0.018474578857421875, -0.015374183654785156, -0.012273788452148438, -0.009173393249511719, -0.006072998046875, -0.0029726028442382812, 0.0001277923583984375, 0.0032281875610351562, 0.006328582763671875, 0.009428977966308594, 0.012529373168945312, 0.01562976837158203, 0.01873016357421875, 0.02183055877685547, 0.024930953979492188, 0.028031349182128906, 0.031131744384765625, 0.034232139587402344, 0.03733253479003906, 0.04043292999267578, 0.0435333251953125, 0.04663372039794922, 0.04973411560058594, 0.052834510803222656, 0.055934906005859375, 0.059035301208496094, 0.06213569641113281, 0.06523609161376953, 0.06833648681640625, 0.07143688201904297, 0.07453727722167969, 0.0776376724243164, 0.08073806762695312, 0.08383846282958984, 0.08693885803222656, 0.09003925323486328, 0.0931396484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 10.0, 12.0, 12.0, 11.0, 14.0, 17.0, 23.0, 18.0, 26.0, 25.0, 37.0, 27.0, 54.0, 40.0, 35.0, 62.0, 50.0, 45.0, 47.0, 38.0, 41.0, 31.0, 42.0, 36.0, 25.0, 33.0, 27.0, 32.0, 16.0, 16.0, 19.0, 19.0, 9.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16146469116210938, -0.15581512451171875, -0.15016555786132812, -0.1445159912109375, -0.13886642456054688, -0.13321685791015625, -0.12756729125976562, -0.121917724609375, -0.11626815795898438, -0.11061859130859375, -0.10496902465820312, -0.0993194580078125, -0.09366989135742188, -0.08802032470703125, -0.08237075805664062, -0.07672119140625, -0.07107162475585938, -0.06542205810546875, -0.059772491455078125, -0.0541229248046875, -0.048473358154296875, -0.04282379150390625, -0.037174224853515625, -0.031524658203125, -0.025875091552734375, -0.02022552490234375, -0.014575958251953125, -0.0089263916015625, -0.003276824951171875, 0.00237274169921875, 0.008022308349609375, 0.013671875, 0.019321441650390625, 0.02497100830078125, 0.030620574951171875, 0.0362701416015625, 0.041919708251953125, 0.04756927490234375, 0.053218841552734375, 0.058868408203125, 0.06451797485351562, 0.07016754150390625, 0.07581710815429688, 0.0814666748046875, 0.08711624145507812, 0.09276580810546875, 0.09841537475585938, 0.10406494140625, 0.10971450805664062, 0.11536407470703125, 0.12101364135742188, 0.1266632080078125, 0.13231277465820312, 0.13796234130859375, 0.14361190795898438, 0.149261474609375, 0.15491104125976562, 0.16056060791015625, 0.16621017456054688, 0.1718597412109375, 0.17750930786132812, 0.18315887451171875, 0.18880844116210938, 0.1944580078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 11.0, 9.0, 22.0, 23.0, 29.0, 43.0, 56.0, 100.0, 122.0, 188.0, 263.0, 446.0, 741.0, 1186.0, 2126.0, 4014.0, 8343.0, 19397.0, 54304.0, 191389.0, 441353.0, 219992.0, 62742.0, 22341.0, 9155.0, 4450.0, 2317.0, 1234.0, 766.0, 485.0, 309.0, 168.0, 122.0, 85.0, 49.0, 46.0, 33.0, 20.0, 21.0, 11.0, 9.0, 3.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06194019317626953, -0.06003761291503906, -0.058135032653808594, -0.056232452392578125, -0.054329872131347656, -0.05242729187011719, -0.05052471160888672, -0.04862213134765625, -0.04671955108642578, -0.04481697082519531, -0.042914390563964844, -0.041011810302734375, -0.039109230041503906, -0.03720664978027344, -0.03530406951904297, -0.0334014892578125, -0.03149890899658203, -0.029596328735351562, -0.027693748474121094, -0.025791168212890625, -0.023888587951660156, -0.021986007690429688, -0.02008342742919922, -0.01818084716796875, -0.01627826690673828, -0.014375686645507812, -0.012473106384277344, -0.010570526123046875, -0.008667945861816406, -0.0067653656005859375, -0.004862785339355469, -0.002960205078125, -0.0010576248168945312, 0.0008449554443359375, 0.0027475357055664062, 0.004650115966796875, 0.006552696228027344, 0.008455276489257812, 0.010357856750488281, 0.01226043701171875, 0.014163017272949219, 0.016065597534179688, 0.017968177795410156, 0.019870758056640625, 0.021773338317871094, 0.023675918579101562, 0.02557849884033203, 0.0274810791015625, 0.02938365936279297, 0.03128623962402344, 0.033188819885253906, 0.035091400146484375, 0.036993980407714844, 0.03889656066894531, 0.04079914093017578, 0.04270172119140625, 0.04460430145263672, 0.04650688171386719, 0.048409461975097656, 0.050312042236328125, 0.052214622497558594, 0.05411720275878906, 0.05601978302001953, 0.05792236328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 12.0, 11.0, 12.0, 15.0, 19.0, 13.0, 23.0, 21.0, 22.0, 31.0, 28.0, 31.0, 41.0, 38.0, 51.0, 40.0, 34.0, 38.0, 30.0, 33.0, 41.0, 31.0, 29.0, 38.0, 32.0, 34.0, 33.0, 30.0, 29.0, 23.0, 23.0, 19.0, 13.0, 8.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.4091796875, -0.3971672058105469, -0.38515472412109375, -0.3731422424316406, -0.3611297607421875, -0.3491172790527344, -0.33710479736328125, -0.3250923156738281, -0.313079833984375, -0.3010673522949219, -0.28905487060546875, -0.2770423889160156, -0.2650299072265625, -0.2530174255371094, -0.24100494384765625, -0.22899246215820312, -0.21697998046875, -0.20496749877929688, -0.19295501708984375, -0.18094253540039062, -0.1689300537109375, -0.15691757202148438, -0.14490509033203125, -0.13289260864257812, -0.120880126953125, -0.10886764526367188, -0.09685516357421875, -0.08484268188476562, -0.0728302001953125, -0.060817718505859375, -0.04880523681640625, -0.036792755126953125, -0.0247802734375, -0.012767791748046875, -0.00075531005859375, 0.011257171630859375, 0.0232696533203125, 0.035282135009765625, 0.04729461669921875, 0.059307098388671875, 0.071319580078125, 0.08333206176757812, 0.09534454345703125, 0.10735702514648438, 0.1193695068359375, 0.13138198852539062, 0.14339447021484375, 0.15540695190429688, 0.16741943359375, 0.17943191528320312, 0.19144439697265625, 0.20345687866210938, 0.2154693603515625, 0.22748184204101562, 0.23949432373046875, 0.2515068054199219, 0.263519287109375, 0.2755317687988281, 0.28754425048828125, 0.2995567321777344, 0.3115692138671875, 0.3235816955566406, 0.33559417724609375, 0.3476066589355469, 0.359619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 11.0, 7.0, 12.0, 7.0, 20.0, 14.0, 19.0, 43.0, 76.0, 137.0, 191.0, 373.0, 867.0, 1689.0, 3908.0, 10736.0, 40895.0, 383763.0, 527420.0, 56922.0, 12972.0, 4544.0, 1959.0, 912.0, 463.0, 231.0, 152.0, 64.0, 44.0, 32.0, 21.0, 12.0, 14.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.047332763671875, -0.04598379135131836, -0.04463481903076172, -0.04328584671020508, -0.04193687438964844, -0.0405879020690918, -0.039238929748535156, -0.037889957427978516, -0.036540985107421875, -0.035192012786865234, -0.033843040466308594, -0.03249406814575195, -0.031145095825195312, -0.029796123504638672, -0.02844715118408203, -0.02709817886352539, -0.02574920654296875, -0.02440023422241211, -0.02305126190185547, -0.021702289581298828, -0.020353317260742188, -0.019004344940185547, -0.017655372619628906, -0.016306400299072266, -0.014957427978515625, -0.013608455657958984, -0.012259483337402344, -0.010910511016845703, -0.009561538696289062, -0.008212566375732422, -0.006863594055175781, -0.005514621734619141, -0.0041656494140625, -0.0028166770935058594, -0.0014677047729492188, -0.00011873245239257812, 0.0012302398681640625, 0.002579212188720703, 0.003928184509277344, 0.005277156829833984, 0.006626129150390625, 0.007975101470947266, 0.009324073791503906, 0.010673046112060547, 0.012022018432617188, 0.013370990753173828, 0.014719963073730469, 0.01606893539428711, 0.01741790771484375, 0.01876688003540039, 0.02011585235595703, 0.021464824676513672, 0.022813796997070312, 0.024162769317626953, 0.025511741638183594, 0.026860713958740234, 0.028209686279296875, 0.029558658599853516, 0.030907630920410156, 0.0322566032409668, 0.03360557556152344, 0.03495454788208008, 0.03630352020263672, 0.03765249252319336, 0.03900146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 6.0, 13.0, 24.0, 51.0, 71.0, 149.0, 182.0, 183.0, 132.0, 65.0, 38.0, 19.0, 9.0, 9.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8133392333984375e-05, -2.7156434953212738e-05, -2.61794775724411e-05, -2.5202520191669464e-05, -2.4225562810897827e-05, -2.324860543012619e-05, -2.2271648049354553e-05, -2.1294690668582916e-05, -2.031773328781128e-05, -1.9340775907039642e-05, -1.8363818526268005e-05, -1.738686114549637e-05, -1.640990376472473e-05, -1.5432946383953094e-05, -1.4455989003181458e-05, -1.347903162240982e-05, -1.2502074241638184e-05, -1.1525116860866547e-05, -1.054815948009491e-05, -9.571202099323273e-06, -8.594244718551636e-06, -7.617287337779999e-06, -6.640329957008362e-06, -5.663372576236725e-06, -4.686415195465088e-06, -3.709457814693451e-06, -2.732500433921814e-06, -1.755543053150177e-06, -7.7858567237854e-07, 1.9837170839309692e-07, 1.1753290891647339e-06, 2.152286469936371e-06, 3.129243850708008e-06, 4.106201231479645e-06, 5.083158612251282e-06, 6.060115993022919e-06, 7.037073373794556e-06, 8.014030754566193e-06, 8.99098813533783e-06, 9.967945516109467e-06, 1.0944902896881104e-05, 1.192186027765274e-05, 1.2898817658424377e-05, 1.3875775039196014e-05, 1.4852732419967651e-05, 1.582968980073929e-05, 1.6806647181510925e-05, 1.7783604562282562e-05, 1.87605619430542e-05, 1.9737519323825836e-05, 2.0714476704597473e-05, 2.169143408536911e-05, 2.2668391466140747e-05, 2.3645348846912384e-05, 2.462230622768402e-05, 2.5599263608455658e-05, 2.6576220989227295e-05, 2.7553178369998932e-05, 2.853013575077057e-05, 2.9507093131542206e-05, 3.0484050512313843e-05, 3.146100789308548e-05, 3.243796527385712e-05, 3.3414922654628754e-05, 3.439188003540039e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 19.0, 23.0, 39.0, 40.0, 79.0, 96.0, 189.0, 251.0, 417.0, 644.0, 1087.0, 1834.0, 3132.0, 6124.0, 12462.0, 30140.0, 93762.0, 303068.0, 381388.0, 138189.0, 42257.0, 16342.0, 7531.0, 4019.0, 2129.0, 1260.0, 694.0, 466.0, 284.0, 176.0, 126.0, 84.0, 63.0, 34.0, 23.0, 17.0, 13.0, 8.0, 15.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02618408203125, -0.02531576156616211, -0.02444744110107422, -0.023579120635986328, -0.022710800170898438, -0.021842479705810547, -0.020974159240722656, -0.020105838775634766, -0.019237518310546875, -0.018369197845458984, -0.017500877380371094, -0.016632556915283203, -0.015764236450195312, -0.014895915985107422, -0.014027595520019531, -0.01315927505493164, -0.01229095458984375, -0.01142263412475586, -0.010554313659667969, -0.009685993194580078, -0.008817672729492188, -0.007949352264404297, -0.007081031799316406, -0.006212711334228516, -0.005344390869140625, -0.004476070404052734, -0.0036077499389648438, -0.002739429473876953, -0.0018711090087890625, -0.0010027885437011719, -0.00013446807861328125, 0.0007338523864746094, 0.0016021728515625, 0.0024704933166503906, 0.0033388137817382812, 0.004207134246826172, 0.0050754547119140625, 0.005943775177001953, 0.006812095642089844, 0.007680416107177734, 0.008548736572265625, 0.009417057037353516, 0.010285377502441406, 0.011153697967529297, 0.012022018432617188, 0.012890338897705078, 0.013758659362792969, 0.01462697982788086, 0.01549530029296875, 0.01636362075805664, 0.01723194122314453, 0.018100261688232422, 0.018968582153320312, 0.019836902618408203, 0.020705223083496094, 0.021573543548583984, 0.022441864013671875, 0.023310184478759766, 0.024178504943847656, 0.025046825408935547, 0.025915145874023438, 0.026783466339111328, 0.02765178680419922, 0.02852010726928711, 0.029388427734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 9.0, 16.0, 20.0, 17.0, 38.0, 48.0, 77.0, 90.0, 83.0, 107.0, 92.0, 76.0, 85.0, 50.0, 39.0, 28.0, 21.0, 11.0, 19.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01061248779296875, -0.0102766752243042, -0.009940862655639648, -0.009605050086975098, -0.009269237518310547, -0.008933424949645996, -0.008597612380981445, -0.008261799812316895, -0.007925987243652344, -0.007590174674987793, -0.007254362106323242, -0.006918549537658691, -0.006582736968994141, -0.00624692440032959, -0.005911111831665039, -0.005575299263000488, -0.0052394866943359375, -0.004903674125671387, -0.004567861557006836, -0.004232048988342285, -0.0038962364196777344, -0.0035604238510131836, -0.003224611282348633, -0.002888798713684082, -0.0025529861450195312, -0.0022171735763549805, -0.0018813610076904297, -0.001545548439025879, -0.0012097358703613281, -0.0008739233016967773, -0.0005381107330322266, -0.00020229816436767578, 0.000133514404296875, 0.0004693269729614258, 0.0008051395416259766, 0.0011409521102905273, 0.0014767646789550781, 0.001812577247619629, 0.0021483898162841797, 0.0024842023849487305, 0.0028200149536132812, 0.003155827522277832, 0.003491640090942383, 0.0038274526596069336, 0.004163265228271484, 0.004499077796936035, 0.004834890365600586, 0.005170702934265137, 0.0055065155029296875, 0.005842328071594238, 0.006178140640258789, 0.00651395320892334, 0.006849765777587891, 0.007185578346252441, 0.007521390914916992, 0.007857203483581543, 0.008193016052246094, 0.008528828620910645, 0.008864641189575195, 0.009200453758239746, 0.009536266326904297, 0.009872078895568848, 0.010207891464233398, 0.01054370403289795, 0.0108795166015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 13.0, 13.0, 9.0, 13.0, 13.0, 24.0, 19.0, 46.0, 57.0, 48.0, 47.0, 52.0, 62.0, 56.0, 61.0, 61.0, 52.0, 52.0, 48.0, 55.0, 40.0, 27.0, 26.0, 15.0, 23.0, 12.0, 11.0, 6.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21121995151042938, -0.2046094834804535, -0.1979990005493164, -0.19138853251934052, -0.18477806448936462, -0.17816759645938873, -0.17155712842941284, -0.16494664549827576, -0.15833617746829987, -0.15172570943832397, -0.1451152265071869, -0.138504758477211, -0.1318942904472351, -0.12528382241725922, -0.11867334693670273, -0.11206287145614624, -0.10545240342617035, -0.09884193539619446, -0.09223145991563797, -0.08562098443508148, -0.07901051640510559, -0.0724000483751297, -0.06578957289457321, -0.05917910113930702, -0.05256862938404083, -0.04595815762877464, -0.03934768587350845, -0.032737214118242264, -0.026126742362976074, -0.019516270607709885, -0.012905798852443695, -0.0062953270971775055, 0.00031515955924987793, 0.0069256313145160675, 0.013536103069782257, 0.020146574825048447, 0.026757046580314636, 0.033367518335580826, 0.039977990090847015, 0.046588461846113205, 0.053198933601379395, 0.059809405356645584, 0.06641987711191177, 0.07303035259246826, 0.07964082062244415, 0.08625128865242004, 0.09286176413297653, 0.09947223961353302, 0.10608270764350891, 0.1126931756734848, 0.11930365115404129, 0.12591412663459778, 0.13252459466457367, 0.13913506269454956, 0.14574554562568665, 0.15235601365566254, 0.15896648168563843, 0.16557694971561432, 0.1721874177455902, 0.1787979006767273, 0.18540836870670319, 0.19201883673667908, 0.19862931966781616, 0.20523978769779205, 0.21185025572776794]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 13.0, 17.0, 17.0, 13.0, 17.0, 21.0, 24.0, 23.0, 31.0, 44.0, 40.0, 46.0, 42.0, 40.0, 47.0, 46.0, 38.0, 43.0, 31.0, 43.0, 31.0, 32.0, 31.0, 32.0, 30.0, 36.0, 29.0, 16.0, 16.0, 15.0, 14.0, 10.0, 17.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.18202324211597443, -0.17685925960540771, -0.1716952919960022, -0.16653130948543549, -0.16136732697486877, -0.15620335936546326, -0.15103937685489655, -0.14587539434432983, -0.14071142673492432, -0.1355474442243576, -0.1303834766149521, -0.12521949410438538, -0.12005551159381866, -0.11489153653383255, -0.10972756147384644, -0.10456357896327972, -0.09939959645271301, -0.0942356213927269, -0.08907163888216019, -0.08390766382217407, -0.07874368131160736, -0.07357970625162125, -0.06841573119163513, -0.06325174868106842, -0.058087773621082306, -0.05292379483580589, -0.04775981605052948, -0.042595840990543365, -0.03743186220526695, -0.03226788341999054, -0.027103906497359276, -0.021939929574728012, -0.016775965690612793, -0.011611987836658955, -0.006448009982705116, -0.001284032128751278, 0.0038799457252025604, 0.009043924510478973, 0.014207901433110237, 0.0193718783557415, 0.024535857141017914, 0.029699835926294327, 0.03486381471157074, 0.040027789771556854, 0.04519176855683327, 0.05035574734210968, 0.055519722402095795, 0.06068370118737221, 0.06584767997264862, 0.07101165503263474, 0.07617563754320145, 0.08133961260318756, 0.08650359511375427, 0.09166757017374039, 0.0968315452337265, 0.10199552774429321, 0.10715950280427933, 0.11232347786426544, 0.11748746037483215, 0.12265143543481827, 0.12781541049480438, 0.1329793930053711, 0.1381433755159378, 0.14330734312534332, 0.14847132563591003]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 7.0, 14.0, 16.0, 39.0, 47.0, 73.0, 125.0, 147.0, 255.0, 415.0, 691.0, 1233.0, 2344.0, 4395.0, 8518.0, 18313.0, 43889.0, 120770.0, 321582.0, 323463.0, 121380.0, 44037.0, 18364.0, 8592.0, 4276.0, 2375.0, 1272.0, 700.0, 420.0, 282.0, 170.0, 99.0, 70.0, 51.0, 41.0, 25.0, 12.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.313232421875, -0.303741455078125, -0.29425048828125, -0.284759521484375, -0.2752685546875, -0.265777587890625, -0.25628662109375, -0.246795654296875, -0.2373046875, -0.227813720703125, -0.21832275390625, -0.208831787109375, -0.1993408203125, -0.189849853515625, -0.18035888671875, -0.170867919921875, -0.161376953125, -0.151885986328125, -0.14239501953125, -0.132904052734375, -0.1234130859375, -0.113922119140625, -0.10443115234375, -0.094940185546875, -0.08544921875, -0.075958251953125, -0.06646728515625, -0.056976318359375, -0.0474853515625, -0.037994384765625, -0.02850341796875, -0.019012451171875, -0.009521484375, -3.0517578125e-05, 0.00946044921875, 0.018951416015625, 0.0284423828125, 0.037933349609375, 0.04742431640625, 0.056915283203125, 0.06640625, 0.075897216796875, 0.08538818359375, 0.094879150390625, 0.1043701171875, 0.113861083984375, 0.12335205078125, 0.132843017578125, 0.142333984375, 0.151824951171875, 0.16131591796875, 0.170806884765625, 0.1802978515625, 0.189788818359375, 0.19927978515625, 0.208770751953125, 0.21826171875, 0.227752685546875, 0.23724365234375, 0.246734619140625, 0.2562255859375, 0.265716552734375, 0.27520751953125, 0.284698486328125, 0.294189453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 12.0, 18.0, 12.0, 14.0, 23.0, 33.0, 29.0, 28.0, 34.0, 54.0, 46.0, 44.0, 45.0, 58.0, 48.0, 45.0, 31.0, 43.0, 43.0, 43.0, 30.0, 41.0, 38.0, 20.0, 23.0, 24.0, 14.0, 16.0, 10.0, 13.0, 10.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.320068359375, -0.310882568359375, -0.30169677734375, -0.292510986328125, -0.2833251953125, -0.274139404296875, -0.26495361328125, -0.255767822265625, -0.24658203125, -0.237396240234375, -0.22821044921875, -0.219024658203125, -0.2098388671875, -0.200653076171875, -0.19146728515625, -0.182281494140625, -0.173095703125, -0.163909912109375, -0.15472412109375, -0.145538330078125, -0.1363525390625, -0.127166748046875, -0.11798095703125, -0.108795166015625, -0.099609375, -0.090423583984375, -0.08123779296875, -0.072052001953125, -0.0628662109375, -0.053680419921875, -0.04449462890625, -0.035308837890625, -0.026123046875, -0.016937255859375, -0.00775146484375, 0.001434326171875, 0.0106201171875, 0.019805908203125, 0.02899169921875, 0.038177490234375, 0.04736328125, 0.056549072265625, 0.06573486328125, 0.074920654296875, 0.0841064453125, 0.093292236328125, 0.10247802734375, 0.111663818359375, 0.120849609375, 0.130035400390625, 0.13922119140625, 0.148406982421875, 0.1575927734375, 0.166778564453125, 0.17596435546875, 0.185150146484375, 0.1943359375, 0.203521728515625, 0.21270751953125, 0.221893310546875, 0.2310791015625, 0.240264892578125, 0.24945068359375, 0.258636474609375, 0.267822265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 4.0, 12.0, 13.0, 19.0, 32.0, 53.0, 72.0, 143.0, 206.0, 345.0, 632.0, 1248.0, 2414.0, 5123.0, 12081.0, 32206.0, 103575.0, 352478.0, 369565.0, 110855.0, 33900.0, 12887.0, 5369.0, 2510.0, 1214.0, 662.0, 350.0, 205.0, 132.0, 72.0, 52.0, 38.0, 23.0, 9.0, 12.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34912109375, -0.3370933532714844, -0.32506561279296875, -0.3130378723144531, -0.3010101318359375, -0.2889823913574219, -0.27695465087890625, -0.2649269104003906, -0.252899169921875, -0.24087142944335938, -0.22884368896484375, -0.21681594848632812, -0.2047882080078125, -0.19276046752929688, -0.18073272705078125, -0.16870498657226562, -0.15667724609375, -0.14464950561523438, -0.13262176513671875, -0.12059402465820312, -0.1085662841796875, -0.09653854370117188, -0.08451080322265625, -0.07248306274414062, -0.060455322265625, -0.048427581787109375, -0.03639984130859375, -0.024372100830078125, -0.0123443603515625, -0.000316619873046875, 0.01171112060546875, 0.023738861083984375, 0.0357666015625, 0.047794342041015625, 0.05982208251953125, 0.07184982299804688, 0.0838775634765625, 0.09590530395507812, 0.10793304443359375, 0.11996078491210938, 0.131988525390625, 0.14401626586914062, 0.15604400634765625, 0.16807174682617188, 0.1800994873046875, 0.19212722778320312, 0.20415496826171875, 0.21618270874023438, 0.22821044921875, 0.24023818969726562, 0.25226593017578125, 0.2642936706542969, 0.2763214111328125, 0.2883491516113281, 0.30037689208984375, 0.3124046325683594, 0.324432373046875, 0.3364601135253906, 0.34848785400390625, 0.3605155944824219, 0.3725433349609375, 0.3845710754394531, 0.39659881591796875, 0.4086265563964844, 0.420654296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 11.0, 12.0, 8.0, 22.0, 24.0, 27.0, 28.0, 29.0, 40.0, 50.0, 44.0, 64.0, 69.0, 56.0, 55.0, 62.0, 58.0, 46.0, 48.0, 38.0, 44.0, 31.0, 23.0, 19.0, 21.0, 15.0, 14.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3403472900390625, -0.326690673828125, -0.3130340576171875, -0.29937744140625, -0.2857208251953125, -0.272064208984375, -0.2584075927734375, -0.2447509765625, -0.2310943603515625, -0.217437744140625, -0.2037811279296875, -0.19012451171875, -0.1764678955078125, -0.162811279296875, -0.1491546630859375, -0.135498046875, -0.1218414306640625, -0.108184814453125, -0.0945281982421875, -0.08087158203125, -0.0672149658203125, -0.053558349609375, -0.0399017333984375, -0.0262451171875, -0.0125885009765625, 0.001068115234375, 0.0147247314453125, 0.02838134765625, 0.0420379638671875, 0.055694580078125, 0.0693511962890625, 0.0830078125, 0.0966644287109375, 0.110321044921875, 0.1239776611328125, 0.13763427734375, 0.1512908935546875, 0.164947509765625, 0.1786041259765625, 0.1922607421875, 0.2059173583984375, 0.219573974609375, 0.2332305908203125, 0.24688720703125, 0.2605438232421875, 0.274200439453125, 0.2878570556640625, 0.301513671875, 0.3151702880859375, 0.328826904296875, 0.3424835205078125, 0.35614013671875, 0.3697967529296875, 0.383453369140625, 0.3971099853515625, 0.4107666015625, 0.4244232177734375, 0.438079833984375, 0.4517364501953125, 0.46539306640625, 0.4790496826171875, 0.492706298828125, 0.5063629150390625, 0.52001953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 10.0, 16.0, 22.0, 28.0, 50.0, 83.0, 149.0, 242.0, 368.0, 589.0, 950.0, 1699.0, 2945.0, 5148.0, 9861.0, 19688.0, 42038.0, 95770.0, 201597.0, 337507.0, 177032.0, 80781.0, 35898.0, 16738.0, 8540.0, 4492.0, 2576.0, 1409.0, 912.0, 531.0, 329.0, 194.0, 139.0, 76.0, 49.0, 28.0, 16.0, 22.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04888916015625, -0.04737997055053711, -0.04587078094482422, -0.04436159133911133, -0.04285240173339844, -0.04134321212768555, -0.039834022521972656, -0.038324832916259766, -0.036815643310546875, -0.035306453704833984, -0.033797264099121094, -0.0322880744934082, -0.030778884887695312, -0.029269695281982422, -0.02776050567626953, -0.02625131607055664, -0.02474212646484375, -0.02323293685913086, -0.02172374725341797, -0.020214557647705078, -0.018705368041992188, -0.017196178436279297, -0.015686988830566406, -0.014177799224853516, -0.012668609619140625, -0.011159420013427734, -0.009650230407714844, -0.008141040802001953, -0.0066318511962890625, -0.005122661590576172, -0.0036134719848632812, -0.0021042823791503906, -0.0005950927734375, 0.0009140968322753906, 0.0024232864379882812, 0.003932476043701172, 0.0054416656494140625, 0.006950855255126953, 0.008460044860839844, 0.009969234466552734, 0.011478424072265625, 0.012987613677978516, 0.014496803283691406, 0.016005992889404297, 0.017515182495117188, 0.019024372100830078, 0.02053356170654297, 0.02204275131225586, 0.02355194091796875, 0.02506113052368164, 0.02657032012939453, 0.028079509735107422, 0.029588699340820312, 0.031097888946533203, 0.032607078552246094, 0.034116268157958984, 0.035625457763671875, 0.037134647369384766, 0.038643836975097656, 0.04015302658081055, 0.04166221618652344, 0.04317140579223633, 0.04468059539794922, 0.04618978500366211, 0.047698974609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 10.0, 7.0, 9.0, 5.0, 18.0, 17.0, 17.0, 27.0, 32.0, 48.0, 54.0, 48.0, 79.0, 101.0, 106.0, 59.0, 63.0, 62.0, 46.0, 36.0, 21.0, 29.0, 11.0, 14.0, 15.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3947486877441406e-05, -1.3538636267185211e-05, -1.3129785656929016e-05, -1.2720935046672821e-05, -1.2312084436416626e-05, -1.1903233826160431e-05, -1.1494383215904236e-05, -1.108553260564804e-05, -1.0676681995391846e-05, -1.026783138513565e-05, -9.858980774879456e-06, -9.45013016462326e-06, -9.041279554367065e-06, -8.63242894411087e-06, -8.223578333854675e-06, -7.81472772359848e-06, -7.405877113342285e-06, -6.99702650308609e-06, -6.588175892829895e-06, -6.1793252825737e-06, -5.770474672317505e-06, -5.36162406206131e-06, -4.952773451805115e-06, -4.54392284154892e-06, -4.135072231292725e-06, -3.7262216210365295e-06, -3.3173710107803345e-06, -2.9085204005241394e-06, -2.4996697902679443e-06, -2.0908191800117493e-06, -1.6819685697555542e-06, -1.2731179594993591e-06, -8.642673492431641e-07, -4.55416738986969e-07, -4.6566128730773926e-08, 3.6228448152542114e-07, 7.711350917816162e-07, 1.1799857020378113e-06, 1.5888363122940063e-06, 1.9976869225502014e-06, 2.4065375328063965e-06, 2.8153881430625916e-06, 3.2242387533187866e-06, 3.6330893635749817e-06, 4.041939973831177e-06, 4.450790584087372e-06, 4.859641194343567e-06, 5.268491804599762e-06, 5.677342414855957e-06, 6.086193025112152e-06, 6.495043635368347e-06, 6.903894245624542e-06, 7.312744855880737e-06, 7.721595466136932e-06, 8.130446076393127e-06, 8.539296686649323e-06, 8.948147296905518e-06, 9.356997907161713e-06, 9.765848517417908e-06, 1.0174699127674103e-05, 1.0583549737930298e-05, 1.0992400348186493e-05, 1.1401250958442688e-05, 1.1810101568698883e-05, 1.2218952178955078e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 14.0, 11.0, 18.0, 16.0, 25.0, 49.0, 55.0, 83.0, 99.0, 156.0, 245.0, 304.0, 402.0, 630.0, 977.0, 1780.0, 3246.0, 6305.0, 13750.0, 33486.0, 99604.0, 332824.0, 386416.0, 104243.0, 34855.0, 14110.0, 6433.0, 3367.0, 1786.0, 1089.0, 695.0, 483.0, 293.0, 171.0, 138.0, 99.0, 59.0, 50.0, 53.0, 31.0, 19.0, 17.0, 12.0, 14.0, 12.0, 6.0, 5.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.08127689361572266, -0.07856941223144531, -0.07586193084716797, -0.07315444946289062, -0.07044696807861328, -0.06773948669433594, -0.0650320053100586, -0.06232452392578125, -0.059617042541503906, -0.05690956115722656, -0.05420207977294922, -0.051494598388671875, -0.04878711700439453, -0.04607963562011719, -0.043372154235839844, -0.0406646728515625, -0.037957191467285156, -0.03524971008300781, -0.03254222869873047, -0.029834747314453125, -0.02712726593017578, -0.024419784545898438, -0.021712303161621094, -0.01900482177734375, -0.016297340393066406, -0.013589859008789062, -0.010882377624511719, -0.008174896240234375, -0.005467414855957031, -0.0027599334716796875, -5.245208740234375e-05, 0.002655029296875, 0.005362510681152344, 0.008069992065429688, 0.010777473449707031, 0.013484954833984375, 0.01619243621826172, 0.018899917602539062, 0.021607398986816406, 0.02431488037109375, 0.027022361755371094, 0.029729843139648438, 0.03243732452392578, 0.035144805908203125, 0.03785228729248047, 0.04055976867675781, 0.043267250061035156, 0.0459747314453125, 0.048682212829589844, 0.05138969421386719, 0.05409717559814453, 0.056804656982421875, 0.05951213836669922, 0.06221961975097656, 0.0649271011352539, 0.06763458251953125, 0.0703420639038086, 0.07304954528808594, 0.07575702667236328, 0.07846450805664062, 0.08117198944091797, 0.08387947082519531, 0.08658695220947266, 0.08929443359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 14.0, 20.0, 18.0, 25.0, 39.0, 40.0, 67.0, 56.0, 80.0, 124.0, 105.0, 87.0, 73.0, 50.0, 26.0, 31.0, 22.0, 21.0, 11.0, 5.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04836320877075195, -0.046799659729003906, -0.04523611068725586, -0.04367256164550781, -0.042109012603759766, -0.04054546356201172, -0.03898191452026367, -0.037418365478515625, -0.03585481643676758, -0.03429126739501953, -0.032727718353271484, -0.031164169311523438, -0.02960062026977539, -0.028037071228027344, -0.026473522186279297, -0.02490997314453125, -0.023346424102783203, -0.021782875061035156, -0.02021932601928711, -0.018655776977539062, -0.017092227935791016, -0.015528678894042969, -0.013965129852294922, -0.012401580810546875, -0.010838031768798828, -0.009274482727050781, -0.007710933685302734, -0.0061473846435546875, -0.004583835601806641, -0.0030202865600585938, -0.0014567375183105469, 0.0001068115234375, 0.0016703605651855469, 0.0032339096069335938, 0.004797458648681641, 0.0063610076904296875, 0.007924556732177734, 0.009488105773925781, 0.011051654815673828, 0.012615203857421875, 0.014178752899169922, 0.01574230194091797, 0.017305850982666016, 0.018869400024414062, 0.02043294906616211, 0.021996498107910156, 0.023560047149658203, 0.02512359619140625, 0.026687145233154297, 0.028250694274902344, 0.02981424331665039, 0.03137779235839844, 0.032941341400146484, 0.03450489044189453, 0.03606843948364258, 0.037631988525390625, 0.03919553756713867, 0.04075908660888672, 0.042322635650634766, 0.04388618469238281, 0.04544973373413086, 0.047013282775878906, 0.04857683181762695, 0.050140380859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 16.0, 31.0, 74.0, 119.0, 200.0, 192.0, 148.0, 96.0, 61.0, 34.0, 10.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0467673540115356, -1.007058024406433, -0.9673486351966858, -0.9276392459869385, -0.8879299163818359, -0.8482205271720886, -0.8085111379623413, -0.7688018083572388, -0.7290924191474915, -0.6893830299377441, -0.6496737003326416, -0.6099643111228943, -0.570254921913147, -0.5305455923080444, -0.4908362030982971, -0.4511268436908722, -0.41141748428344727, -0.37170812487602234, -0.3319987654685974, -0.2922893762588501, -0.25258001685142517, -0.21287065744400024, -0.17316128313541412, -0.133451908826828, -0.09374254941940308, -0.05403318256139755, -0.014323815703392029, 0.025385551154613495, 0.06509491801261902, 0.10480427742004395, 0.14451365172863007, 0.1842230260372162, 0.22393250465393066, 0.2636418640613556, 0.3033512234687805, 0.34306061267852783, 0.38276997208595276, 0.4224793314933777, 0.462188720703125, 0.5018980503082275, 0.5416074395179749, 0.5813168287277222, 0.6210261583328247, 0.660735547542572, 0.7004449367523193, 0.7401542663574219, 0.7798636555671692, 0.8195730447769165, 0.859282374382019, 0.8989917635917664, 0.9387010931968689, 0.9784104824066162, 1.0181198120117188, 1.0578291416168213, 1.0975385904312134, 1.137247920036316, 1.176957368850708, 1.2166666984558105, 1.2563761472702026, 1.2960854768753052, 1.3357948064804077, 1.3755042552947998, 1.4152135848999023, 1.4549229145050049, 1.4946322441101074]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 6.0, 6.0, 17.0, 17.0, 18.0, 17.0, 26.0, 22.0, 28.0, 40.0, 24.0, 35.0, 52.0, 41.0, 36.0, 55.0, 50.0, 50.0, 35.0, 40.0, 47.0, 31.0, 34.0, 26.0, 36.0, 30.0, 26.0, 24.0, 14.0, 21.0, 16.0, 13.0, 16.0, 7.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6149052381515503, -0.5975620746612549, -0.5802189111709595, -0.5628758072853088, -0.5455326437950134, -0.528189480304718, -0.5108463168144226, -0.4935031533241272, -0.4761600196361542, -0.45881685614585876, -0.44147372245788574, -0.42413055896759033, -0.4067873954772949, -0.3894442617893219, -0.3721010982990265, -0.35475796461105347, -0.33741480112075806, -0.32007163763046265, -0.3027285039424896, -0.2853853404521942, -0.2680422067642212, -0.2506990432739258, -0.23335587978363037, -0.21601273119449615, -0.19866958260536194, -0.18132643401622772, -0.1639832854270935, -0.1466401219367981, -0.12929697334766388, -0.11195382475852966, -0.09461066871881485, -0.07726751267910004, -0.05992436408996582, -0.042581211775541306, -0.02523805946111679, -0.007894907146692276, 0.009448245167732239, 0.026791393756866455, 0.04413454979658127, 0.06147770583629608, 0.0788208544254303, 0.09616400301456451, 0.11350715905427933, 0.13085031509399414, 0.14819346368312836, 0.16553661227226257, 0.18287977576255798, 0.2002229243516922, 0.21756607294082642, 0.23490922152996063, 0.25225237011909485, 0.26959553360939026, 0.2869386672973633, 0.3042818307876587, 0.3216249942779541, 0.3389681577682495, 0.35631129145622253, 0.37365445494651794, 0.39099758863449097, 0.4083407521247864, 0.4256839156150818, 0.4430270493030548, 0.4603702127933502, 0.47771334648132324, 0.49505650997161865]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 17.0, 18.0, 20.0, 23.0, 41.0, 43.0, 52.0, 61.0, 94.0, 150.0, 178.0, 255.0, 320.0, 482.0, 841.0, 1347.0, 2506.0, 4625.0, 1021404.0, 8392.0, 4050.0, 2072.0, 1191.0, 787.0, 469.0, 280.0, 203.0, 162.0, 98.0, 101.0, 72.0, 47.0, 38.0, 35.0, 29.0, 18.0, 25.0, 9.0, 9.0, 5.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.598320722579956, -0.5776081085205078, -0.5568954944610596, -0.5361828804016113, -0.5154702663421631, -0.49475765228271484, -0.474045068025589, -0.45333245396614075, -0.4326198399066925, -0.41190722584724426, -0.391194611787796, -0.3704819977283478, -0.3497694134712219, -0.3290567994117737, -0.30834418535232544, -0.2876315712928772, -0.26691895723342896, -0.2462063431739807, -0.22549372911453247, -0.20478112995624542, -0.18406851589679718, -0.16335590183734894, -0.1426433026790619, -0.12193068861961365, -0.1012180745601654, -0.08050546050071716, -0.05979285389184952, -0.039080243557691574, -0.01836763322353363, 0.002344980835914612, 0.023057587444782257, 0.0437701940536499, 0.06448280811309814, 0.08519542217254639, 0.10590802878141403, 0.12662063539028168, 0.14733324944972992, 0.16804586350917816, 0.1887584626674652, 0.20947107672691345, 0.2301836907863617, 0.25089630484580994, 0.2716089189052582, 0.2923215329647064, 0.3130341172218323, 0.3337467312812805, 0.35445934534072876, 0.375171959400177, 0.39588457345962524, 0.4165971875190735, 0.43730980157852173, 0.45802241563796997, 0.4787350296974182, 0.49944764375686646, 0.5201602578163147, 0.5408728122711182, 0.5615854263305664, 0.5822980403900146, 0.6030106544494629, 0.6237232685089111, 0.6444358825683594, 0.6651484966278076, 0.6858611106872559, 0.7065737247467041, 0.7272863388061523]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 8.0, 8.0, 17.0, 49.0, 110.0, 287.0, 835.0, 2415.0, 51457048.0, 7208.0, 1436.0, 539.0, 218.0, 74.0, 32.0, 19.0, 2.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.43700122833252, -13.050508499145508, -12.664015769958496, -12.277523040771484, -11.891031265258789, -11.504538536071777, -11.118045806884766, -10.731553077697754, -10.345060348510742, -9.95856761932373, -9.572074890136719, -9.185583114624023, -8.799090385437012, -8.41259765625, -8.026104927062988, -7.639612197875977, -7.253120422363281, -6.8666276931762695, -6.480135440826416, -6.093642711639404, -5.707150459289551, -5.320657730102539, -4.934165000915527, -4.547672271728516, -4.161180019378662, -3.7746875286102295, -3.388195037841797, -3.001702308654785, -2.6152098178863525, -2.22871732711792, -1.8422245979309082, -1.4557321071624756, -1.069239616394043, -0.6827470660209656, -0.2962545156478882, 0.09023809432983398, 0.4767305850982666, 0.8632230758666992, 1.249715805053711, 1.6362082958221436, 2.022700786590576, 2.409193277359009, 2.7956857681274414, 3.182178497314453, 3.5686709880828857, 3.9551634788513184, 4.34165620803833, 4.728148460388184, 5.114641189575195, 5.501133918762207, 5.8876261711120605, 6.274118900299072, 6.660611152648926, 7.0471038818359375, 7.433596611022949, 7.820089340209961, 8.206581115722656, 8.593073844909668, 8.97956657409668, 9.366058349609375, 9.752551078796387, 10.139043807983398, 10.52553653717041, 10.912029266357422, 11.298521995544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 26.0, 31.0, 40.0, 80.0, 113.0, 169.0, 290.0, 456.0, 789.0, 1298.0, 2087.0, 3590.0, 5904.0, 9991.0, 17003.0, 28016.0, 46827.0, 75334.0, 119186.0, 182364.0, 260300.0, 349174.0, 981586.0, 2930900.0, 400247.0, 292167.0, 210462.0, 142143.0, 90403.0, 55916.0, 33896.0, 20592.0, 12346.0, 7159.0, 4241.0, 2559.0, 1474.0, 899.0, 537.0, 319.0, 198.0, 112.0, 74.0, 53.0, 19.0, 21.0, 15.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.27587890625, -0.2675666809082031, -0.25925445556640625, -0.2509422302246094, -0.2426300048828125, -0.23431777954101562, -0.22600555419921875, -0.21769332885742188, -0.209381103515625, -0.20106887817382812, -0.19275665283203125, -0.18444442749023438, -0.1761322021484375, -0.16781997680664062, -0.15950775146484375, -0.15119552612304688, -0.14288330078125, -0.13457107543945312, -0.12625885009765625, -0.11794662475585938, -0.1096343994140625, -0.10132217407226562, -0.09300994873046875, -0.08469772338867188, -0.076385498046875, -0.06807327270507812, -0.05976104736328125, -0.051448822021484375, -0.0431365966796875, -0.034824371337890625, -0.02651214599609375, -0.018199920654296875, -0.0098876953125, -0.001575469970703125, 0.00673675537109375, 0.015048980712890625, 0.0233612060546875, 0.031673431396484375, 0.03998565673828125, 0.048297882080078125, 0.056610107421875, 0.06492233276367188, 0.07323455810546875, 0.08154678344726562, 0.0898590087890625, 0.09817123413085938, 0.10648345947265625, 0.11479568481445312, 0.12310791015625, 0.13142013549804688, 0.13973236083984375, 0.14804458618164062, 0.1563568115234375, 0.16466903686523438, 0.17298126220703125, 0.18129348754882812, 0.189605712890625, 0.19791793823242188, 0.20623016357421875, 0.21454238891601562, 0.2228546142578125, 0.23116683959960938, 0.23947906494140625, 0.24779129028320312, 0.256103515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 8.0, 5.0, 9.0, 11.0, 17.0, 14.0, 20.0, 21.0, 31.0, 16.0, 22.0, 41.0, 24.0, 37.0, 43.0, 46.0, 56.0, 83.0, 560.0, 502.0, 58.0, 42.0, 48.0, 30.0, 36.0, 32.0, 30.0, 29.0, 35.0, 15.0, 17.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.619140625, -2.537261962890625, -2.45538330078125, -2.373504638671875, -2.2916259765625, -2.209747314453125, -2.12786865234375, -2.045989990234375, -1.964111328125, -1.882232666015625, -1.80035400390625, -1.718475341796875, -1.6365966796875, -1.554718017578125, -1.47283935546875, -1.390960693359375, -1.30908203125, -1.227203369140625, -1.14532470703125, -1.063446044921875, -0.9815673828125, -0.899688720703125, -0.81781005859375, -0.735931396484375, -0.654052734375, -0.572174072265625, -0.49029541015625, -0.408416748046875, -0.3265380859375, -0.244659423828125, -0.16278076171875, -0.080902099609375, 0.0009765625, 0.082855224609375, 0.16473388671875, 0.246612548828125, 0.3284912109375, 0.410369873046875, 0.49224853515625, 0.574127197265625, 0.656005859375, 0.737884521484375, 0.81976318359375, 0.901641845703125, 0.9835205078125, 1.065399169921875, 1.14727783203125, 1.229156494140625, 1.31103515625, 1.392913818359375, 1.47479248046875, 1.556671142578125, 1.6385498046875, 1.720428466796875, 1.80230712890625, 1.884185791015625, 1.966064453125, 2.047943115234375, 2.12982177734375, 2.211700439453125, 2.2935791015625, 2.375457763671875, 2.45733642578125, 2.539215087890625, 2.62109375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 9.0, 8.0, 8.0, 23.0, 41.0, 69.0, 105.0, 126.0, 207.0, 404.0, 626.0, 1020.0, 1639.0, 2763.0, 4350.0, 7211.0, 11875.0, 18737.0, 29771.0, 46302.0, 69195.0, 102150.0, 142590.0, 193614.0, 244099.0, 290772.0, 721321.0, 3048997.0, 330798.0, 269988.0, 219103.0, 168145.0, 122947.0, 85462.0, 57096.0, 37135.0, 23672.0, 15004.0, 9398.0, 5662.0, 3393.0, 2095.0, 1357.0, 837.0, 501.0, 319.0, 196.0, 137.0, 62.0, 36.0, 14.0, 18.0, 10.0, 7.0, 5.0, 3.0, 7.0], "bins": [-0.184814453125, -0.17942047119140625, -0.1740264892578125, -0.16863250732421875, -0.163238525390625, -0.15784454345703125, -0.1524505615234375, -0.14705657958984375, -0.14166259765625, -0.13626861572265625, -0.1308746337890625, -0.12548065185546875, -0.120086669921875, -0.11469268798828125, -0.1092987060546875, -0.10390472412109375, -0.0985107421875, -0.09311676025390625, -0.0877227783203125, -0.08232879638671875, -0.076934814453125, -0.07154083251953125, -0.0661468505859375, -0.06075286865234375, -0.05535888671875, -0.04996490478515625, -0.0445709228515625, -0.03917694091796875, -0.033782958984375, -0.02838897705078125, -0.0229949951171875, -0.01760101318359375, -0.01220703125, -0.00681304931640625, -0.0014190673828125, 0.00397491455078125, 0.009368896484375, 0.01476287841796875, 0.0201568603515625, 0.02555084228515625, 0.03094482421875, 0.03633880615234375, 0.0417327880859375, 0.04712677001953125, 0.052520751953125, 0.05791473388671875, 0.0633087158203125, 0.06870269775390625, 0.0740966796875, 0.07949066162109375, 0.0848846435546875, 0.09027862548828125, 0.095672607421875, 0.10106658935546875, 0.1064605712890625, 0.11185455322265625, 0.11724853515625, 0.12264251708984375, 0.1280364990234375, 0.13343048095703125, 0.138824462890625, 0.14421844482421875, 0.1496124267578125, 0.15500640869140625, 0.160400390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 2.0, 4.0, 9.0, 16.0, 9.0, 16.0, 16.0, 20.0, 21.0, 18.0, 17.0, 30.0, 31.0, 38.0, 29.0, 44.0, 31.0, 30.0, 53.0, 484.0, 595.0, 61.0, 48.0, 40.0, 41.0, 36.0, 38.0, 28.0, 33.0, 27.0, 21.0, 19.0, 11.0, 21.0, 24.0, 15.0, 10.0, 3.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98968505859375, -1.9188232421875, -1.84796142578125, -1.777099609375, -1.70623779296875, -1.6353759765625, -1.56451416015625, -1.49365234375, -1.42279052734375, -1.3519287109375, -1.28106689453125, -1.210205078125, -1.13934326171875, -1.0684814453125, -0.99761962890625, -0.9267578125, -0.85589599609375, -0.7850341796875, -0.71417236328125, -0.643310546875, -0.57244873046875, -0.5015869140625, -0.43072509765625, -0.35986328125, -0.28900146484375, -0.2181396484375, -0.14727783203125, -0.076416015625, -0.00555419921875, 0.0653076171875, 0.13616943359375, 0.20703125, 0.27789306640625, 0.3487548828125, 0.41961669921875, 0.490478515625, 0.56134033203125, 0.6322021484375, 0.70306396484375, 0.77392578125, 0.84478759765625, 0.9156494140625, 0.98651123046875, 1.057373046875, 1.12823486328125, 1.1990966796875, 1.26995849609375, 1.3408203125, 1.41168212890625, 1.4825439453125, 1.55340576171875, 1.624267578125, 1.69512939453125, 1.7659912109375, 1.83685302734375, 1.90771484375, 1.97857666015625, 2.0494384765625, 2.12030029296875, 2.191162109375, 2.26202392578125, 2.3328857421875, 2.40374755859375, 2.474609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 17.0, 18.0, 41.0, 55.0, 65.0, 91.0, 136.0, 143.0, 218.0, 301.0, 404.0, 527.0, 759.0, 1052.0, 1574.0, 2616.0, 4539.0, 8963.0, 17606.0, 35698.0, 72037.0, 145264.0, 5531812.0, 276233.0, 93245.0, 47226.0, 23388.0, 11646.0, 6079.0, 3302.0, 2035.0, 1286.0, 855.0, 596.0, 424.0, 285.0, 226.0, 168.0, 125.0, 95.0, 57.0, 51.0, 44.0, 32.0, 19.0, 12.0, 14.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.72900390625, -0.7067108154296875, -0.684417724609375, -0.6621246337890625, -0.63983154296875, -0.6175384521484375, -0.595245361328125, -0.5729522705078125, -0.5506591796875, -0.5283660888671875, -0.506072998046875, -0.4837799072265625, -0.46148681640625, -0.4391937255859375, -0.416900634765625, -0.3946075439453125, -0.372314453125, -0.3500213623046875, -0.327728271484375, -0.3054351806640625, -0.28314208984375, -0.2608489990234375, -0.238555908203125, -0.2162628173828125, -0.1939697265625, -0.1716766357421875, -0.149383544921875, -0.1270904541015625, -0.10479736328125, -0.0825042724609375, -0.060211181640625, -0.0379180908203125, -0.015625, 0.0066680908203125, 0.028961181640625, 0.0512542724609375, 0.07354736328125, 0.0958404541015625, 0.118133544921875, 0.1404266357421875, 0.1627197265625, 0.1850128173828125, 0.207305908203125, 0.2295989990234375, 0.25189208984375, 0.2741851806640625, 0.296478271484375, 0.3187713623046875, 0.341064453125, 0.3633575439453125, 0.385650634765625, 0.4079437255859375, 0.43023681640625, 0.4525299072265625, 0.474822998046875, 0.4971160888671875, 0.5194091796875, 0.5417022705078125, 0.563995361328125, 0.5862884521484375, 0.60858154296875, 0.6308746337890625, 0.653167724609375, 0.6754608154296875, 0.69775390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 13.0, 9.0, 13.0, 25.0, 36.0, 39.0, 38.0, 37.0, 44.0, 42.0, 39.0, 42.0, 98.0, 1012.0, 62.0, 58.0, 44.0, 48.0, 49.0, 40.0, 30.0, 25.0, 19.0, 29.0, 24.0, 21.0, 16.0, 7.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -3.0069580078125, -2.914306640625, -2.8216552734375, -2.72900390625, -2.6363525390625, -2.543701171875, -2.4510498046875, -2.3583984375, -2.2657470703125, -2.173095703125, -2.0804443359375, -1.98779296875, -1.8951416015625, -1.802490234375, -1.7098388671875, -1.6171875, -1.5245361328125, -1.431884765625, -1.3392333984375, -1.24658203125, -1.1539306640625, -1.061279296875, -0.9686279296875, -0.8759765625, -0.7833251953125, -0.690673828125, -0.5980224609375, -0.50537109375, -0.4127197265625, -0.320068359375, -0.2274169921875, -0.134765625, -0.0421142578125, 0.050537109375, 0.1431884765625, 0.23583984375, 0.3284912109375, 0.421142578125, 0.5137939453125, 0.6064453125, 0.6990966796875, 0.791748046875, 0.8843994140625, 0.97705078125, 1.0697021484375, 1.162353515625, 1.2550048828125, 1.34765625, 1.4403076171875, 1.532958984375, 1.6256103515625, 1.71826171875, 1.8109130859375, 1.903564453125, 1.9962158203125, 2.0888671875, 2.1815185546875, 2.274169921875, 2.3668212890625, 2.45947265625, 2.5521240234375, 2.644775390625, 2.7374267578125, 2.830078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 15.0, 19.0, 35.0, 80.0, 170.0, 284.0, 210.0, 100.0, 49.0, 23.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.863334655761719, -15.454010009765625, -15.044686317443848, -14.635361671447754, -14.22603702545166, -13.816713333129883, -13.407388687133789, -12.998064041137695, -12.588739395141602, -12.179414749145508, -11.77009105682373, -11.360766410827637, -10.951441764831543, -10.542118072509766, -10.132793426513672, -9.723468780517578, -9.3141450881958, -8.904820442199707, -8.49549674987793, -8.086172103881836, -7.676847457885742, -7.267523288726807, -6.858199119567871, -6.448874473571777, -6.039550304412842, -5.630226135253906, -5.2209014892578125, -4.811577320098877, -4.402253150939941, -3.9929285049438477, -3.583604335784912, -3.1742799282073975, -2.764955520629883, -2.355631113052368, -1.946306824684143, -1.536982536315918, -1.1276581287384033, -0.7183337211608887, -0.3090095520019531, 0.10031485557556152, 0.5096392631530762, 0.918963611125946, 1.328287959098816, 1.737612247467041, 2.1469366550445557, 2.5562610626220703, 2.965585231781006, 3.3749096393585205, 3.784234046936035, 4.193558216094971, 4.6028828620910645, 5.01220703125, 5.421531677246094, 5.830855846405029, 6.240180015563965, 6.649504661560059, 7.058828830718994, 7.46815299987793, 7.877477645874023, 8.286802291870117, 8.696125984191895, 9.105450630187988, 9.514774322509766, 9.92409896850586, 10.333423614501953]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 0.0, 4.0, 6.0, 7.0, 12.0, 8.0, 11.0, 12.0, 20.0, 20.0, 33.0, 28.0, 33.0, 34.0, 43.0, 53.0, 60.0, 68.0, 85.0, 49.0, 65.0, 58.0, 52.0, 37.0, 26.0, 27.0, 22.0, 22.0, 15.0, 14.0, 9.0, 12.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0], "bins": [-10.555952072143555, -10.27237606048584, -9.988801002502441, -9.705224990844727, -9.421649932861328, -9.138073921203613, -8.854498863220215, -8.5709228515625, -8.287347793579102, -8.003771781921387, -7.720196723937988, -7.436621189117432, -7.153045654296875, -6.86946964263916, -6.5858941078186035, -6.302318572998047, -6.018742561340332, -5.735167026519775, -5.451591491699219, -5.168015956878662, -4.8844404220581055, -4.600864410400391, -4.317288875579834, -4.033713340759277, -3.7501378059387207, -3.466562271118164, -3.1829867362976074, -2.8994109630584717, -2.615835428237915, -2.3322598934173584, -2.0486841201782227, -1.765108585357666, -1.4815325736999512, -1.1979570388793945, -0.9143813848495483, -0.6308057904243469, -0.3472301959991455, -0.06365466117858887, 0.21992099285125732, 0.5034966468811035, 0.7870721817016602, 1.0706477165222168, 1.354223370552063, 1.6377990245819092, 1.9213745594024658, 2.2049500942230225, 2.488525867462158, 2.772101402282715, 3.0556769371032715, 3.339252471923828, 3.6228280067443848, 3.9064037799835205, 4.189979553222656, 4.473554611206055, 4.7571306228637695, 5.040706157684326, 5.324281692504883, 5.6078572273254395, 5.891432762145996, 6.175008296966553, 6.458583831787109, 6.742159843444824, 7.025735378265381, 7.3093109130859375, 7.592886447906494]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 3.0, 12.0, 6.0, 16.0, 10.0, 28.0, 50.0, 53.0, 93.0, 107.0, 169.0, 271.0, 530.0, 845.0, 1435.0, 2789.0, 5394.0, 12519.0, 39522.0, 3574427.0, 498296.0, 34967.0, 11670.0, 5179.0, 2553.0, 1339.0, 762.0, 444.0, 289.0, 173.0, 94.0, 73.0, 41.0, 41.0, 21.0, 15.0, 12.0, 7.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07900810241699219, -0.07653427124023438, -0.07406044006347656, -0.07158660888671875, -0.06911277770996094, -0.06663894653320312, -0.06416511535644531, -0.0616912841796875, -0.05921745300292969, -0.056743621826171875, -0.05426979064941406, -0.05179595947265625, -0.04932212829589844, -0.046848297119140625, -0.04437446594238281, -0.041900634765625, -0.03942680358886719, -0.036952972412109375, -0.03447914123535156, -0.03200531005859375, -0.029531478881835938, -0.027057647705078125, -0.024583816528320312, -0.0221099853515625, -0.019636154174804688, -0.017162322998046875, -0.014688491821289062, -0.01221466064453125, -0.009740829467773438, -0.007266998291015625, -0.0047931671142578125, -0.0023193359375, 0.0001544952392578125, 0.002628326416015625, 0.0051021575927734375, 0.00757598876953125, 0.010049819946289062, 0.012523651123046875, 0.014997482299804688, 0.0174713134765625, 0.019945144653320312, 0.022418975830078125, 0.024892807006835938, 0.02736663818359375, 0.029840469360351562, 0.032314300537109375, 0.03478813171386719, 0.037261962890625, 0.03973579406738281, 0.042209625244140625, 0.04468345642089844, 0.04715728759765625, 0.04963111877441406, 0.052104949951171875, 0.05457878112792969, 0.0570526123046875, 0.05952644348144531, 0.062000274658203125, 0.06447410583496094, 0.06694793701171875, 0.06942176818847656, 0.07189559936523438, 0.07436943054199219, 0.07684326171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 5.0, 5.0, 9.0, 4.0, 7.0, 9.0, 11.0, 18.0, 19.0, 30.0, 63.0, 439.0, 168.0, 52.0, 30.0, 17.0, 8.0, 10.0, 13.0, 12.0, 6.0, 3.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0225067138671875, -0.021802902221679688, -0.021099090576171875, -0.020395278930664062, -0.01969146728515625, -0.018987655639648438, -0.018283843994140625, -0.017580032348632812, -0.016876220703125, -0.016172409057617188, -0.015468597412109375, -0.014764785766601562, -0.01406097412109375, -0.013357162475585938, -0.012653350830078125, -0.011949539184570312, -0.0112457275390625, -0.010541915893554688, -0.009838104248046875, -0.009134292602539062, -0.00843048095703125, -0.0077266693115234375, -0.007022857666015625, -0.0063190460205078125, -0.005615234375, -0.0049114227294921875, -0.004207611083984375, -0.0035037994384765625, -0.00279998779296875, -0.0020961761474609375, -0.001392364501953125, -0.0006885528564453125, 1.52587890625e-05, 0.0007190704345703125, 0.001422882080078125, 0.0021266937255859375, 0.00283050537109375, 0.0035343170166015625, 0.004238128662109375, 0.0049419403076171875, 0.005645751953125, 0.0063495635986328125, 0.007053375244140625, 0.0077571868896484375, 0.00846099853515625, 0.009164810180664062, 0.009868621826171875, 0.010572433471679688, 0.0112762451171875, 0.011980056762695312, 0.012683868408203125, 0.013387680053710938, 0.01409149169921875, 0.014795303344726562, 0.015499114990234375, 0.016202926635742188, 0.01690673828125, 0.017610549926757812, 0.018314361572265625, 0.019018173217773438, 0.01972198486328125, 0.020425796508789062, 0.021129608154296875, 0.021833419799804688, 0.0225372314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 15.0, 15.0, 19.0, 36.0, 63.0, 72.0, 158.0, 327.0, 636.0, 1399.0, 3245.0, 8679.0, 25848.0, 100798.0, 696303.0, 3055694.0, 229680.0, 48530.0, 14202.0, 4795.0, 1952.0, 867.0, 400.0, 219.0, 93.0, 61.0, 38.0, 28.0, 14.0, 16.0, 8.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.055891990661621094, -0.05404472351074219, -0.05219745635986328, -0.050350189208984375, -0.04850292205810547, -0.04665565490722656, -0.044808387756347656, -0.04296112060546875, -0.041113853454589844, -0.03926658630371094, -0.03741931915283203, -0.035572052001953125, -0.03372478485107422, -0.03187751770019531, -0.030030250549316406, -0.0281829833984375, -0.026335716247558594, -0.024488449096679688, -0.02264118194580078, -0.020793914794921875, -0.01894664764404297, -0.017099380493164062, -0.015252113342285156, -0.01340484619140625, -0.011557579040527344, -0.009710311889648438, -0.007863044738769531, -0.006015777587890625, -0.004168510437011719, -0.0023212432861328125, -0.00047397613525390625, 0.001373291015625, 0.0032205581665039062, 0.0050678253173828125, 0.006915092468261719, 0.008762359619140625, 0.010609626770019531, 0.012456893920898438, 0.014304161071777344, 0.01615142822265625, 0.017998695373535156, 0.019845962524414062, 0.02169322967529297, 0.023540496826171875, 0.02538776397705078, 0.027235031127929688, 0.029082298278808594, 0.0309295654296875, 0.032776832580566406, 0.03462409973144531, 0.03647136688232422, 0.038318634033203125, 0.04016590118408203, 0.04201316833496094, 0.043860435485839844, 0.04570770263671875, 0.047554969787597656, 0.04940223693847656, 0.05124950408935547, 0.053096771240234375, 0.05494403839111328, 0.05679130554199219, 0.058638572692871094, 0.06048583984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 10.0, 6.0, 6.0, 19.0, 16.0, 24.0, 16.0, 22.0, 33.0, 48.0, 68.0, 91.0, 91.0, 174.0, 253.0, 498.0, 1151.0, 672.0, 266.0, 148.0, 104.0, 76.0, 56.0, 45.0, 38.0, 24.0, 25.0, 18.0, 13.0, 12.0, 7.0, 5.0, 2.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.0283660888671875, -0.02761244773864746, -0.026858806610107422, -0.026105165481567383, -0.025351524353027344, -0.024597883224487305, -0.023844242095947266, -0.023090600967407227, -0.022336959838867188, -0.02158331871032715, -0.02082967758178711, -0.02007603645324707, -0.01932239532470703, -0.018568754196166992, -0.017815113067626953, -0.017061471939086914, -0.016307830810546875, -0.015554189682006836, -0.014800548553466797, -0.014046907424926758, -0.013293266296386719, -0.01253962516784668, -0.01178598403930664, -0.011032342910766602, -0.010278701782226562, -0.009525060653686523, -0.008771419525146484, -0.008017778396606445, -0.007264137268066406, -0.006510496139526367, -0.005756855010986328, -0.005003213882446289, -0.00424957275390625, -0.003495931625366211, -0.002742290496826172, -0.001988649368286133, -0.0012350082397460938, -0.0004813671112060547, 0.0002722740173339844, 0.0010259151458740234, 0.0017795562744140625, 0.0025331974029541016, 0.0032868385314941406, 0.00404047966003418, 0.004794120788574219, 0.005547761917114258, 0.006301403045654297, 0.007055044174194336, 0.007808685302734375, 0.008562326431274414, 0.009315967559814453, 0.010069608688354492, 0.010823249816894531, 0.01157689094543457, 0.01233053207397461, 0.013084173202514648, 0.013837814331054688, 0.014591455459594727, 0.015345096588134766, 0.016098737716674805, 0.016852378845214844, 0.017606019973754883, 0.018359661102294922, 0.01911330223083496, 0.019866943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 14.0, 47.0, 151.0, 350.0, 310.0, 100.0, 22.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3096752166748047, -0.2989852726459503, -0.28829532861709595, -0.27760541439056396, -0.2669154703617096, -0.2562255263328552, -0.24553558230400085, -0.23484563827514648, -0.2241557091474533, -0.21346576511859894, -0.20277583599090576, -0.1920858919620514, -0.18139594793319702, -0.17070601880550385, -0.16001607477664948, -0.1493261456489563, -0.13863620162010193, -0.12794625759124756, -0.11725632846355438, -0.10656638443470001, -0.09587644785642624, -0.08518651127815247, -0.0744965672492981, -0.06380663067102432, -0.05311669409275055, -0.042426757514476776, -0.031736817210912704, -0.021046876907348633, -0.01035694032907486, 0.0003329962491989136, 0.011022940278053284, 0.021712876856327057, 0.03240281343460083, 0.0430927500128746, 0.053782690316438675, 0.06447263062000275, 0.07516256719827652, 0.08585250377655029, 0.09654244780540466, 0.10723238438367844, 0.11792232096195221, 0.12861226499080658, 0.13930219411849976, 0.14999213814735413, 0.1606820821762085, 0.17137201130390167, 0.18206195533275604, 0.19275188446044922, 0.2034418284893036, 0.21413177251815796, 0.22482170164585114, 0.2355116456747055, 0.24620157480239868, 0.25689151883125305, 0.2675814628601074, 0.2782714068889618, 0.28896135091781616, 0.29965129494667053, 0.3103412389755249, 0.3210311532020569, 0.33172109723091125, 0.3424110412597656, 0.35310098528862, 0.36379092931747437, 0.37448084354400635]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 12.0, 22.0, 30.0, 30.0, 32.0, 37.0, 36.0, 37.0, 61.0, 77.0, 62.0, 86.0, 66.0, 65.0, 63.0, 45.0, 51.0, 41.0, 28.0, 21.0, 21.0, 18.0, 7.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12411165237426758, -0.11969789862632751, -0.11528414487838745, -0.11087039113044739, -0.10645663738250732, -0.10204288363456726, -0.0976291373372078, -0.09321538358926773, -0.08880162984132767, -0.0843878760933876, -0.07997412234544754, -0.07556036859750748, -0.07114662230014801, -0.06673286855220795, -0.06231911480426788, -0.05790536105632782, -0.053491607308387756, -0.04907785356044769, -0.04466409981250763, -0.040250349789857864, -0.0358365960419178, -0.03142284229397774, -0.027009090408682823, -0.02259533852338791, -0.018181584775447845, -0.013767831958830357, -0.009354079142212868, -0.004940326325595379, -0.00052657350897789, 0.0038871802389621735, 0.008300932124257088, 0.012714684009552002, 0.017128437757492065, 0.02154219150543213, 0.025955943390727043, 0.030369695276021957, 0.03478344902396202, 0.039197202771902084, 0.04361095279455185, 0.04802470654249191, 0.052438460290431976, 0.05685221403837204, 0.0612659677863121, 0.06567972153425217, 0.07009346783161163, 0.0745072215795517, 0.07892097532749176, 0.08333472907543182, 0.08774848282337189, 0.09216223657131195, 0.09657599031925201, 0.10098974406719208, 0.10540349781513214, 0.1098172515630722, 0.11423099786043167, 0.11864475160837173, 0.1230585053563118, 0.12747225165367126, 0.13188600540161133, 0.1362997591495514, 0.14071351289749146, 0.14512726664543152, 0.14954102039337158, 0.15395477414131165, 0.1583685278892517]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 10.0, 17.0, 23.0, 43.0, 38.0, 65.0, 78.0, 114.0, 181.0, 222.0, 352.0, 509.0, 640.0, 958.0, 1420.0, 2085.0, 3103.0, 4908.0, 7685.0, 13055.0, 23888.0, 56305.0, 718165.0, 134916.0, 34425.0, 17270.0, 9911.0, 6130.0, 3800.0, 2560.0, 1687.0, 1258.0, 808.0, 541.0, 386.0, 278.0, 217.0, 146.0, 104.0, 70.0, 50.0, 30.0, 24.0, 24.0, 17.0, 11.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0806884765625, -0.07822418212890625, -0.0757598876953125, -0.07329559326171875, -0.070831298828125, -0.06836700439453125, -0.0659027099609375, -0.06343841552734375, -0.06097412109375, -0.05850982666015625, -0.0560455322265625, -0.05358123779296875, -0.051116943359375, -0.04865264892578125, -0.0461883544921875, -0.04372406005859375, -0.041259765625, -0.03879547119140625, -0.0363311767578125, -0.03386688232421875, -0.031402587890625, -0.02893829345703125, -0.0264739990234375, -0.02400970458984375, -0.02154541015625, -0.01908111572265625, -0.0166168212890625, -0.01415252685546875, -0.011688232421875, -0.00922393798828125, -0.0067596435546875, -0.00429534912109375, -0.0018310546875, 0.00063323974609375, 0.0030975341796875, 0.00556182861328125, 0.008026123046875, 0.01049041748046875, 0.0129547119140625, 0.01541900634765625, 0.01788330078125, 0.02034759521484375, 0.0228118896484375, 0.02527618408203125, 0.027740478515625, 0.03020477294921875, 0.0326690673828125, 0.03513336181640625, 0.03759765625, 0.04006195068359375, 0.0425262451171875, 0.04499053955078125, 0.047454833984375, 0.04991912841796875, 0.0523834228515625, 0.05484771728515625, 0.05731201171875, 0.05977630615234375, 0.0622406005859375, 0.06470489501953125, 0.067169189453125, 0.06963348388671875, 0.0720977783203125, 0.07456207275390625, 0.0770263671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 14.0, 8.0, 21.0, 27.0, 49.0, 179.0, 395.0, 88.0, 35.0, 27.0, 17.0, 8.0, 10.0, 12.0, 7.0, 8.0, 4.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.023895263671875, -0.023179292678833008, -0.022463321685791016, -0.021747350692749023, -0.02103137969970703, -0.02031540870666504, -0.019599437713623047, -0.018883466720581055, -0.018167495727539062, -0.01745152473449707, -0.016735553741455078, -0.016019582748413086, -0.015303611755371094, -0.014587640762329102, -0.01387166976928711, -0.013155698776245117, -0.012439727783203125, -0.011723756790161133, -0.01100778579711914, -0.010291814804077148, -0.009575843811035156, -0.008859872817993164, -0.008143901824951172, -0.00742793083190918, -0.0067119598388671875, -0.005995988845825195, -0.005280017852783203, -0.004564046859741211, -0.0038480758666992188, -0.0031321048736572266, -0.0024161338806152344, -0.0017001628875732422, -0.00098419189453125, -0.0002682209014892578, 0.0004477500915527344, 0.0011637210845947266, 0.0018796920776367188, 0.002595663070678711, 0.003311634063720703, 0.004027605056762695, 0.0047435760498046875, 0.00545954704284668, 0.006175518035888672, 0.006891489028930664, 0.007607460021972656, 0.008323431015014648, 0.00903940200805664, 0.009755373001098633, 0.010471343994140625, 0.011187314987182617, 0.01190328598022461, 0.012619256973266602, 0.013335227966308594, 0.014051198959350586, 0.014767169952392578, 0.01548314094543457, 0.016199111938476562, 0.016915082931518555, 0.017631053924560547, 0.01834702491760254, 0.01906299591064453, 0.019778966903686523, 0.020494937896728516, 0.021210908889770508, 0.0219268798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 10.0, 6.0, 15.0, 13.0, 32.0, 41.0, 53.0, 74.0, 127.0, 166.0, 299.0, 566.0, 1166.0, 2743.0, 6846.0, 19184.0, 62834.0, 245335.0, 491939.0, 152666.0, 41298.0, 13608.0, 5198.0, 2133.0, 978.0, 484.0, 251.0, 138.0, 107.0, 69.0, 48.0, 40.0, 23.0, 18.0, 18.0, 7.0, 13.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06565380096435547, -0.06355857849121094, -0.061463356018066406, -0.059368133544921875, -0.057272911071777344, -0.05517768859863281, -0.05308246612548828, -0.05098724365234375, -0.04889202117919922, -0.04679679870605469, -0.044701576232910156, -0.042606353759765625, -0.040511131286621094, -0.03841590881347656, -0.03632068634033203, -0.0342254638671875, -0.03213024139404297, -0.030035018920898438, -0.027939796447753906, -0.025844573974609375, -0.023749351501464844, -0.021654129028320312, -0.01955890655517578, -0.01746368408203125, -0.015368461608886719, -0.013273239135742188, -0.011178016662597656, -0.009082794189453125, -0.006987571716308594, -0.0048923492431640625, -0.0027971267700195312, -0.000701904296875, 0.0013933181762695312, 0.0034885406494140625, 0.005583763122558594, 0.007678985595703125, 0.009774208068847656, 0.011869430541992188, 0.013964653015136719, 0.01605987548828125, 0.01815509796142578, 0.020250320434570312, 0.022345542907714844, 0.024440765380859375, 0.026535987854003906, 0.028631210327148438, 0.03072643280029297, 0.0328216552734375, 0.03491687774658203, 0.03701210021972656, 0.039107322692871094, 0.041202545166015625, 0.043297767639160156, 0.04539299011230469, 0.04748821258544922, 0.04958343505859375, 0.05167865753173828, 0.05377388000488281, 0.055869102478027344, 0.057964324951171875, 0.060059547424316406, 0.06215476989746094, 0.06424999237060547, 0.06634521484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 7.0, 9.0, 14.0, 20.0, 19.0, 31.0, 28.0, 43.0, 41.0, 36.0, 43.0, 51.0, 44.0, 48.0, 52.0, 58.0, 52.0, 41.0, 40.0, 39.0, 29.0, 39.0, 32.0, 19.0, 26.0, 20.0, 20.0, 19.0, 11.0, 13.0, 11.0, 6.0, 10.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10394287109375, -0.1006765365600586, -0.09741020202636719, -0.09414386749267578, -0.09087753295898438, -0.08761119842529297, -0.08434486389160156, -0.08107852935791016, -0.07781219482421875, -0.07454586029052734, -0.07127952575683594, -0.06801319122314453, -0.06474685668945312, -0.06148052215576172, -0.05821418762207031, -0.054947853088378906, -0.0516815185546875, -0.048415184020996094, -0.04514884948730469, -0.04188251495361328, -0.038616180419921875, -0.03534984588623047, -0.03208351135253906, -0.028817176818847656, -0.02555084228515625, -0.022284507751464844, -0.019018173217773438, -0.01575183868408203, -0.012485504150390625, -0.009219169616699219, -0.0059528350830078125, -0.0026865005493164062, 0.000579833984375, 0.0038461685180664062, 0.0071125030517578125, 0.010378837585449219, 0.013645172119140625, 0.01691150665283203, 0.020177841186523438, 0.023444175720214844, 0.02671051025390625, 0.029976844787597656, 0.03324317932128906, 0.03650951385498047, 0.039775848388671875, 0.04304218292236328, 0.04630851745605469, 0.049574851989746094, 0.0528411865234375, 0.056107521057128906, 0.05937385559082031, 0.06264019012451172, 0.06590652465820312, 0.06917285919189453, 0.07243919372558594, 0.07570552825927734, 0.07897186279296875, 0.08223819732666016, 0.08550453186035156, 0.08877086639404297, 0.09203720092773438, 0.09530353546142578, 0.09856986999511719, 0.1018362045288086, 0.1051025390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 10.0, 13.0, 14.0, 28.0, 30.0, 38.0, 59.0, 82.0, 119.0, 188.0, 274.0, 412.0, 659.0, 1197.0, 2343.0, 5048.0, 13056.0, 49009.0, 410631.0, 483938.0, 55844.0, 14437.0, 5299.0, 2516.0, 1275.0, 732.0, 462.0, 275.0, 171.0, 111.0, 76.0, 71.0, 33.0, 37.0, 7.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06402587890625, -0.062198638916015625, -0.06037139892578125, -0.058544158935546875, -0.0567169189453125, -0.054889678955078125, -0.05306243896484375, -0.051235198974609375, -0.049407958984375, -0.047580718994140625, -0.04575347900390625, -0.043926239013671875, -0.0420989990234375, -0.040271759033203125, -0.03844451904296875, -0.036617279052734375, -0.0347900390625, -0.032962799072265625, -0.03113555908203125, -0.029308319091796875, -0.0274810791015625, -0.025653839111328125, -0.02382659912109375, -0.021999359130859375, -0.020172119140625, -0.018344879150390625, -0.01651763916015625, -0.014690399169921875, -0.0128631591796875, -0.011035919189453125, -0.00920867919921875, -0.007381439208984375, -0.00555419921875, -0.003726959228515625, -0.00189971923828125, -7.2479248046875e-05, 0.0017547607421875, 0.003582000732421875, 0.00540924072265625, 0.007236480712890625, 0.009063720703125, 0.010890960693359375, 0.01271820068359375, 0.014545440673828125, 0.0163726806640625, 0.018199920654296875, 0.02002716064453125, 0.021854400634765625, 0.023681640625, 0.025508880615234375, 0.02733612060546875, 0.029163360595703125, 0.0309906005859375, 0.032817840576171875, 0.03464508056640625, 0.036472320556640625, 0.038299560546875, 0.040126800537109375, 0.04195404052734375, 0.043781280517578125, 0.0456085205078125, 0.047435760498046875, 0.04926300048828125, 0.051090240478515625, 0.05291748046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 2.0, 8.0, 9.0, 17.0, 12.0, 20.0, 30.0, 17.0, 30.0, 40.0, 47.0, 58.0, 69.0, 64.0, 69.0, 66.0, 78.0, 76.0, 53.0, 27.0, 34.0, 34.0, 21.0, 21.0, 19.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6716461181640625e-05, -3.569386899471283e-05, -3.4671276807785034e-05, -3.364868462085724e-05, -3.262609243392944e-05, -3.160350024700165e-05, -3.058090806007385e-05, -2.9558315873146057e-05, -2.8535723686218262e-05, -2.7513131499290466e-05, -2.649053931236267e-05, -2.5467947125434875e-05, -2.444535493850708e-05, -2.3422762751579285e-05, -2.240017056465149e-05, -2.1377578377723694e-05, -2.03549861907959e-05, -1.9332394003868103e-05, -1.8309801816940308e-05, -1.7287209630012512e-05, -1.6264617443084717e-05, -1.5242025256156921e-05, -1.4219433069229126e-05, -1.319684088230133e-05, -1.2174248695373535e-05, -1.115165650844574e-05, -1.0129064321517944e-05, -9.106472134590149e-06, -8.083879947662354e-06, -7.061287760734558e-06, -6.038695573806763e-06, -5.016103386878967e-06, -3.993511199951172e-06, -2.9709190130233765e-06, -1.948326826095581e-06, -9.257346391677856e-07, 9.685754776000977e-08, 1.1194497346878052e-06, 2.1420419216156006e-06, 3.164634108543396e-06, 4.187226295471191e-06, 5.209818482398987e-06, 6.232410669326782e-06, 7.255002856254578e-06, 8.277595043182373e-06, 9.300187230110168e-06, 1.0322779417037964e-05, 1.134537160396576e-05, 1.2367963790893555e-05, 1.339055597782135e-05, 1.4413148164749146e-05, 1.543574035167694e-05, 1.6458332538604736e-05, 1.7480924725532532e-05, 1.8503516912460327e-05, 1.9526109099388123e-05, 2.0548701286315918e-05, 2.1571293473243713e-05, 2.259388566017151e-05, 2.3616477847099304e-05, 2.46390700340271e-05, 2.5661662220954895e-05, 2.668425440788269e-05, 2.7706846594810486e-05, 2.872943878173828e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 26.0, 29.0, 44.0, 64.0, 112.0, 222.0, 371.0, 803.0, 1736.0, 4696.0, 17187.0, 112636.0, 727424.0, 152853.0, 20949.0, 5502.0, 2009.0, 856.0, 412.0, 210.0, 123.0, 83.0, 52.0, 41.0, 16.0, 15.0, 15.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055389404296875, -0.053304195404052734, -0.05121898651123047, -0.0491337776184082, -0.04704856872558594, -0.04496335983276367, -0.042878150939941406, -0.04079294204711914, -0.038707733154296875, -0.03662252426147461, -0.034537315368652344, -0.03245210647583008, -0.030366897583007812, -0.028281688690185547, -0.02619647979736328, -0.024111270904541016, -0.02202606201171875, -0.019940853118896484, -0.01785564422607422, -0.015770435333251953, -0.013685226440429688, -0.011600017547607422, -0.009514808654785156, -0.007429599761962891, -0.005344390869140625, -0.0032591819763183594, -0.0011739730834960938, 0.0009112358093261719, 0.0029964447021484375, 0.005081653594970703, 0.007166862487792969, 0.009252071380615234, 0.0113372802734375, 0.013422489166259766, 0.015507698059082031, 0.017592906951904297, 0.019678115844726562, 0.021763324737548828, 0.023848533630371094, 0.02593374252319336, 0.028018951416015625, 0.03010416030883789, 0.032189369201660156, 0.03427457809448242, 0.03635978698730469, 0.03844499588012695, 0.04053020477294922, 0.042615413665771484, 0.04470062255859375, 0.046785831451416016, 0.04887104034423828, 0.05095624923706055, 0.05304145812988281, 0.05512666702270508, 0.057211875915527344, 0.05929708480834961, 0.061382293701171875, 0.06346750259399414, 0.0655527114868164, 0.06763792037963867, 0.06972312927246094, 0.0718083381652832, 0.07389354705810547, 0.07597875595092773, 0.07806396484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 10.0, 6.0, 7.0, 21.0, 20.0, 22.0, 32.0, 40.0, 48.0, 50.0, 56.0, 77.0, 66.0, 79.0, 77.0, 66.0, 65.0, 42.0, 44.0, 31.0, 24.0, 23.0, 17.0, 12.0, 3.0, 7.0, 12.0, 5.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032379150390625, -0.031101703643798828, -0.029824256896972656, -0.028546810150146484, -0.027269363403320312, -0.02599191665649414, -0.02471446990966797, -0.023437023162841797, -0.022159576416015625, -0.020882129669189453, -0.01960468292236328, -0.01832723617553711, -0.017049789428710938, -0.015772342681884766, -0.014494895935058594, -0.013217449188232422, -0.01194000244140625, -0.010662555694580078, -0.009385108947753906, -0.008107662200927734, -0.0068302154541015625, -0.005552768707275391, -0.004275321960449219, -0.002997875213623047, -0.001720428466796875, -0.0004429817199707031, 0.0008344650268554688, 0.0021119117736816406, 0.0033893585205078125, 0.004666805267333984, 0.005944252014160156, 0.007221698760986328, 0.0084991455078125, 0.009776592254638672, 0.011054039001464844, 0.012331485748291016, 0.013608932495117188, 0.01488637924194336, 0.01616382598876953, 0.017441272735595703, 0.018718719482421875, 0.019996166229248047, 0.02127361297607422, 0.02255105972290039, 0.023828506469726562, 0.025105953216552734, 0.026383399963378906, 0.027660846710205078, 0.02893829345703125, 0.030215740203857422, 0.031493186950683594, 0.032770633697509766, 0.03404808044433594, 0.03532552719116211, 0.03660297393798828, 0.03788042068481445, 0.039157867431640625, 0.0404353141784668, 0.04171276092529297, 0.04299020767211914, 0.04426765441894531, 0.045545101165771484, 0.046822547912597656, 0.04809999465942383, 0.04937744140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 16.0, 15.0, 30.0, 75.0, 153.0, 248.0, 213.0, 124.0, 55.0, 28.0, 15.0, 11.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48074230551719666, -0.4563523232936859, -0.4319623112678528, -0.40757232904434204, -0.3831823468208313, -0.35879236459732056, -0.3344023525714874, -0.3100123703479767, -0.28562235832214355, -0.2612323760986328, -0.23684237897396088, -0.21245238184928894, -0.1880623996257782, -0.16367240250110626, -0.13928240537643433, -0.11489242315292358, -0.09050244092941284, -0.0661124512553215, -0.041722457855939865, -0.017332464456558228, 0.007057525217533112, 0.03144751489162445, 0.05583751201629639, 0.08022749423980713, 0.10461749136447906, 0.129007488489151, 0.15339747071266174, 0.17778746783733368, 0.20217746496200562, 0.22656744718551636, 0.2509574294090271, 0.27534741163253784, 0.2997373938560486, 0.3241273760795593, 0.34851738810539246, 0.3729073703289032, 0.39729735255241394, 0.42168736457824707, 0.4460773468017578, 0.47046732902526855, 0.4948573112487793, 0.51924729347229, 0.5436372756958008, 0.5680272579193115, 0.592417299747467, 0.6168072819709778, 0.6411972641944885, 0.6655872464179993, 0.6899772882461548, 0.7143672704696655, 0.7387572526931763, 0.763147234916687, 0.7875372767448425, 0.8119272589683533, 0.836317241191864, 0.8607072234153748, 0.8850972056388855, 0.9094871878623962, 0.933877170085907, 0.9582672119140625, 0.9826571941375732, 1.007047176361084, 1.0314371585845947, 1.0558271408081055, 1.0802171230316162]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 14.0, 24.0, 33.0, 49.0, 76.0, 135.0, 184.0, 145.0, 103.0, 75.0, 39.0, 16.0, 12.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.504492998123169, -1.4502655267715454, -1.3960381746292114, -1.341810703277588, -1.287583351135254, -1.2333558797836304, -1.1791284084320068, -1.1249010562896729, -1.0706737041473389, -1.0164462327957153, -0.9622188806533813, -0.9079914093017578, -0.8537640571594238, -0.7995365858078003, -0.7453091740608215, -0.6910817623138428, -0.6368542909622192, -0.5826268792152405, -0.5283994674682617, -0.47417202591896057, -0.4199446141719818, -0.36571720242500305, -0.3114897608757019, -0.25726234912872314, -0.20303493738174438, -0.14880752563476562, -0.09458009898662567, -0.04035267233848572, 0.013874739408493042, 0.0681021511554718, 0.12232959270477295, 0.1765570044517517, 0.23078429698944092, 0.2850117087364197, 0.33923912048339844, 0.3934665620326996, 0.44769397377967834, 0.5019214153289795, 0.5561488270759583, 0.610376238822937, 0.6646036505699158, 0.7188310623168945, 0.7730584740638733, 0.827285885810852, 0.8815133571624756, 0.9357407093048096, 0.9899681806564331, 1.0441956520080566, 1.0984230041503906, 1.1526504755020142, 1.2068778276443481, 1.2611052989959717, 1.3153326511383057, 1.3695601224899292, 1.4237875938415527, 1.4780149459838867, 1.5322422981262207, 1.5864697694778442, 1.6406971216201782, 1.6949245929718018, 1.7491519451141357, 1.8033794164657593, 1.8576068878173828, 1.9118342399597168, 1.9660617113113403]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 1.0, 11.0, 21.0, 24.0, 27.0, 37.0, 56.0, 91.0, 115.0, 191.0, 275.0, 419.0, 726.0, 1367.0, 2560.0, 5466.0, 14162.0, 56692.0, 3786349.0, 270691.0, 33308.0, 11213.0, 4703.0, 2427.0, 1362.0, 768.0, 410.0, 280.0, 170.0, 120.0, 58.0, 46.0, 30.0, 23.0, 20.0, 22.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2022705078125, -0.1964588165283203, -0.19064712524414062, -0.18483543395996094, -0.17902374267578125, -0.17321205139160156, -0.16740036010742188, -0.1615886688232422, -0.1557769775390625, -0.1499652862548828, -0.14415359497070312, -0.13834190368652344, -0.13253021240234375, -0.12671852111816406, -0.12090682983398438, -0.11509513854980469, -0.109283447265625, -0.10347175598144531, -0.09766006469726562, -0.09184837341308594, -0.08603668212890625, -0.08022499084472656, -0.07441329956054688, -0.06860160827636719, -0.0627899169921875, -0.05697822570800781, -0.051166534423828125, -0.04535484313964844, -0.03954315185546875, -0.03373146057128906, -0.027919769287109375, -0.022108078002929688, -0.01629638671875, -0.010484695434570312, -0.004673004150390625, 0.0011386871337890625, 0.00695037841796875, 0.012762069702148438, 0.018573760986328125, 0.024385452270507812, 0.0301971435546875, 0.03600883483886719, 0.041820526123046875, 0.04763221740722656, 0.05344390869140625, 0.05925559997558594, 0.06506729125976562, 0.07087898254394531, 0.076690673828125, 0.08250236511230469, 0.08831405639648438, 0.09412574768066406, 0.09993743896484375, 0.10574913024902344, 0.11156082153320312, 0.11737251281738281, 0.1231842041015625, 0.1289958953857422, 0.13480758666992188, 0.14061927795410156, 0.14643096923828125, 0.15224266052246094, 0.15805435180664062, 0.1638660430908203, 0.169677734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 7.0, 2.0, 6.0, 7.0, 8.0, 20.0, 15.0, 26.0, 49.0, 127.0, 237.0, 203.0, 108.0, 45.0, 33.0, 21.0, 15.0, 3.0, 12.0, 6.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023956298828125, -0.023235797882080078, -0.022515296936035156, -0.021794795989990234, -0.021074295043945312, -0.02035379409790039, -0.01963329315185547, -0.018912792205810547, -0.018192291259765625, -0.017471790313720703, -0.01675128936767578, -0.01603078842163086, -0.015310287475585938, -0.014589786529541016, -0.013869285583496094, -0.013148784637451172, -0.01242828369140625, -0.011707782745361328, -0.010987281799316406, -0.010266780853271484, -0.009546279907226562, -0.00882577896118164, -0.008105278015136719, -0.007384777069091797, -0.006664276123046875, -0.005943775177001953, -0.005223274230957031, -0.004502773284912109, -0.0037822723388671875, -0.0030617713928222656, -0.0023412704467773438, -0.0016207695007324219, -0.0009002685546875, -0.00017976760864257812, 0.0005407333374023438, 0.0012612342834472656, 0.0019817352294921875, 0.0027022361755371094, 0.0034227371215820312, 0.004143238067626953, 0.004863739013671875, 0.005584239959716797, 0.006304740905761719, 0.007025241851806641, 0.0077457427978515625, 0.008466243743896484, 0.009186744689941406, 0.009907245635986328, 0.01062774658203125, 0.011348247528076172, 0.012068748474121094, 0.012789249420166016, 0.013509750366210938, 0.01423025131225586, 0.014950752258300781, 0.015671253204345703, 0.016391754150390625, 0.017112255096435547, 0.01783275604248047, 0.01855325698852539, 0.019273757934570312, 0.019994258880615234, 0.020714759826660156, 0.021435260772705078, 0.02215576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 10.0, 3.0, 19.0, 22.0, 44.0, 44.0, 81.0, 135.0, 186.0, 357.0, 721.0, 1593.0, 4453.0, 14727.0, 71676.0, 1194717.0, 2791547.0, 88040.0, 16903.0, 5187.0, 1929.0, 819.0, 432.0, 227.0, 139.0, 77.0, 49.0, 52.0, 25.0, 20.0, 12.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.14980125427246094, -0.14481735229492188, -0.1398334503173828, -0.13484954833984375, -0.1298656463623047, -0.12488174438476562, -0.11989784240722656, -0.1149139404296875, -0.10993003845214844, -0.10494613647460938, -0.09996223449707031, -0.09497833251953125, -0.08999443054199219, -0.08501052856445312, -0.08002662658691406, -0.075042724609375, -0.07005882263183594, -0.06507492065429688, -0.06009101867675781, -0.05510711669921875, -0.05012321472167969, -0.045139312744140625, -0.04015541076660156, -0.0351715087890625, -0.030187606811523438, -0.025203704833984375, -0.020219802856445312, -0.01523590087890625, -0.010251998901367188, -0.005268096923828125, -0.0002841949462890625, 0.00469970703125, 0.009683609008789062, 0.014667510986328125, 0.019651412963867188, 0.02463531494140625, 0.029619216918945312, 0.034603118896484375, 0.03958702087402344, 0.0445709228515625, 0.04955482482910156, 0.054538726806640625, 0.05952262878417969, 0.06450653076171875, 0.06949043273925781, 0.07447433471679688, 0.07945823669433594, 0.084442138671875, 0.08942604064941406, 0.09440994262695312, 0.09939384460449219, 0.10437774658203125, 0.10936164855957031, 0.11434555053710938, 0.11932945251464844, 0.1243133544921875, 0.12929725646972656, 0.13428115844726562, 0.1392650604248047, 0.14424896240234375, 0.1492328643798828, 0.15421676635742188, 0.15920066833496094, 0.1641845703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 12.0, 16.0, 31.0, 28.0, 59.0, 83.0, 151.0, 274.0, 654.0, 1814.0, 453.0, 165.0, 103.0, 55.0, 34.0, 19.0, 20.0, 21.0, 6.0, 8.0, 10.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02874755859375, -0.02780008316040039, -0.02685260772705078, -0.025905132293701172, -0.024957656860351562, -0.024010181427001953, -0.023062705993652344, -0.022115230560302734, -0.021167755126953125, -0.020220279693603516, -0.019272804260253906, -0.018325328826904297, -0.017377853393554688, -0.016430377960205078, -0.015482902526855469, -0.01453542709350586, -0.01358795166015625, -0.01264047622680664, -0.011693000793457031, -0.010745525360107422, -0.009798049926757812, -0.008850574493408203, -0.007903099060058594, -0.006955623626708984, -0.006008148193359375, -0.005060672760009766, -0.004113197326660156, -0.003165721893310547, -0.0022182464599609375, -0.0012707710266113281, -0.00032329559326171875, 0.0006241798400878906, 0.0015716552734375, 0.0025191307067871094, 0.0034666061401367188, 0.004414081573486328, 0.0053615570068359375, 0.006309032440185547, 0.007256507873535156, 0.008203983306884766, 0.009151458740234375, 0.010098934173583984, 0.011046409606933594, 0.011993885040283203, 0.012941360473632812, 0.013888835906982422, 0.014836311340332031, 0.01578378677368164, 0.01673126220703125, 0.01767873764038086, 0.01862621307373047, 0.019573688507080078, 0.020521163940429688, 0.021468639373779297, 0.022416114807128906, 0.023363590240478516, 0.024311065673828125, 0.025258541107177734, 0.026206016540527344, 0.027153491973876953, 0.028100967407226562, 0.029048442840576172, 0.02999591827392578, 0.03094339370727539, 0.031890869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 9.0, 19.0, 70.0, 206.0, 328.0, 238.0, 72.0, 34.0, 18.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16206994652748108, -0.15288899838924408, -0.1437080353498459, -0.1345270872116089, -0.1253461241722107, -0.1161651760339737, -0.1069842278957367, -0.0978032723069191, -0.0886223167181015, -0.0794413611292839, -0.07026040554046631, -0.06107945740222931, -0.05189850181341171, -0.042717546224594116, -0.03353659436106682, -0.02435564249753952, -0.015174686908721924, -0.005993733182549477, 0.0031872205436229706, 0.012368174269795418, 0.021549127995967865, 0.03073008358478546, 0.03991103544831276, 0.04909198731184006, 0.058272942900657654, 0.06745389848947525, 0.07663485407829285, 0.08581580221652985, 0.09499675780534744, 0.10417771339416504, 0.11335866153240204, 0.12253961712121964, 0.13172060251235962, 0.14090155065059662, 0.1500825136899948, 0.1592634618282318, 0.16844442486763, 0.177625373005867, 0.186806321144104, 0.1959872841835022, 0.2051682323217392, 0.2143491804599762, 0.2235301434993744, 0.2327110916376114, 0.2418920397758484, 0.2510730028152466, 0.2602539658546448, 0.2694348990917206, 0.2786158621311188, 0.28779682517051697, 0.2969777584075928, 0.30615872144699097, 0.31533968448638916, 0.32452064752578735, 0.33370158076286316, 0.34288254380226135, 0.35206347703933716, 0.36124444007873535, 0.37042537331581116, 0.37960633635520935, 0.38878729939460754, 0.39796823263168335, 0.40714919567108154, 0.41633015871047974, 0.42551112174987793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 17.0, 15.0, 26.0, 39.0, 34.0, 64.0, 42.0, 53.0, 42.0, 66.0, 59.0, 63.0, 59.0, 66.0, 52.0, 55.0, 44.0, 19.0, 29.0, 18.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099323034286499, -0.10628964006900787, -0.10264697670936584, -0.09900431334972382, -0.09536164999008179, -0.09171898663043976, -0.08807633072137833, -0.0844336673617363, -0.08079100400209427, -0.07714834064245224, -0.07350567728281021, -0.06986301392316818, -0.06622035801410675, -0.06257769465446472, -0.05893503129482269, -0.055292367935180664, -0.051649704575538635, -0.048007041215896606, -0.04436437785625458, -0.04072171822190285, -0.03707905486226082, -0.03343639150261879, -0.02979373000562191, -0.02615106850862503, -0.022508405148983, -0.018865741789340973, -0.015223080292344093, -0.011580417864024639, -0.007937755435705185, -0.004295092076063156, -0.0006524305790662766, 0.002990230917930603, 0.006632894277572632, 0.010275556705892086, 0.01391821913421154, 0.01756088063120842, 0.02120354399085045, 0.024846207350492477, 0.028488868847489357, 0.03213153034448624, 0.035774193704128265, 0.039416857063770294, 0.04305952042341232, 0.04670218005776405, 0.05034484341740608, 0.05398750677704811, 0.05763016641139984, 0.06127282977104187, 0.0649154931306839, 0.06855815649032593, 0.07220081984996796, 0.07584348320960999, 0.07948614656925201, 0.08312880992889404, 0.08677146583795547, 0.0904141291975975, 0.09405679255723953, 0.09769945591688156, 0.10134211927652359, 0.10498478263616562, 0.10862743854522705, 0.11227010190486908, 0.11591276526451111, 0.11955542862415314, 0.12319809198379517]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 9.0, 7.0, 13.0, 7.0, 20.0, 24.0, 40.0, 44.0, 67.0, 68.0, 102.0, 141.0, 232.0, 327.0, 454.0, 664.0, 989.0, 1458.0, 2444.0, 4106.0, 6912.0, 13391.0, 28538.0, 84743.0, 525136.0, 278415.0, 53481.0, 21099.0, 10471.0, 5726.0, 3341.0, 1983.0, 1304.0, 831.0, 605.0, 441.0, 249.0, 164.0, 126.0, 115.0, 75.0, 52.0, 39.0, 27.0, 20.0, 13.0, 13.0, 10.0, 3.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08332633972167969, -0.08053207397460938, -0.07773780822753906, -0.07494354248046875, -0.07214927673339844, -0.06935501098632812, -0.06656074523925781, -0.0637664794921875, -0.06097221374511719, -0.058177947998046875, -0.05538368225097656, -0.05258941650390625, -0.04979515075683594, -0.047000885009765625, -0.04420661926269531, -0.041412353515625, -0.03861808776855469, -0.035823822021484375, -0.03302955627441406, -0.03023529052734375, -0.027441024780273438, -0.024646759033203125, -0.021852493286132812, -0.0190582275390625, -0.016263961791992188, -0.013469696044921875, -0.010675430297851562, -0.00788116455078125, -0.0050868988037109375, -0.002292633056640625, 0.0005016326904296875, 0.0032958984375, 0.0060901641845703125, 0.008884429931640625, 0.011678695678710938, 0.01447296142578125, 0.017267227172851562, 0.020061492919921875, 0.022855758666992188, 0.0256500244140625, 0.028444290161132812, 0.031238555908203125, 0.03403282165527344, 0.03682708740234375, 0.03962135314941406, 0.042415618896484375, 0.04520988464355469, 0.048004150390625, 0.05079841613769531, 0.053592681884765625, 0.05638694763183594, 0.05918121337890625, 0.06197547912597656, 0.06476974487304688, 0.06756401062011719, 0.0703582763671875, 0.07315254211425781, 0.07594680786132812, 0.07874107360839844, 0.08153533935546875, 0.08432960510253906, 0.08712387084960938, 0.08991813659667969, 0.09271240234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 12.0, 16.0, 15.0, 30.0, 37.0, 71.0, 132.0, 224.0, 169.0, 106.0, 52.0, 27.0, 21.0, 10.0, 12.0, 10.0, 7.0, 9.0, 3.0, 6.0, 1.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.02212667465209961, -0.02141094207763672, -0.020695209503173828, -0.019979476928710938, -0.019263744354248047, -0.018548011779785156, -0.017832279205322266, -0.017116546630859375, -0.016400814056396484, -0.015685081481933594, -0.014969348907470703, -0.014253616333007812, -0.013537883758544922, -0.012822151184082031, -0.01210641860961914, -0.01139068603515625, -0.01067495346069336, -0.009959220886230469, -0.009243488311767578, -0.008527755737304688, -0.007812023162841797, -0.007096290588378906, -0.006380558013916016, -0.005664825439453125, -0.004949092864990234, -0.004233360290527344, -0.003517627716064453, -0.0028018951416015625, -0.002086162567138672, -0.0013704299926757812, -0.0006546974182128906, 6.103515625e-05, 0.0007767677307128906, 0.0014925003051757812, 0.002208232879638672, 0.0029239654541015625, 0.003639698028564453, 0.004355430603027344, 0.005071163177490234, 0.005786895751953125, 0.006502628326416016, 0.007218360900878906, 0.007934093475341797, 0.008649826049804688, 0.009365558624267578, 0.010081291198730469, 0.01079702377319336, 0.01151275634765625, 0.01222848892211914, 0.012944221496582031, 0.013659954071044922, 0.014375686645507812, 0.015091419219970703, 0.015807151794433594, 0.016522884368896484, 0.017238616943359375, 0.017954349517822266, 0.018670082092285156, 0.019385814666748047, 0.020101547241210938, 0.020817279815673828, 0.02153301239013672, 0.02224874496459961, 0.0229644775390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 11.0, 9.0, 22.0, 24.0, 37.0, 46.0, 65.0, 85.0, 142.0, 254.0, 422.0, 765.0, 1273.0, 2724.0, 5852.0, 15100.0, 46549.0, 179485.0, 480183.0, 225930.0, 58014.0, 18188.0, 6823.0, 2950.0, 1506.0, 811.0, 420.0, 268.0, 165.0, 132.0, 63.0, 60.0, 34.0, 34.0, 24.0, 18.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.060211181640625, -0.05817556381225586, -0.05613994598388672, -0.05410432815551758, -0.05206871032714844, -0.0500330924987793, -0.047997474670410156, -0.045961856842041016, -0.043926239013671875, -0.041890621185302734, -0.039855003356933594, -0.03781938552856445, -0.03578376770019531, -0.03374814987182617, -0.03171253204345703, -0.02967691421508789, -0.02764129638671875, -0.02560567855834961, -0.02357006072998047, -0.021534442901611328, -0.019498825073242188, -0.017463207244873047, -0.015427589416503906, -0.013391971588134766, -0.011356353759765625, -0.009320735931396484, -0.007285118103027344, -0.005249500274658203, -0.0032138824462890625, -0.0011782646179199219, 0.0008573532104492188, 0.0028929710388183594, 0.0049285888671875, 0.006964206695556641, 0.008999824523925781, 0.011035442352294922, 0.013071060180664062, 0.015106678009033203, 0.017142295837402344, 0.019177913665771484, 0.021213531494140625, 0.023249149322509766, 0.025284767150878906, 0.027320384979248047, 0.029356002807617188, 0.03139162063598633, 0.03342723846435547, 0.03546285629272461, 0.03749847412109375, 0.03953409194946289, 0.04156970977783203, 0.04360532760620117, 0.04564094543457031, 0.04767656326293945, 0.049712181091308594, 0.051747798919677734, 0.053783416748046875, 0.055819034576416016, 0.057854652404785156, 0.0598902702331543, 0.06192588806152344, 0.06396150588989258, 0.06599712371826172, 0.06803274154663086, 0.070068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 6.0, 12.0, 9.0, 16.0, 17.0, 17.0, 24.0, 23.0, 33.0, 31.0, 31.0, 45.0, 32.0, 42.0, 45.0, 52.0, 52.0, 39.0, 48.0, 43.0, 38.0, 39.0, 39.0, 51.0, 36.0, 20.0, 29.0, 27.0, 13.0, 20.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 8.0, 4.0, 7.0, 6.0, 17.0, 29.0, 31.0, 51.0, 83.0, 157.0, 403.0, 1145.0, 4900.0, 36008.0, 757701.0, 230296.0, 13914.0, 2484.0, 666.0, 295.0, 136.0, 81.0, 43.0, 32.0, 20.0, 7.0, 4.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12114906311035156, -0.11583328247070312, -0.11051750183105469, -0.10520172119140625, -0.09988594055175781, -0.09457015991210938, -0.08925437927246094, -0.0839385986328125, -0.07862281799316406, -0.07330703735351562, -0.06799125671386719, -0.06267547607421875, -0.05735969543457031, -0.052043914794921875, -0.04672813415527344, -0.041412353515625, -0.03609657287597656, -0.030780792236328125, -0.025465011596679688, -0.02014923095703125, -0.014833450317382812, -0.009517669677734375, -0.0042018890380859375, 0.0011138916015625, 0.0064296722412109375, 0.011745452880859375, 0.017061233520507812, 0.02237701416015625, 0.027692794799804688, 0.033008575439453125, 0.03832435607910156, 0.04364013671875, 0.04895591735839844, 0.054271697998046875, 0.05958747863769531, 0.06490325927734375, 0.07021903991699219, 0.07553482055664062, 0.08085060119628906, 0.0861663818359375, 0.09148216247558594, 0.09679794311523438, 0.10211372375488281, 0.10742950439453125, 0.11274528503417969, 0.11806106567382812, 0.12337684631347656, 0.128692626953125, 0.13400840759277344, 0.13932418823242188, 0.1446399688720703, 0.14995574951171875, 0.1552715301513672, 0.16058731079101562, 0.16590309143066406, 0.1712188720703125, 0.17653465270996094, 0.18185043334960938, 0.1871662139892578, 0.19248199462890625, 0.1977977752685547, 0.20311355590820312, 0.20842933654785156, 0.2137451171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 14.0, 16.0, 13.0, 22.0, 26.0, 32.0, 45.0, 48.0, 66.0, 85.0, 99.0, 89.0, 86.0, 74.0, 65.0, 37.0, 37.0, 31.0, 27.0, 20.0, 16.0, 8.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.561113357543945e-05, -5.383603274822235e-05, -5.206093192100525e-05, -5.028583109378815e-05, -4.8510730266571045e-05, -4.673562943935394e-05, -4.496052861213684e-05, -4.318542778491974e-05, -4.141032695770264e-05, -3.9635226130485535e-05, -3.786012530326843e-05, -3.608502447605133e-05, -3.430992364883423e-05, -3.2534822821617126e-05, -3.0759721994400024e-05, -2.8984621167182922e-05, -2.720952033996582e-05, -2.5434419512748718e-05, -2.3659318685531616e-05, -2.1884217858314514e-05, -2.0109117031097412e-05, -1.833401620388031e-05, -1.6558915376663208e-05, -1.4783814549446106e-05, -1.3008713722229004e-05, -1.1233612895011902e-05, -9.4585120677948e-06, -7.683411240577698e-06, -5.908310413360596e-06, -4.133209586143494e-06, -2.3581087589263916e-06, -5.830079317092896e-07, 1.1920928955078125e-06, 2.9671937227249146e-06, 4.742294549942017e-06, 6.517395377159119e-06, 8.29249620437622e-06, 1.0067597031593323e-05, 1.1842697858810425e-05, 1.3617798686027527e-05, 1.539289951324463e-05, 1.716800034046173e-05, 1.8943101167678833e-05, 2.0718201994895935e-05, 2.2493302822113037e-05, 2.426840364933014e-05, 2.604350447654724e-05, 2.7818605303764343e-05, 2.9593706130981445e-05, 3.136880695819855e-05, 3.314390778541565e-05, 3.491900861263275e-05, 3.6694109439849854e-05, 3.8469210267066956e-05, 4.024431109428406e-05, 4.201941192150116e-05, 4.379451274871826e-05, 4.5569613575935364e-05, 4.7344714403152466e-05, 4.911981523036957e-05, 5.089491605758667e-05, 5.267001688480377e-05, 5.4445117712020874e-05, 5.6220218539237976e-05, 5.799531936645508e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 17.0, 20.0, 40.0, 58.0, 85.0, 213.0, 371.0, 868.0, 2138.0, 6459.0, 27412.0, 198763.0, 658308.0, 125903.0, 19544.0, 5062.0, 1780.0, 744.0, 354.0, 161.0, 97.0, 49.0, 34.0, 18.0, 17.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1051025390625, -0.10221481323242188, -0.09932708740234375, -0.09643936157226562, -0.0935516357421875, -0.09066390991210938, -0.08777618408203125, -0.08488845825195312, -0.082000732421875, -0.07911300659179688, -0.07622528076171875, -0.07333755493164062, -0.0704498291015625, -0.06756210327148438, -0.06467437744140625, -0.061786651611328125, -0.05889892578125, -0.056011199951171875, -0.05312347412109375, -0.050235748291015625, -0.0473480224609375, -0.044460296630859375, -0.04157257080078125, -0.038684844970703125, -0.035797119140625, -0.032909393310546875, -0.03002166748046875, -0.027133941650390625, -0.0242462158203125, -0.021358489990234375, -0.01847076416015625, -0.015583038330078125, -0.0126953125, -0.009807586669921875, -0.00691986083984375, -0.004032135009765625, -0.0011444091796875, 0.001743316650390625, 0.00463104248046875, 0.007518768310546875, 0.010406494140625, 0.013294219970703125, 0.01618194580078125, 0.019069671630859375, 0.0219573974609375, 0.024845123291015625, 0.02773284912109375, 0.030620574951171875, 0.03350830078125, 0.036396026611328125, 0.03928375244140625, 0.042171478271484375, 0.0450592041015625, 0.047946929931640625, 0.05083465576171875, 0.053722381591796875, 0.056610107421875, 0.059497833251953125, 0.06238555908203125, 0.06527328491210938, 0.0681610107421875, 0.07104873657226562, 0.07393646240234375, 0.07682418823242188, 0.0797119140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 7.0, 11.0, 16.0, 27.0, 35.0, 50.0, 76.0, 117.0, 120.0, 163.0, 124.0, 78.0, 51.0, 38.0, 26.0, 21.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09039306640625, -0.08788681030273438, -0.08538055419921875, -0.08287429809570312, -0.0803680419921875, -0.07786178588867188, -0.07535552978515625, -0.07284927368164062, -0.070343017578125, -0.06783676147460938, -0.06533050537109375, -0.06282424926757812, -0.0603179931640625, -0.057811737060546875, -0.05530548095703125, -0.052799224853515625, -0.05029296875, -0.047786712646484375, -0.04528045654296875, -0.042774200439453125, -0.0402679443359375, -0.037761688232421875, -0.03525543212890625, -0.032749176025390625, -0.030242919921875, -0.027736663818359375, -0.02523040771484375, -0.022724151611328125, -0.0202178955078125, -0.017711639404296875, -0.01520538330078125, -0.012699127197265625, -0.01019287109375, -0.007686614990234375, -0.00518035888671875, -0.002674102783203125, -0.0001678466796875, 0.002338409423828125, 0.00484466552734375, 0.007350921630859375, 0.009857177734375, 0.012363433837890625, 0.01486968994140625, 0.017375946044921875, 0.0198822021484375, 0.022388458251953125, 0.02489471435546875, 0.027400970458984375, 0.0299072265625, 0.032413482666015625, 0.03491973876953125, 0.037425994873046875, 0.0399322509765625, 0.042438507080078125, 0.04494476318359375, 0.047451019287109375, 0.049957275390625, 0.052463531494140625, 0.05496978759765625, 0.057476043701171875, 0.0599822998046875, 0.062488555908203125, 0.06499481201171875, 0.06750106811523438, 0.07000732421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 45.0, 344.0, 462.0, 107.0, 23.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4232504367828369, -0.3711588382720947, -0.3190672695636749, -0.26697567105293274, -0.21488408744335175, -0.16279250383377075, -0.11070090532302856, -0.058609336614608765, -0.006517738103866577, 0.045573849231004715, 0.09766543656587601, 0.1497570276260376, 0.2018486112356186, 0.2539401948451996, 0.3060317933559418, 0.3581233620643616, 0.41021496057510376, 0.46230655908584595, 0.5143981575965881, 0.5664896965026855, 0.6185812950134277, 0.6706728935241699, 0.7227644920349121, 0.7748560905456543, 0.8269476890563965, 0.8790392875671387, 0.9311308860778809, 0.983222484588623, 1.0353140830993652, 1.0874056816101074, 1.1394972801208496, 1.1915887594223022, 1.2436803579330444, 1.2957719564437866, 1.3478635549545288, 1.399955153465271, 1.4520467519760132, 1.5041382312774658, 1.556229829788208, 1.6083214282989502, 1.6604130268096924, 1.7125046253204346, 1.7645962238311768, 1.816687822341919, 1.8687794208526611, 1.9208710193634033, 1.9729626178741455, 2.0250542163848877, 2.07714581489563, 2.129237413406372, 2.1813290119171143, 2.2334206104278564, 2.2855122089385986, 2.337603807449341, 2.389695405960083, 2.441787004470825, 2.4938783645629883, 2.5459699630737305, 2.5980615615844727, 2.650153160095215, 2.702244758605957, 2.754336357116699, 2.8064279556274414, 2.8585195541381836, 2.910611152648926]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 15.0, 11.0, 23.0, 35.0, 44.0, 60.0, 69.0, 97.0, 75.0, 104.0, 85.0, 89.0, 59.0, 55.0, 41.0, 25.0, 22.0, 16.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7189944386482239, -0.696451723575592, -0.6739090085029602, -0.6513662338256836, -0.6288235187530518, -0.6062808036804199, -0.5837380886077881, -0.5611953735351562, -0.5386526584625244, -0.5161099433898926, -0.49356719851493835, -0.4710244834423065, -0.4484817385673523, -0.42593902349472046, -0.4033963084220886, -0.3808535933494568, -0.3583108186721802, -0.33576810359954834, -0.3132253587245941, -0.2906826436519623, -0.26813989877700806, -0.24559718370437622, -0.22305446863174438, -0.20051173865795135, -0.17796900868415833, -0.1554262787103653, -0.13288354873657227, -0.11034083366394043, -0.0877981036901474, -0.06525537371635437, -0.042712658643722534, -0.020169928669929504, 0.0023728609085083008, 0.024915587157011032, 0.04745831340551376, 0.0700010359287262, 0.09254376590251923, 0.11508649587631226, 0.1376292109489441, 0.16017194092273712, 0.18271467089653015, 0.20525740087032318, 0.2278001308441162, 0.25034284591674805, 0.2728855609893799, 0.2954283058643341, 0.31797102093696594, 0.34051376581192017, 0.363056480884552, 0.38559919595718384, 0.40814194083213806, 0.4306846559047699, 0.4532274007797241, 0.47577011585235596, 0.4983128309249878, 0.5208555459976196, 0.5433982610702515, 0.5659409761428833, 0.5884836912155151, 0.611026406288147, 0.6335691809654236, 0.6561118960380554, 0.6786546111106873, 0.7011973261833191, 0.7237401008605957]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 3.0, 13.0, 11.0, 15.0, 25.0, 22.0, 38.0, 37.0, 62.0, 73.0, 101.0, 107.0, 160.0, 235.0, 322.0, 506.0, 829.0, 1438.0, 2797.0, 5954.0, 16258.0, 70799.0, 3752701.0, 287989.0, 32747.0, 10082.0, 4424.0, 2343.0, 1405.0, 887.0, 614.0, 397.0, 293.0, 182.0, 111.0, 101.0, 69.0, 44.0, 29.0, 20.0, 16.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.25048828125, -0.2434844970703125, -0.236480712890625, -0.2294769287109375, -0.22247314453125, -0.2154693603515625, -0.208465576171875, -0.2014617919921875, -0.1944580078125, -0.1874542236328125, -0.180450439453125, -0.1734466552734375, -0.16644287109375, -0.1594390869140625, -0.152435302734375, -0.1454315185546875, -0.138427734375, -0.1314239501953125, -0.124420166015625, -0.1174163818359375, -0.11041259765625, -0.1034088134765625, -0.096405029296875, -0.0894012451171875, -0.0823974609375, -0.0753936767578125, -0.068389892578125, -0.0613861083984375, -0.05438232421875, -0.0473785400390625, -0.040374755859375, -0.0333709716796875, -0.0263671875, -0.0193634033203125, -0.012359619140625, -0.0053558349609375, 0.00164794921875, 0.0086517333984375, 0.015655517578125, 0.0226593017578125, 0.0296630859375, 0.0366668701171875, 0.043670654296875, 0.0506744384765625, 0.05767822265625, 0.0646820068359375, 0.071685791015625, 0.0786895751953125, 0.085693359375, 0.0926971435546875, 0.099700927734375, 0.1067047119140625, 0.11370849609375, 0.1207122802734375, 0.127716064453125, 0.1347198486328125, 0.1417236328125, 0.1487274169921875, 0.155731201171875, 0.1627349853515625, 0.16973876953125, 0.1767425537109375, 0.183746337890625, 0.1907501220703125, 0.19775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 11.0, 18.0, 33.0, 61.0, 101.0, 118.0, 187.0, 170.0, 93.0, 61.0, 29.0, 20.0, 13.0, 7.0, 6.0, 17.0, 4.0, 6.0, 2.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02457261085510254, -0.023846149444580078, -0.023119688034057617, -0.022393226623535156, -0.021666765213012695, -0.020940303802490234, -0.020213842391967773, -0.019487380981445312, -0.01876091957092285, -0.01803445816040039, -0.01730799674987793, -0.01658153533935547, -0.015855073928833008, -0.015128612518310547, -0.014402151107788086, -0.013675689697265625, -0.012949228286743164, -0.012222766876220703, -0.011496305465698242, -0.010769844055175781, -0.01004338264465332, -0.00931692123413086, -0.008590459823608398, -0.007863998413085938, -0.0071375370025634766, -0.006411075592041016, -0.005684614181518555, -0.004958152770996094, -0.004231691360473633, -0.003505229949951172, -0.002778768539428711, -0.00205230712890625, -0.001325845718383789, -0.0005993843078613281, 0.0001270771026611328, 0.0008535385131835938, 0.0015799999237060547, 0.0023064613342285156, 0.0030329227447509766, 0.0037593841552734375, 0.0044858455657958984, 0.005212306976318359, 0.00593876838684082, 0.006665229797363281, 0.007391691207885742, 0.008118152618408203, 0.008844614028930664, 0.009571075439453125, 0.010297536849975586, 0.011023998260498047, 0.011750459671020508, 0.012476921081542969, 0.01320338249206543, 0.01392984390258789, 0.014656305313110352, 0.015382766723632812, 0.016109228134155273, 0.016835689544677734, 0.017562150955200195, 0.018288612365722656, 0.019015073776245117, 0.019741535186767578, 0.02046799659729004, 0.0211944580078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 13.0, 16.0, 26.0, 25.0, 71.0, 117.0, 223.0, 537.0, 1433.0, 5316.0, 26481.0, 338320.0, 3699938.0, 103256.0, 13556.0, 3121.0, 989.0, 368.0, 185.0, 115.0, 56.0, 39.0, 18.0, 9.0, 16.0, 11.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.270263671875, -0.26260948181152344, -0.2549552917480469, -0.2473011016845703, -0.23964691162109375, -0.2319927215576172, -0.22433853149414062, -0.21668434143066406, -0.2090301513671875, -0.20137596130371094, -0.19372177124023438, -0.1860675811767578, -0.17841339111328125, -0.1707592010498047, -0.16310501098632812, -0.15545082092285156, -0.147796630859375, -0.14014244079589844, -0.13248825073242188, -0.12483406066894531, -0.11717987060546875, -0.10952568054199219, -0.10187149047851562, -0.09421730041503906, -0.0865631103515625, -0.07890892028808594, -0.07125473022460938, -0.06360054016113281, -0.05594635009765625, -0.04829216003417969, -0.040637969970703125, -0.03298377990722656, -0.02532958984375, -0.017675399780273438, -0.010021209716796875, -0.0023670196533203125, 0.00528717041015625, 0.012941360473632812, 0.020595550537109375, 0.028249740600585938, 0.0359039306640625, 0.04355812072753906, 0.051212310791015625, 0.05886650085449219, 0.06652069091796875, 0.07417488098144531, 0.08182907104492188, 0.08948326110839844, 0.097137451171875, 0.10479164123535156, 0.11244583129882812, 0.12010002136230469, 0.12775421142578125, 0.1354084014892578, 0.14306259155273438, 0.15071678161621094, 0.1583709716796875, 0.16602516174316406, 0.17367935180664062, 0.1813335418701172, 0.18898773193359375, 0.1966419219970703, 0.20429611206054688, 0.21195030212402344, 0.2196044921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 1.0, 9.0, 5.0, 23.0, 29.0, 23.0, 41.0, 70.0, 73.0, 136.0, 205.0, 395.0, 1474.0, 721.0, 322.0, 170.0, 113.0, 71.0, 35.0, 34.0, 28.0, 8.0, 14.0, 12.0, 13.0, 9.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222320556640625, -0.02136969566345215, -0.020507335662841797, -0.019644975662231445, -0.018782615661621094, -0.017920255661010742, -0.01705789566040039, -0.01619553565979004, -0.015333175659179688, -0.014470815658569336, -0.013608455657958984, -0.012746095657348633, -0.011883735656738281, -0.01102137565612793, -0.010159015655517578, -0.009296655654907227, -0.008434295654296875, -0.0075719356536865234, -0.006709575653076172, -0.00584721565246582, -0.004984855651855469, -0.004122495651245117, -0.0032601356506347656, -0.002397775650024414, -0.0015354156494140625, -0.0006730556488037109, 0.00018930435180664062, 0.0010516643524169922, 0.0019140243530273438, 0.0027763843536376953, 0.003638744354248047, 0.0045011043548583984, 0.00536346435546875, 0.0062258243560791016, 0.007088184356689453, 0.007950544357299805, 0.008812904357910156, 0.009675264358520508, 0.01053762435913086, 0.011399984359741211, 0.012262344360351562, 0.013124704360961914, 0.013987064361572266, 0.014849424362182617, 0.01571178436279297, 0.01657414436340332, 0.017436504364013672, 0.018298864364624023, 0.019161224365234375, 0.020023584365844727, 0.020885944366455078, 0.02174830436706543, 0.02261066436767578, 0.023473024368286133, 0.024335384368896484, 0.025197744369506836, 0.026060104370117188, 0.02692246437072754, 0.02778482437133789, 0.028647184371948242, 0.029509544372558594, 0.030371904373168945, 0.031234264373779297, 0.03209662437438965, 0.032958984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 72.0, 242.0, 314.0, 204.0, 89.0, 30.0, 10.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09958233684301376, -0.08903111517429352, -0.07847990095615387, -0.06792868673801422, -0.057377465069293976, -0.04682624712586403, -0.03627502918243408, -0.025723807513713837, -0.015172593295574188, -0.004621375352144241, 0.005929842591285706, 0.016481060534715652, 0.0270322784781456, 0.037583496421575546, 0.04813471436500549, 0.05868593603372574, 0.06923715025186539, 0.07978837192058563, 0.09033958613872528, 0.10089080035686493, 0.11144202202558517, 0.12199324369430542, 0.13254445791244507, 0.14309567213058472, 0.15364688634872437, 0.164198100566864, 0.17474931478500366, 0.1853005439043045, 0.19585175812244415, 0.2064029723405838, 0.21695420145988464, 0.2275054156780243, 0.23805665969848633, 0.24860787391662598, 0.2591590881347656, 0.2697103023529053, 0.2802615165710449, 0.29081276059150696, 0.3013639748096466, 0.31191518902778625, 0.3224664032459259, 0.33301761746406555, 0.3435688316822052, 0.35412004590034485, 0.3646712899208069, 0.37522250413894653, 0.3857737183570862, 0.39632493257522583, 0.4068761467933655, 0.4174273610115051, 0.4279785752296448, 0.4385297894477844, 0.4490810036659241, 0.4596322476863861, 0.47018346190452576, 0.4807346761226654, 0.49128589034080505, 0.5018371343612671, 0.5123883485794067, 0.5229395627975464, 0.533490777015686, 0.5440419912338257, 0.5545932054519653, 0.565144419670105, 0.5756956338882446]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 0.0, 8.0, 5.0, 6.0, 10.0, 11.0, 14.0, 26.0, 28.0, 33.0, 50.0, 43.0, 52.0, 53.0, 55.0, 64.0, 88.0, 54.0, 64.0, 53.0, 45.0, 50.0, 39.0, 32.0, 27.0, 19.0, 15.0, 10.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.12629568576812744, -0.12237454950809479, -0.11845341324806213, -0.11453226953744888, -0.11061113327741623, -0.10668999701738358, -0.10276885330677032, -0.09884771704673767, -0.09492658078670502, -0.09100544452667236, -0.08708430826663971, -0.08316316455602646, -0.0792420282959938, -0.07532089203596115, -0.0713997483253479, -0.06747861206531525, -0.06355747580528259, -0.05963633954524994, -0.05571519955992699, -0.051794059574604034, -0.04787292331457138, -0.04395178705453873, -0.040030647069215775, -0.03610950708389282, -0.03218837082386017, -0.028267232701182365, -0.024346094578504562, -0.02042495645582676, -0.016503818333148956, -0.012582680210471153, -0.00866154208779335, -0.004740403965115547, -0.0008192658424377441, 0.003101872280240059, 0.007023010402917862, 0.010944148525595665, 0.014865286648273468, 0.01878642477095127, 0.022707562893629074, 0.026628701016306877, 0.03054983913898468, 0.034470975399017334, 0.038392115384340286, 0.04231325536966324, 0.04623439162969589, 0.050155527889728546, 0.0540766678750515, 0.05799780786037445, 0.061918944120407104, 0.06584008038043976, 0.06976121664047241, 0.07368236035108566, 0.07760349661111832, 0.08152463287115097, 0.08544577658176422, 0.08936691284179688, 0.09328804910182953, 0.09720918536186218, 0.10113032162189484, 0.10505146533250809, 0.10897260159254074, 0.1128937378525734, 0.11681488156318665, 0.1207360178232193, 0.12465715408325195]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 10.0, 16.0, 17.0, 39.0, 50.0, 78.0, 85.0, 159.0, 249.0, 388.0, 704.0, 1138.0, 2099.0, 4163.0, 9525.0, 27606.0, 127409.0, 635826.0, 182371.0, 34853.0, 11550.0, 4773.0, 2284.0, 1227.0, 722.0, 423.0, 267.0, 169.0, 107.0, 74.0, 48.0, 34.0, 25.0, 14.0, 8.0, 12.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14125633239746094, -0.13663864135742188, -0.1320209503173828, -0.12740325927734375, -0.12278556823730469, -0.11816787719726562, -0.11355018615722656, -0.1089324951171875, -0.10431480407714844, -0.09969711303710938, -0.09507942199707031, -0.09046173095703125, -0.08584403991699219, -0.08122634887695312, -0.07660865783691406, -0.071990966796875, -0.06737327575683594, -0.06275558471679688, -0.05813789367675781, -0.05352020263671875, -0.04890251159667969, -0.044284820556640625, -0.03966712951660156, -0.0350494384765625, -0.030431747436523438, -0.025814056396484375, -0.021196365356445312, -0.01657867431640625, -0.011960983276367188, -0.007343292236328125, -0.0027256011962890625, 0.00189208984375, 0.0065097808837890625, 0.011127471923828125, 0.015745162963867188, 0.02036285400390625, 0.024980545043945312, 0.029598236083984375, 0.03421592712402344, 0.0388336181640625, 0.04345130920410156, 0.048069000244140625, 0.05268669128417969, 0.05730438232421875, 0.06192207336425781, 0.06653976440429688, 0.07115745544433594, 0.075775146484375, 0.08039283752441406, 0.08501052856445312, 0.08962821960449219, 0.09424591064453125, 0.09886360168457031, 0.10348129272460938, 0.10809898376464844, 0.1127166748046875, 0.11733436584472656, 0.12195205688476562, 0.1265697479248047, 0.13118743896484375, 0.1358051300048828, 0.14042282104492188, 0.14504051208496094, 0.149658203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 7.0, 17.0, 25.0, 34.0, 51.0, 102.0, 126.0, 188.0, 131.0, 103.0, 75.0, 35.0, 27.0, 10.0, 13.0, 11.0, 11.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023699283599853516, -0.02299976348876953, -0.022300243377685547, -0.021600723266601562, -0.020901203155517578, -0.020201683044433594, -0.01950216293334961, -0.018802642822265625, -0.01810312271118164, -0.017403602600097656, -0.016704082489013672, -0.016004562377929688, -0.015305042266845703, -0.014605522155761719, -0.013906002044677734, -0.01320648193359375, -0.012506961822509766, -0.011807441711425781, -0.011107921600341797, -0.010408401489257812, -0.009708881378173828, -0.009009361267089844, -0.00830984115600586, -0.007610321044921875, -0.006910800933837891, -0.006211280822753906, -0.005511760711669922, -0.0048122406005859375, -0.004112720489501953, -0.0034132003784179688, -0.0027136802673339844, -0.00201416015625, -0.0013146400451660156, -0.0006151199340820312, 8.440017700195312e-05, 0.0007839202880859375, 0.0014834403991699219, 0.0021829605102539062, 0.0028824806213378906, 0.003582000732421875, 0.004281520843505859, 0.004981040954589844, 0.005680561065673828, 0.0063800811767578125, 0.007079601287841797, 0.007779121398925781, 0.008478641510009766, 0.00917816162109375, 0.009877681732177734, 0.010577201843261719, 0.011276721954345703, 0.011976242065429688, 0.012675762176513672, 0.013375282287597656, 0.01407480239868164, 0.014774322509765625, 0.01547384262084961, 0.016173362731933594, 0.016872882843017578, 0.017572402954101562, 0.018271923065185547, 0.01897144317626953, 0.019670963287353516, 0.0203704833984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 8.0, 21.0, 29.0, 23.0, 39.0, 57.0, 98.0, 121.0, 179.0, 260.0, 405.0, 647.0, 1173.0, 2587.0, 7146.0, 24591.0, 109258.0, 455568.0, 345090.0, 73038.0, 17991.0, 5412.0, 2035.0, 1041.0, 546.0, 340.0, 243.0, 160.0, 112.0, 75.0, 71.0, 45.0, 30.0, 25.0, 21.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1275634765625, -0.12368202209472656, -0.11980056762695312, -0.11591911315917969, -0.11203765869140625, -0.10815620422363281, -0.10427474975585938, -0.10039329528808594, -0.0965118408203125, -0.09263038635253906, -0.08874893188476562, -0.08486747741699219, -0.08098602294921875, -0.07710456848144531, -0.07322311401367188, -0.06934165954589844, -0.065460205078125, -0.06157875061035156, -0.057697296142578125, -0.05381584167480469, -0.04993438720703125, -0.04605293273925781, -0.042171478271484375, -0.03829002380371094, -0.0344085693359375, -0.030527114868164062, -0.026645660400390625, -0.022764205932617188, -0.01888275146484375, -0.015001296997070312, -0.011119842529296875, -0.0072383880615234375, -0.00335693359375, 0.0005245208740234375, 0.004405975341796875, 0.008287429809570312, 0.01216888427734375, 0.016050338745117188, 0.019931793212890625, 0.023813247680664062, 0.0276947021484375, 0.03157615661621094, 0.035457611083984375, 0.03933906555175781, 0.04322052001953125, 0.04710197448730469, 0.050983428955078125, 0.05486488342285156, 0.058746337890625, 0.06262779235839844, 0.06650924682617188, 0.07039070129394531, 0.07427215576171875, 0.07815361022949219, 0.08203506469726562, 0.08591651916503906, 0.0897979736328125, 0.09367942810058594, 0.09756088256835938, 0.10144233703613281, 0.10532379150390625, 0.10920524597167969, 0.11308670043945312, 0.11696815490722656, 0.120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 7.0, 13.0, 13.0, 14.0, 24.0, 26.0, 24.0, 26.0, 34.0, 37.0, 38.0, 36.0, 40.0, 38.0, 38.0, 43.0, 45.0, 45.0, 44.0, 35.0, 34.0, 41.0, 37.0, 28.0, 26.0, 24.0, 21.0, 21.0, 21.0, 16.0, 14.0, 7.0, 11.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0611572265625, -0.05928516387939453, -0.05741310119628906, -0.055541038513183594, -0.053668975830078125, -0.051796913146972656, -0.04992485046386719, -0.04805278778076172, -0.04618072509765625, -0.04430866241455078, -0.04243659973144531, -0.040564537048339844, -0.038692474365234375, -0.036820411682128906, -0.03494834899902344, -0.03307628631591797, -0.0312042236328125, -0.02933216094970703, -0.027460098266601562, -0.025588035583496094, -0.023715972900390625, -0.021843910217285156, -0.019971847534179688, -0.01809978485107422, -0.01622772216796875, -0.014355659484863281, -0.012483596801757812, -0.010611534118652344, -0.008739471435546875, -0.006867408752441406, -0.0049953460693359375, -0.0031232833862304688, -0.001251220703125, 0.0006208419799804688, 0.0024929046630859375, 0.004364967346191406, 0.006237030029296875, 0.008109092712402344, 0.009981155395507812, 0.011853218078613281, 0.01372528076171875, 0.015597343444824219, 0.017469406127929688, 0.019341468811035156, 0.021213531494140625, 0.023085594177246094, 0.024957656860351562, 0.02682971954345703, 0.0287017822265625, 0.03057384490966797, 0.03244590759277344, 0.034317970275878906, 0.036190032958984375, 0.038062095642089844, 0.03993415832519531, 0.04180622100830078, 0.04367828369140625, 0.04555034637451172, 0.04742240905761719, 0.049294471740722656, 0.051166534423828125, 0.053038597106933594, 0.05491065979003906, 0.05678272247314453, 0.05865478515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 9.0, 11.0, 18.0, 14.0, 26.0, 41.0, 48.0, 81.0, 146.0, 201.0, 317.0, 498.0, 839.0, 1413.0, 2582.0, 4923.0, 10884.0, 28084.0, 90444.0, 325958.0, 397777.0, 122222.0, 35966.0, 13087.0, 5812.0, 2910.0, 1657.0, 958.0, 581.0, 346.0, 233.0, 161.0, 89.0, 56.0, 54.0, 31.0, 20.0, 18.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06120014190673828, -0.05916786193847656, -0.057135581970214844, -0.055103302001953125, -0.053071022033691406, -0.05103874206542969, -0.04900646209716797, -0.04697418212890625, -0.04494190216064453, -0.04290962219238281, -0.040877342224121094, -0.038845062255859375, -0.036812782287597656, -0.03478050231933594, -0.03274822235107422, -0.0307159423828125, -0.02868366241455078, -0.026651382446289062, -0.024619102478027344, -0.022586822509765625, -0.020554542541503906, -0.018522262573242188, -0.01648998260498047, -0.01445770263671875, -0.012425422668457031, -0.010393142700195312, -0.008360862731933594, -0.006328582763671875, -0.004296302795410156, -0.0022640228271484375, -0.00023174285888671875, 0.001800537109375, 0.0038328170776367188, 0.0058650970458984375, 0.007897377014160156, 0.009929656982421875, 0.011961936950683594, 0.013994216918945312, 0.01602649688720703, 0.01805877685546875, 0.02009105682373047, 0.022123336791992188, 0.024155616760253906, 0.026187896728515625, 0.028220176696777344, 0.030252456665039062, 0.03228473663330078, 0.0343170166015625, 0.03634929656982422, 0.03838157653808594, 0.040413856506347656, 0.042446136474609375, 0.044478416442871094, 0.04651069641113281, 0.04854297637939453, 0.05057525634765625, 0.05260753631591797, 0.05463981628417969, 0.056672096252441406, 0.058704376220703125, 0.060736656188964844, 0.06276893615722656, 0.06480121612548828, 0.06683349609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 12.0, 9.0, 19.0, 14.0, 12.0, 35.0, 39.0, 51.0, 62.0, 52.0, 71.0, 83.0, 86.0, 68.0, 59.0, 63.0, 51.0, 39.0, 34.0, 27.0, 22.0, 13.0, 17.0, 16.0, 7.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.03795051574707e-05, -5.8525241911411285e-05, -5.667097866535187e-05, -5.481671541929245e-05, -5.296245217323303e-05, -5.1108188927173615e-05, -4.92539256811142e-05, -4.739966243505478e-05, -4.554539918899536e-05, -4.3691135942935944e-05, -4.1836872696876526e-05, -3.998260945081711e-05, -3.812834620475769e-05, -3.627408295869827e-05, -3.4419819712638855e-05, -3.256555646657944e-05, -3.071129322052002e-05, -2.8857029974460602e-05, -2.7002766728401184e-05, -2.5148503482341766e-05, -2.329424023628235e-05, -2.143997699022293e-05, -1.9585713744163513e-05, -1.7731450498104095e-05, -1.5877187252044678e-05, -1.402292400598526e-05, -1.2168660759925842e-05, -1.0314397513866425e-05, -8.460134267807007e-06, -6.605871021747589e-06, -4.751607775688171e-06, -2.8973445296287537e-06, -1.043081283569336e-06, 8.111819624900818e-07, 2.6654452085494995e-06, 4.519708454608917e-06, 6.373971700668335e-06, 8.228234946727753e-06, 1.008249819278717e-05, 1.1936761438846588e-05, 1.3791024684906006e-05, 1.5645287930965424e-05, 1.749955117702484e-05, 1.935381442308426e-05, 2.1208077669143677e-05, 2.3062340915203094e-05, 2.4916604161262512e-05, 2.677086740732193e-05, 2.8625130653381348e-05, 3.0479393899440765e-05, 3.233365714550018e-05, 3.41879203915596e-05, 3.604218363761902e-05, 3.7896446883678436e-05, 3.9750710129737854e-05, 4.160497337579727e-05, 4.345923662185669e-05, 4.531349986791611e-05, 4.7167763113975525e-05, 4.902202636003494e-05, 5.087628960609436e-05, 5.273055285215378e-05, 5.4584816098213196e-05, 5.6439079344272614e-05, 5.829334259033203e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 13.0, 5.0, 15.0, 13.0, 25.0, 42.0, 49.0, 78.0, 152.0, 255.0, 488.0, 968.0, 2151.0, 6628.0, 27793.0, 181395.0, 643250.0, 151123.0, 24288.0, 5870.0, 2082.0, 838.0, 434.0, 246.0, 142.0, 74.0, 43.0, 38.0, 19.0, 3.0, 9.0, 10.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10397720336914062, -0.10095977783203125, -0.09794235229492188, -0.0949249267578125, -0.09190750122070312, -0.08889007568359375, -0.08587265014648438, -0.082855224609375, -0.07983779907226562, -0.07682037353515625, -0.07380294799804688, -0.0707855224609375, -0.06776809692382812, -0.06475067138671875, -0.061733245849609375, -0.0587158203125, -0.055698394775390625, -0.05268096923828125, -0.049663543701171875, -0.0466461181640625, -0.043628692626953125, -0.04061126708984375, -0.037593841552734375, -0.034576416015625, -0.031558990478515625, -0.02854156494140625, -0.025524139404296875, -0.0225067138671875, -0.019489288330078125, -0.01647186279296875, -0.013454437255859375, -0.01043701171875, -0.007419586181640625, -0.00440216064453125, -0.001384735107421875, 0.0016326904296875, 0.004650115966796875, 0.00766754150390625, 0.010684967041015625, 0.013702392578125, 0.016719818115234375, 0.01973724365234375, 0.022754669189453125, 0.0257720947265625, 0.028789520263671875, 0.03180694580078125, 0.034824371337890625, 0.037841796875, 0.040859222412109375, 0.04387664794921875, 0.046894073486328125, 0.0499114990234375, 0.052928924560546875, 0.05594635009765625, 0.058963775634765625, 0.061981201171875, 0.06499862670898438, 0.06801605224609375, 0.07103347778320312, 0.0740509033203125, 0.07706832885742188, 0.08008575439453125, 0.08310317993164062, 0.08612060546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 8.0, 12.0, 19.0, 21.0, 29.0, 33.0, 34.0, 47.0, 54.0, 66.0, 69.0, 56.0, 83.0, 57.0, 65.0, 57.0, 39.0, 43.0, 41.0, 28.0, 28.0, 26.0, 16.0, 11.0, 6.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.046600341796875, -0.045503854751586914, -0.04440736770629883, -0.04331088066101074, -0.042214393615722656, -0.04111790657043457, -0.040021419525146484, -0.0389249324798584, -0.03782844543457031, -0.03673195838928223, -0.03563547134399414, -0.034538984298706055, -0.03344249725341797, -0.03234601020812988, -0.031249523162841797, -0.03015303611755371, -0.029056549072265625, -0.02796006202697754, -0.026863574981689453, -0.025767087936401367, -0.02467060089111328, -0.023574113845825195, -0.02247762680053711, -0.021381139755249023, -0.020284652709960938, -0.01918816566467285, -0.018091678619384766, -0.01699519157409668, -0.015898704528808594, -0.014802217483520508, -0.013705730438232422, -0.012609243392944336, -0.01151275634765625, -0.010416269302368164, -0.009319782257080078, -0.008223295211791992, -0.007126808166503906, -0.00603032112121582, -0.004933834075927734, -0.0038373470306396484, -0.0027408599853515625, -0.0016443729400634766, -0.0005478858947753906, 0.0005486011505126953, 0.0016450881958007812, 0.002741575241088867, 0.003838062286376953, 0.004934549331665039, 0.006031036376953125, 0.007127523422241211, 0.008224010467529297, 0.009320497512817383, 0.010416984558105469, 0.011513471603393555, 0.01260995864868164, 0.013706445693969727, 0.014802932739257812, 0.0158994197845459, 0.016995906829833984, 0.01809239387512207, 0.019188880920410156, 0.020285367965698242, 0.021381855010986328, 0.022478342056274414, 0.0235748291015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 44.0, 156.0, 360.0, 304.0, 98.0, 21.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.775293231010437, -0.715581476688385, -0.655869722366333, -0.5961580276489258, -0.5364462733268738, -0.4767345190048218, -0.41702279448509216, -0.35731106996536255, -0.29759931564331055, -0.23788757622241974, -0.17817583680152893, -0.11846409738063812, -0.058752357959747314, 0.0009593963623046875, 0.0606711208820343, 0.12038284540176392, 0.18009459972381592, 0.23980633914470673, 0.29951807856559753, 0.35922980308532715, 0.41894155740737915, 0.47865331172943115, 0.5383650064468384, 0.5980767607688904, 0.6577885150909424, 0.7175002694129944, 0.7772120237350464, 0.8369237184524536, 0.8966354727745056, 0.9563472270965576, 1.0160589218139648, 1.075770616531372, 1.1354823112487793, 1.1951940059661865, 1.2549058198928833, 1.3146175146102905, 1.3743293285369873, 1.4340410232543945, 1.4937527179718018, 1.553464412689209, 1.6131762266159058, 1.672887921333313, 1.7325997352600098, 1.792311429977417, 1.8520231246948242, 1.911734938621521, 1.9714466333389282, 2.031158447265625, 2.0908701419830322, 2.1505818367004395, 2.2102935314178467, 2.270005464553833, 2.3297171592712402, 2.3894288539886475, 2.4491405487060547, 2.508852243423462, 2.568563938140869, 2.6282756328582764, 2.6879873275756836, 2.74769926071167, 2.807410955429077, 2.8671226501464844, 2.9268343448638916, 2.986546039581299, 3.046257972717285]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 8.0, 12.0, 24.0, 15.0, 22.0, 23.0, 23.0, 31.0, 34.0, 39.0, 36.0, 38.0, 40.0, 65.0, 59.0, 65.0, 48.0, 56.0, 62.0, 42.0, 38.0, 34.0, 33.0, 32.0, 17.0, 14.0, 17.0, 12.0, 10.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5495665073394775, -0.5306557416915894, -0.5117449760437012, -0.4928342401981354, -0.4739234745502472, -0.455012708902359, -0.4361019730567932, -0.41719120740890503, -0.39828044176101685, -0.37936967611312866, -0.3604589104652405, -0.3415481746196747, -0.3226374089717865, -0.3037266433238983, -0.2848159074783325, -0.26590514183044434, -0.24699437618255615, -0.22808361053466797, -0.20917285978794098, -0.190262109041214, -0.1713513433933258, -0.15244057774543762, -0.13352982699871063, -0.11461907625198364, -0.09570831060409546, -0.07679755240678787, -0.057886794209480286, -0.0389760360121727, -0.020065277814865112, -0.0011545196175575256, 0.01775623857975006, 0.03666698932647705, 0.055577754974365234, 0.07448851317167282, 0.09339927136898041, 0.112310029566288, 0.13122078776359558, 0.15013155341148376, 0.16904230415821075, 0.18795305490493774, 0.20686382055282593, 0.2257745862007141, 0.2446853369474411, 0.2635960876941681, 0.2825068533420563, 0.30141761898994446, 0.32032835483551025, 0.33923912048339844, 0.3581498861312866, 0.3770606517791748, 0.395971417427063, 0.4148821532726288, 0.43379291892051697, 0.45270368456840515, 0.47161442041397095, 0.49052518606185913, 0.5094359517097473, 0.5283467173576355, 0.5472574830055237, 0.5661682486534119, 0.5850789546966553, 0.6039897203445435, 0.6229004859924316, 0.6418112516403198, 0.660722017288208]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 17.0, 30.0, 41.0, 87.0, 160.0, 330.0, 902.0, 3219.0, 24182.0, 4015332.0, 139540.0, 7654.0, 1659.0, 580.0, 226.0, 117.0, 76.0, 39.0, 21.0, 18.0, 3.0, 9.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4582366943359375, -0.443328857421875, -0.4284210205078125, -0.41351318359375, -0.3986053466796875, -0.383697509765625, -0.3687896728515625, -0.3538818359375, -0.3389739990234375, -0.324066162109375, -0.3091583251953125, -0.29425048828125, -0.2793426513671875, -0.264434814453125, -0.2495269775390625, -0.234619140625, -0.2197113037109375, -0.204803466796875, -0.1898956298828125, -0.17498779296875, -0.1600799560546875, -0.145172119140625, -0.1302642822265625, -0.1153564453125, -0.1004486083984375, -0.085540771484375, -0.0706329345703125, -0.05572509765625, -0.0408172607421875, -0.025909423828125, -0.0110015869140625, 0.00390625, 0.0188140869140625, 0.033721923828125, 0.0486297607421875, 0.06353759765625, 0.0784454345703125, 0.093353271484375, 0.1082611083984375, 0.1231689453125, 0.1380767822265625, 0.152984619140625, 0.1678924560546875, 0.18280029296875, 0.1977081298828125, 0.212615966796875, 0.2275238037109375, 0.242431640625, 0.2573394775390625, 0.272247314453125, 0.2871551513671875, 0.30206298828125, 0.3169708251953125, 0.331878662109375, 0.3467864990234375, 0.3616943359375, 0.3766021728515625, 0.391510009765625, 0.4064178466796875, 0.42132568359375, 0.4362335205078125, 0.451141357421875, 0.4660491943359375, 0.48095703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 20.0, 31.0, 29.0, 45.0, 75.0, 127.0, 129.0, 122.0, 120.0, 72.0, 69.0, 38.0, 29.0, 27.0, 14.0, 7.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.024997949600219727, -0.024178028106689453, -0.02335810661315918, -0.022538185119628906, -0.021718263626098633, -0.02089834213256836, -0.020078420639038086, -0.019258499145507812, -0.01843857765197754, -0.017618656158447266, -0.016798734664916992, -0.01597881317138672, -0.015158891677856445, -0.014338970184326172, -0.013519048690795898, -0.012699127197265625, -0.011879205703735352, -0.011059284210205078, -0.010239362716674805, -0.009419441223144531, -0.008599519729614258, -0.007779598236083984, -0.006959676742553711, -0.0061397552490234375, -0.005319833755493164, -0.004499912261962891, -0.003679990768432617, -0.0028600692749023438, -0.0020401477813720703, -0.0012202262878417969, -0.00040030479431152344, 0.00041961669921875, 0.0012395381927490234, 0.002059459686279297, 0.0028793811798095703, 0.0036993026733398438, 0.004519224166870117, 0.005339145660400391, 0.006159067153930664, 0.0069789886474609375, 0.007798910140991211, 0.008618831634521484, 0.009438753128051758, 0.010258674621582031, 0.011078596115112305, 0.011898517608642578, 0.012718439102172852, 0.013538360595703125, 0.014358282089233398, 0.015178203582763672, 0.015998125076293945, 0.01681804656982422, 0.017637968063354492, 0.018457889556884766, 0.01927781105041504, 0.020097732543945312, 0.020917654037475586, 0.02173757553100586, 0.022557497024536133, 0.023377418518066406, 0.02419734001159668, 0.025017261505126953, 0.025837182998657227, 0.0266571044921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 22.0, 15.0, 32.0, 53.0, 73.0, 114.0, 213.0, 340.0, 582.0, 1201.0, 2616.0, 7066.0, 25439.0, 160390.0, 3504243.0, 429401.0, 44930.0, 10640.0, 3595.0, 1494.0, 745.0, 405.0, 230.0, 129.0, 99.0, 46.0, 47.0, 28.0, 18.0, 12.0, 5.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1662731170654297, -0.16067123413085938, -0.15506935119628906, -0.14946746826171875, -0.14386558532714844, -0.13826370239257812, -0.1326618194580078, -0.1270599365234375, -0.12145805358886719, -0.11585617065429688, -0.11025428771972656, -0.10465240478515625, -0.09905052185058594, -0.09344863891601562, -0.08784675598144531, -0.082244873046875, -0.07664299011230469, -0.07104110717773438, -0.06543922424316406, -0.05983734130859375, -0.05423545837402344, -0.048633575439453125, -0.04303169250488281, -0.0374298095703125, -0.03182792663574219, -0.026226043701171875, -0.020624160766601562, -0.01502227783203125, -0.009420394897460938, -0.003818511962890625, 0.0017833709716796875, 0.00738525390625, 0.012987136840820312, 0.018589019775390625, 0.024190902709960938, 0.02979278564453125, 0.03539466857910156, 0.040996551513671875, 0.04659843444824219, 0.0522003173828125, 0.05780220031738281, 0.06340408325195312, 0.06900596618652344, 0.07460784912109375, 0.08020973205566406, 0.08581161499023438, 0.09141349792480469, 0.097015380859375, 0.10261726379394531, 0.10821914672851562, 0.11382102966308594, 0.11942291259765625, 0.12502479553222656, 0.13062667846679688, 0.1362285614013672, 0.1418304443359375, 0.1474323272705078, 0.15303421020507812, 0.15863609313964844, 0.16423797607421875, 0.16983985900878906, 0.17544174194335938, 0.1810436248779297, 0.1866455078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 10.0, 21.0, 20.0, 29.0, 49.0, 83.0, 141.0, 269.0, 627.0, 1798.0, 429.0, 239.0, 123.0, 55.0, 41.0, 35.0, 13.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03126859664916992, -0.030035972595214844, -0.028803348541259766, -0.027570724487304688, -0.02633810043334961, -0.02510547637939453, -0.023872852325439453, -0.022640228271484375, -0.021407604217529297, -0.02017498016357422, -0.01894235610961914, -0.017709732055664062, -0.016477108001708984, -0.015244483947753906, -0.014011859893798828, -0.01277923583984375, -0.011546611785888672, -0.010313987731933594, -0.009081363677978516, -0.007848739624023438, -0.006616115570068359, -0.005383491516113281, -0.004150867462158203, -0.002918243408203125, -0.0016856193542480469, -0.00045299530029296875, 0.0007796287536621094, 0.0020122528076171875, 0.0032448768615722656, 0.004477500915527344, 0.005710124969482422, 0.0069427490234375, 0.008175373077392578, 0.009407997131347656, 0.010640621185302734, 0.011873245239257812, 0.01310586929321289, 0.014338493347167969, 0.015571117401123047, 0.016803741455078125, 0.018036365509033203, 0.01926898956298828, 0.02050161361694336, 0.021734237670898438, 0.022966861724853516, 0.024199485778808594, 0.025432109832763672, 0.02666473388671875, 0.027897357940673828, 0.029129981994628906, 0.030362606048583984, 0.03159523010253906, 0.03282785415649414, 0.03406047821044922, 0.0352931022644043, 0.036525726318359375, 0.03775835037231445, 0.03899097442626953, 0.04022359848022461, 0.04145622253417969, 0.042688846588134766, 0.043921470642089844, 0.04515409469604492, 0.04638671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 14.0, 22.0, 46.0, 70.0, 121.0, 140.0, 146.0, 134.0, 117.0, 73.0, 46.0, 18.0, 12.0, 12.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2676220238208771, -0.2612111270427704, -0.2548002600669861, -0.2483893632888794, -0.2419784665107727, -0.2355675846338272, -0.2291567027568817, -0.22274580597877502, -0.21633490920066833, -0.20992402732372284, -0.20351313054561615, -0.19710224866867065, -0.19069135189056396, -0.18428047001361847, -0.17786958813667297, -0.17145869135856628, -0.1650478094816208, -0.1586369276046753, -0.1522260308265686, -0.1458151489496231, -0.13940425217151642, -0.13299337029457092, -0.12658247351646423, -0.12017159163951874, -0.11376070231199265, -0.10734981298446655, -0.10093892365694046, -0.09452803432941437, -0.08811715245246887, -0.08170625567436218, -0.07529537379741669, -0.0688844844698906, -0.062473610043525696, -0.0560627207159996, -0.04965183138847351, -0.04324094578623772, -0.036830056458711624, -0.03041916713118553, -0.024008281528949738, -0.017597392201423645, -0.011186502873897552, -0.004775614477694035, 0.0016352739185094833, 0.008046161383390427, 0.01445705071091652, 0.02086794003844261, 0.027278825640678406, 0.0336897149682045, 0.04010060429573059, 0.04651149362325668, 0.052922382950782776, 0.05933326855301857, 0.06574416160583496, 0.07215504348278046, 0.07856593281030655, 0.08497682213783264, 0.09138771146535873, 0.09779860079288483, 0.10420949012041092, 0.11062037944793701, 0.11703126132488251, 0.1234421581029892, 0.1298530399799347, 0.13626393675804138, 0.14267481863498688]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 15.0, 7.0, 11.0, 10.0, 7.0, 15.0, 15.0, 19.0, 14.0, 27.0, 34.0, 36.0, 37.0, 41.0, 41.0, 51.0, 52.0, 44.0, 48.0, 47.0, 44.0, 40.0, 33.0, 44.0, 24.0, 37.0, 38.0, 23.0, 19.0, 13.0, 26.0, 14.0, 20.0, 13.0, 13.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12018674612045288, -0.11640593409538269, -0.1126251146197319, -0.10884430259466171, -0.10506348311901093, -0.10128267109394073, -0.09750185906887054, -0.09372104704380035, -0.08994022756814957, -0.08615941554307938, -0.08237859606742859, -0.0785977840423584, -0.07481697201728821, -0.07103615254163742, -0.06725534051656723, -0.06347452104091644, -0.05969370901584625, -0.055912893265485764, -0.052132077515125275, -0.048351265490055084, -0.044570449739694595, -0.040789633989334106, -0.037008821964263916, -0.03322800621390343, -0.029447190463542938, -0.02566637471318245, -0.02188556082546711, -0.01810474693775177, -0.014323931187391281, -0.010543115437030792, -0.006762301549315453, -0.002981487661600113, 0.000799328088760376, 0.00458014290779829, 0.008360957726836205, 0.012141772545874119, 0.015922587364912033, 0.019703403115272522, 0.02348421700298786, 0.0272650308907032, 0.03104584664106369, 0.03482666239142418, 0.03860747814178467, 0.04238829016685486, 0.04616910591721535, 0.049949921667575836, 0.05373073369264603, 0.057511549443006516, 0.061292365193367004, 0.0650731772184372, 0.06885399669408798, 0.07263480871915817, 0.07641562819480896, 0.08019644021987915, 0.08397725224494934, 0.08775806427001953, 0.09153888374567032, 0.09531969577074051, 0.0991005152463913, 0.10288132727146149, 0.10666213929653168, 0.11044295877218246, 0.11422377079725266, 0.11800459027290344, 0.12178540229797363]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 11.0, 14.0, 24.0, 33.0, 38.0, 79.0, 95.0, 199.0, 320.0, 490.0, 926.0, 1610.0, 3394.0, 7932.0, 25434.0, 104829.0, 445859.0, 348406.0, 76432.0, 19620.0, 6541.0, 2841.0, 1419.0, 790.0, 441.0, 256.0, 179.0, 107.0, 81.0, 31.0, 34.0, 15.0, 13.0, 11.0, 9.0, 2.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1279296875, -0.12378883361816406, -0.11964797973632812, -0.11550712585449219, -0.11136627197265625, -0.10722541809082031, -0.10308456420898438, -0.09894371032714844, -0.0948028564453125, -0.09066200256347656, -0.08652114868164062, -0.08238029479980469, -0.07823944091796875, -0.07409858703613281, -0.06995773315429688, -0.06581687927246094, -0.061676025390625, -0.05753517150878906, -0.053394317626953125, -0.04925346374511719, -0.04511260986328125, -0.04097175598144531, -0.036830902099609375, -0.03269004821777344, -0.0285491943359375, -0.024408340454101562, -0.020267486572265625, -0.016126632690429688, -0.01198577880859375, -0.007844924926757812, -0.003704071044921875, 0.0004367828369140625, 0.00457763671875, 0.008718490600585938, 0.012859344482421875, 0.017000198364257812, 0.02114105224609375, 0.025281906127929688, 0.029422760009765625, 0.03356361389160156, 0.0377044677734375, 0.04184532165527344, 0.045986175537109375, 0.05012702941894531, 0.05426788330078125, 0.05840873718261719, 0.06254959106445312, 0.06669044494628906, 0.070831298828125, 0.07497215270996094, 0.07911300659179688, 0.08325386047363281, 0.08739471435546875, 0.09153556823730469, 0.09567642211914062, 0.09981727600097656, 0.1039581298828125, 0.10809898376464844, 0.11223983764648438, 0.11638069152832031, 0.12052154541015625, 0.12466239929199219, 0.12880325317382812, 0.13294410705566406, 0.1370849609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 14.0, 17.0, 23.0, 46.0, 62.0, 102.0, 112.0, 113.0, 102.0, 101.0, 80.0, 62.0, 44.0, 33.0, 25.0, 21.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260467529296875, -0.02523946762084961, -0.02443218231201172, -0.023624897003173828, -0.022817611694335938, -0.022010326385498047, -0.021203041076660156, -0.020395755767822266, -0.019588470458984375, -0.018781185150146484, -0.017973899841308594, -0.017166614532470703, -0.016359329223632812, -0.015552043914794922, -0.014744758605957031, -0.01393747329711914, -0.01313018798828125, -0.01232290267944336, -0.011515617370605469, -0.010708332061767578, -0.009901046752929688, -0.009093761444091797, -0.008286476135253906, -0.007479190826416016, -0.006671905517578125, -0.005864620208740234, -0.005057334899902344, -0.004250049591064453, -0.0034427642822265625, -0.002635478973388672, -0.0018281936645507812, -0.0010209083557128906, -0.000213623046875, 0.0005936622619628906, 0.0014009475708007812, 0.002208232879638672, 0.0030155181884765625, 0.003822803497314453, 0.004630088806152344, 0.005437374114990234, 0.006244659423828125, 0.007051944732666016, 0.007859230041503906, 0.008666515350341797, 0.009473800659179688, 0.010281085968017578, 0.011088371276855469, 0.01189565658569336, 0.01270294189453125, 0.01351022720336914, 0.014317512512207031, 0.015124797821044922, 0.015932083129882812, 0.016739368438720703, 0.017546653747558594, 0.018353939056396484, 0.019161224365234375, 0.019968509674072266, 0.020775794982910156, 0.021583080291748047, 0.022390365600585938, 0.023197650909423828, 0.02400493621826172, 0.02481222152709961, 0.0256195068359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 16.0, 23.0, 23.0, 21.0, 51.0, 60.0, 98.0, 124.0, 123.0, 177.0, 229.0, 367.0, 479.0, 816.0, 1438.0, 2919.0, 7003.0, 20810.0, 67895.0, 218052.0, 432687.0, 200212.0, 62715.0, 19135.0, 6450.0, 2742.0, 1302.0, 780.0, 450.0, 388.0, 268.0, 170.0, 138.0, 89.0, 73.0, 53.0, 37.0, 36.0, 28.0, 12.0, 14.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.09792137145996094, -0.09470748901367188, -0.09149360656738281, -0.08827972412109375, -0.08506584167480469, -0.08185195922851562, -0.07863807678222656, -0.0754241943359375, -0.07221031188964844, -0.06899642944335938, -0.06578254699707031, -0.06256866455078125, -0.05935478210449219, -0.056140899658203125, -0.05292701721191406, -0.049713134765625, -0.04649925231933594, -0.043285369873046875, -0.04007148742675781, -0.03685760498046875, -0.03364372253417969, -0.030429840087890625, -0.027215957641601562, -0.0240020751953125, -0.020788192749023438, -0.017574310302734375, -0.014360427856445312, -0.01114654541015625, -0.007932662963867188, -0.004718780517578125, -0.0015048980712890625, 0.001708984375, 0.0049228668212890625, 0.008136749267578125, 0.011350631713867188, 0.01456451416015625, 0.017778396606445312, 0.020992279052734375, 0.024206161499023438, 0.0274200439453125, 0.030633926391601562, 0.033847808837890625, 0.03706169128417969, 0.04027557373046875, 0.04348945617675781, 0.046703338623046875, 0.04991722106933594, 0.053131103515625, 0.05634498596191406, 0.059558868408203125, 0.06277275085449219, 0.06598663330078125, 0.06920051574707031, 0.07241439819335938, 0.07562828063964844, 0.0788421630859375, 0.08205604553222656, 0.08526992797851562, 0.08848381042480469, 0.09169769287109375, 0.09491157531738281, 0.09812545776367188, 0.10133934020996094, 0.10455322265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 18.0, 22.0, 25.0, 16.0, 30.0, 25.0, 28.0, 43.0, 37.0, 51.0, 40.0, 41.0, 53.0, 54.0, 50.0, 43.0, 52.0, 48.0, 32.0, 31.0, 43.0, 28.0, 28.0, 20.0, 18.0, 16.0, 16.0, 8.0, 12.0, 5.0, 5.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07817745208740234, -0.07548332214355469, -0.07278919219970703, -0.07009506225585938, -0.06740093231201172, -0.06470680236816406, -0.062012672424316406, -0.05931854248046875, -0.056624412536621094, -0.05393028259277344, -0.05123615264892578, -0.048542022705078125, -0.04584789276123047, -0.04315376281738281, -0.040459632873535156, -0.0377655029296875, -0.035071372985839844, -0.03237724304199219, -0.02968311309814453, -0.026988983154296875, -0.02429485321044922, -0.021600723266601562, -0.018906593322753906, -0.01621246337890625, -0.013518333435058594, -0.010824203491210938, -0.008130073547363281, -0.005435943603515625, -0.0027418136596679688, -4.76837158203125e-05, 0.0026464462280273438, 0.005340576171875, 0.008034706115722656, 0.010728836059570312, 0.013422966003417969, 0.016117095947265625, 0.01881122589111328, 0.021505355834960938, 0.024199485778808594, 0.02689361572265625, 0.029587745666503906, 0.03228187561035156, 0.03497600555419922, 0.037670135498046875, 0.04036426544189453, 0.04305839538574219, 0.045752525329589844, 0.0484466552734375, 0.051140785217285156, 0.05383491516113281, 0.05652904510498047, 0.059223175048828125, 0.06191730499267578, 0.06461143493652344, 0.0673055648803711, 0.06999969482421875, 0.0726938247680664, 0.07538795471191406, 0.07808208465576172, 0.08077621459960938, 0.08347034454345703, 0.08616447448730469, 0.08885860443115234, 0.091552734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 15.0, 12.0, 12.0, 23.0, 64.0, 43.0, 80.0, 120.0, 207.0, 312.0, 538.0, 877.0, 1467.0, 2516.0, 4450.0, 8202.0, 16136.0, 33305.0, 76734.0, 211720.0, 385615.0, 178420.0, 66548.0, 29460.0, 14317.0, 7544.0, 4135.0, 2280.0, 1275.0, 788.0, 454.0, 314.0, 179.0, 126.0, 76.0, 53.0, 53.0, 16.0, 10.0, 15.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049163818359375, -0.04743385314941406, -0.045703887939453125, -0.04397392272949219, -0.04224395751953125, -0.04051399230957031, -0.038784027099609375, -0.03705406188964844, -0.0353240966796875, -0.03359413146972656, -0.031864166259765625, -0.030134201049804688, -0.02840423583984375, -0.026674270629882812, -0.024944305419921875, -0.023214340209960938, -0.021484375, -0.019754409790039062, -0.018024444580078125, -0.016294479370117188, -0.01456451416015625, -0.012834548950195312, -0.011104583740234375, -0.009374618530273438, -0.0076446533203125, -0.0059146881103515625, -0.004184722900390625, -0.0024547576904296875, -0.00072479248046875, 0.0010051727294921875, 0.002735137939453125, 0.0044651031494140625, 0.006195068359375, 0.007925033569335938, 0.009654998779296875, 0.011384963989257812, 0.01311492919921875, 0.014844894409179688, 0.016574859619140625, 0.018304824829101562, 0.0200347900390625, 0.021764755249023438, 0.023494720458984375, 0.025224685668945312, 0.02695465087890625, 0.028684616088867188, 0.030414581298828125, 0.03214454650878906, 0.03387451171875, 0.03560447692871094, 0.037334442138671875, 0.03906440734863281, 0.04079437255859375, 0.04252433776855469, 0.044254302978515625, 0.04598426818847656, 0.0477142333984375, 0.04944419860839844, 0.051174163818359375, 0.05290412902832031, 0.05463409423828125, 0.05636405944824219, 0.058094024658203125, 0.05982398986816406, 0.061553955078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 15.0, 17.0, 26.0, 33.0, 37.0, 45.0, 44.0, 73.0, 92.0, 111.0, 72.0, 77.0, 76.0, 61.0, 33.0, 46.0, 29.0, 23.0, 12.0, 13.0, 15.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -3.96091490983963e-05, -3.803148865699768e-05, -3.645382821559906e-05, -3.487616777420044e-05, -3.329850733280182e-05, -3.17208468914032e-05, -3.0143186450004578e-05, -2.8565526008605957e-05, -2.6987865567207336e-05, -2.5410205125808716e-05, -2.3832544684410095e-05, -2.2254884243011475e-05, -2.0677223801612854e-05, -1.9099563360214233e-05, -1.7521902918815613e-05, -1.5944242477416992e-05, -1.4366582036018372e-05, -1.2788921594619751e-05, -1.121126115322113e-05, -9.63360071182251e-06, -8.05594027042389e-06, -6.4782798290252686e-06, -4.900619387626648e-06, -3.3229589462280273e-06, -1.7452985048294067e-06, -1.6763806343078613e-07, 1.4100223779678345e-06, 2.987682819366455e-06, 4.565343260765076e-06, 6.143003702163696e-06, 7.720664143562317e-06, 9.298324584960938e-06, 1.0875985026359558e-05, 1.2453645467758179e-05, 1.40313059091568e-05, 1.560896635055542e-05, 1.718662679195404e-05, 1.876428723335266e-05, 2.0341947674751282e-05, 2.1919608116149902e-05, 2.3497268557548523e-05, 2.5074928998947144e-05, 2.6652589440345764e-05, 2.8230249881744385e-05, 2.9807910323143005e-05, 3.1385570764541626e-05, 3.2963231205940247e-05, 3.454089164733887e-05, 3.611855208873749e-05, 3.769621253013611e-05, 3.927387297153473e-05, 4.085153341293335e-05, 4.242919385433197e-05, 4.400685429573059e-05, 4.558451473712921e-05, 4.716217517852783e-05, 4.873983561992645e-05, 5.031749606132507e-05, 5.1895156502723694e-05, 5.3472816944122314e-05, 5.5050477385520935e-05, 5.6628137826919556e-05, 5.8205798268318176e-05, 5.97834587097168e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 7.0, 11.0, 9.0, 15.0, 25.0, 30.0, 38.0, 70.0, 114.0, 148.0, 245.0, 428.0, 840.0, 1932.0, 5304.0, 20321.0, 105762.0, 669688.0, 198657.0, 32078.0, 7812.0, 2570.0, 1090.0, 523.0, 280.0, 162.0, 120.0, 69.0, 63.0, 32.0, 30.0, 20.0, 12.0, 10.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.137939453125, -0.13417625427246094, -0.13041305541992188, -0.1266498565673828, -0.12288665771484375, -0.11912345886230469, -0.11536026000976562, -0.11159706115722656, -0.1078338623046875, -0.10407066345214844, -0.10030746459960938, -0.09654426574707031, -0.09278106689453125, -0.08901786804199219, -0.08525466918945312, -0.08149147033691406, -0.077728271484375, -0.07396507263183594, -0.07020187377929688, -0.06643867492675781, -0.06267547607421875, -0.05891227722167969, -0.055149078369140625, -0.05138587951660156, -0.0476226806640625, -0.04385948181152344, -0.040096282958984375, -0.03633308410644531, -0.03256988525390625, -0.028806686401367188, -0.025043487548828125, -0.021280288696289062, -0.01751708984375, -0.013753890991210938, -0.009990692138671875, -0.0062274932861328125, -0.00246429443359375, 0.0012989044189453125, 0.005062103271484375, 0.008825302124023438, 0.0125885009765625, 0.016351699829101562, 0.020114898681640625, 0.023878097534179688, 0.02764129638671875, 0.03140449523925781, 0.035167694091796875, 0.03893089294433594, 0.042694091796875, 0.04645729064941406, 0.050220489501953125, 0.05398368835449219, 0.05774688720703125, 0.06151008605957031, 0.06527328491210938, 0.06903648376464844, 0.0727996826171875, 0.07656288146972656, 0.08032608032226562, 0.08408927917480469, 0.08785247802734375, 0.09161567687988281, 0.09537887573242188, 0.09914207458496094, 0.1029052734375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 2.0, 11.0, 7.0, 8.0, 14.0, 12.0, 11.0, 23.0, 24.0, 23.0, 29.0, 42.0, 54.0, 66.0, 73.0, 78.0, 78.0, 84.0, 57.0, 63.0, 54.0, 24.0, 31.0, 20.0, 18.0, 23.0, 10.0, 13.0, 10.0, 5.0, 3.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.051788330078125, -0.050187110900878906, -0.04858589172363281, -0.04698467254638672, -0.045383453369140625, -0.04378223419189453, -0.04218101501464844, -0.040579795837402344, -0.03897857666015625, -0.037377357482910156, -0.03577613830566406, -0.03417491912841797, -0.032573699951171875, -0.03097248077392578, -0.029371261596679688, -0.027770042419433594, -0.0261688232421875, -0.024567604064941406, -0.022966384887695312, -0.02136516571044922, -0.019763946533203125, -0.01816272735595703, -0.016561508178710938, -0.014960289001464844, -0.01335906982421875, -0.011757850646972656, -0.010156631469726562, -0.008555412292480469, -0.006954193115234375, -0.005352973937988281, -0.0037517547607421875, -0.0021505355834960938, -0.00054931640625, 0.0010519027709960938, 0.0026531219482421875, 0.004254341125488281, 0.005855560302734375, 0.007456779479980469, 0.009057998657226562, 0.010659217834472656, 0.01226043701171875, 0.013861656188964844, 0.015462875366210938, 0.01706409454345703, 0.018665313720703125, 0.02026653289794922, 0.021867752075195312, 0.023468971252441406, 0.0250701904296875, 0.026671409606933594, 0.028272628784179688, 0.02987384796142578, 0.031475067138671875, 0.03307628631591797, 0.03467750549316406, 0.036278724670410156, 0.03787994384765625, 0.039481163024902344, 0.04108238220214844, 0.04268360137939453, 0.044284820556640625, 0.04588603973388672, 0.04748725891113281, 0.049088478088378906, 0.050689697265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 22.0, 52.0, 123.0, 203.0, 250.0, 168.0, 98.0, 40.0, 18.0, 9.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1698739528656006, -1.1302838325500488, -1.090693712234497, -1.0511035919189453, -1.0115134716033936, -0.971923291683197, -0.9323331117630005, -0.8927429914474487, -0.853152871131897, -0.8135627508163452, -0.7739726305007935, -0.7343824505805969, -0.6947923302650452, -0.6552022099494934, -0.6156120300292969, -0.5760219097137451, -0.5364317893981934, -0.4968416690826416, -0.45725151896476746, -0.4176613688468933, -0.37807124853134155, -0.3384811282157898, -0.29889097809791565, -0.2593008279800415, -0.21971070766448975, -0.1801205724477768, -0.14053043723106384, -0.10094030201435089, -0.06135016679763794, -0.021760031580924988, 0.017830103635787964, 0.05742025375366211, 0.09701037406921387, 0.13660050928592682, 0.17619064450263977, 0.21578077971935272, 0.2553709149360657, 0.29496103525161743, 0.3345511853694916, 0.3741413354873657, 0.4137314558029175, 0.45332157611846924, 0.4929117262363434, 0.5325018763542175, 0.5720919966697693, 0.611682116985321, 0.6512722969055176, 0.6908624172210693, 0.7304525375366211, 0.7700426578521729, 0.8096327781677246, 0.8492229580879211, 0.8888130784034729, 0.9284031987190247, 0.9679933786392212, 1.007583498954773, 1.0471736192703247, 1.0867637395858765, 1.1263538599014282, 1.16594398021698, 1.2055342197418213, 1.245124340057373, 1.2847144603729248, 1.3243045806884766, 1.3638947010040283]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 12.0, 21.0, 14.0, 15.0, 13.0, 15.0, 12.0, 21.0, 23.0, 28.0, 22.0, 36.0, 28.0, 30.0, 43.0, 44.0, 40.0, 33.0, 33.0, 40.0, 41.0, 46.0, 34.0, 50.0, 26.0, 27.0, 31.0, 33.0, 23.0, 19.0, 21.0, 16.0, 14.0, 10.0, 10.0, 10.0, 9.0, 8.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.49877625703811646, -0.48435696959495544, -0.46993765234947205, -0.45551836490631104, -0.44109907746315, -0.426679790019989, -0.4122604727745056, -0.3978411853313446, -0.3834218978881836, -0.3690026104450226, -0.3545832931995392, -0.3401640057563782, -0.32574471831321716, -0.31132543087005615, -0.29690611362457275, -0.28248682618141174, -0.26806750893592834, -0.25364822149276733, -0.23922891914844513, -0.22480961680412292, -0.21039032936096191, -0.1959710270166397, -0.1815517246723175, -0.1671324372291565, -0.1527131348848343, -0.13829383254051208, -0.12387454509735107, -0.10945524275302887, -0.09503594785928726, -0.08061665296554565, -0.06619735062122345, -0.05177805572748184, -0.037358760833740234, -0.022939464077353477, -0.00852016732096672, 0.0058991312980651855, 0.020318426191806793, 0.0347377210855484, 0.049157023429870605, 0.06357631832361221, 0.07799561321735382, 0.09241490811109543, 0.10683420300483704, 0.12125350534915924, 0.13567280769348145, 0.15009209513664246, 0.16451139748096466, 0.17893069982528687, 0.19334998726844788, 0.20776928961277008, 0.2221885770559311, 0.2366078794002533, 0.2510271668434143, 0.2654464840888977, 0.2798657715320587, 0.2942850589752197, 0.3087043762207031, 0.32312366366386414, 0.33754298090934753, 0.35196226835250854, 0.36638155579566956, 0.38080084323883057, 0.39522016048431396, 0.409639447927475, 0.424058735370636]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 13.0, 11.0, 21.0, 38.0, 43.0, 101.0, 127.0, 197.0, 431.0, 750.0, 1434.0, 3176.0, 8837.0, 35862.0, 374283.0, 3648371.0, 93867.0, 17015.0, 5278.0, 2095.0, 979.0, 532.0, 299.0, 157.0, 109.0, 72.0, 56.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16650390625, -0.1608104705810547, -0.15511703491210938, -0.14942359924316406, -0.14373016357421875, -0.13803672790527344, -0.13234329223632812, -0.1266498565673828, -0.1209564208984375, -0.11526298522949219, -0.10956954956054688, -0.10387611389160156, -0.09818267822265625, -0.09248924255371094, -0.08679580688476562, -0.08110237121582031, -0.075408935546875, -0.06971549987792969, -0.06402206420898438, -0.05832862854003906, -0.05263519287109375, -0.04694175720214844, -0.041248321533203125, -0.03555488586425781, -0.0298614501953125, -0.024168014526367188, -0.018474578857421875, -0.012781143188476562, -0.00708770751953125, -0.0013942718505859375, 0.004299163818359375, 0.009992599487304688, 0.01568603515625, 0.021379470825195312, 0.027072906494140625, 0.03276634216308594, 0.03845977783203125, 0.04415321350097656, 0.049846649169921875, 0.05554008483886719, 0.0612335205078125, 0.06692695617675781, 0.07262039184570312, 0.07831382751464844, 0.08400726318359375, 0.08970069885253906, 0.09539413452148438, 0.10108757019042969, 0.106781005859375, 0.11247444152832031, 0.11816787719726562, 0.12386131286621094, 0.12955474853515625, 0.13524818420410156, 0.14094161987304688, 0.1466350555419922, 0.1523284912109375, 0.1580219268798828, 0.16371536254882812, 0.16940879821777344, 0.17510223388671875, 0.18079566955566406, 0.18648910522460938, 0.1921825408935547, 0.1978759765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 19.0, 24.0, 31.0, 39.0, 54.0, 74.0, 75.0, 83.0, 98.0, 96.0, 86.0, 62.0, 55.0, 42.0, 36.0, 31.0, 31.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028154850006103516, -0.02731800079345703, -0.026481151580810547, -0.025644302368164062, -0.024807453155517578, -0.023970603942871094, -0.02313375473022461, -0.022296905517578125, -0.02146005630493164, -0.020623207092285156, -0.019786357879638672, -0.018949508666992188, -0.018112659454345703, -0.01727581024169922, -0.016438961029052734, -0.01560211181640625, -0.014765262603759766, -0.013928413391113281, -0.013091564178466797, -0.012254714965820312, -0.011417865753173828, -0.010581016540527344, -0.00974416732788086, -0.008907318115234375, -0.00807046890258789, -0.007233619689941406, -0.006396770477294922, -0.0055599212646484375, -0.004723072052001953, -0.0038862228393554688, -0.0030493736267089844, -0.0022125244140625, -0.0013756752014160156, -0.0005388259887695312, 0.0002980232238769531, 0.0011348724365234375, 0.001971721649169922, 0.0028085708618164062, 0.0036454200744628906, 0.004482269287109375, 0.005319118499755859, 0.006155967712402344, 0.006992816925048828, 0.007829666137695312, 0.008666515350341797, 0.009503364562988281, 0.010340213775634766, 0.01117706298828125, 0.012013912200927734, 0.012850761413574219, 0.013687610626220703, 0.014524459838867188, 0.015361309051513672, 0.016198158264160156, 0.01703500747680664, 0.017871856689453125, 0.01870870590209961, 0.019545555114746094, 0.020382404327392578, 0.021219253540039062, 0.022056102752685547, 0.02289295196533203, 0.023729801177978516, 0.024566650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 0.0, 4.0, 7.0, 7.0, 2.0, 9.0, 15.0, 16.0, 19.0, 32.0, 59.0, 50.0, 111.0, 177.0, 302.0, 518.0, 834.0, 1729.0, 3797.0, 12447.0, 72911.0, 2629886.0, 1389578.0, 63571.0, 11353.0, 3541.0, 1476.0, 753.0, 380.0, 249.0, 163.0, 103.0, 61.0, 41.0, 26.0, 13.0, 10.0, 13.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17353057861328125, -0.1677398681640625, -0.16194915771484375, -0.156158447265625, -0.15036773681640625, -0.1445770263671875, -0.13878631591796875, -0.13299560546875, -0.12720489501953125, -0.1214141845703125, -0.11562347412109375, -0.109832763671875, -0.10404205322265625, -0.0982513427734375, -0.09246063232421875, -0.086669921875, -0.08087921142578125, -0.0750885009765625, -0.06929779052734375, -0.063507080078125, -0.05771636962890625, -0.0519256591796875, -0.04613494873046875, -0.04034423828125, -0.03455352783203125, -0.0287628173828125, -0.02297210693359375, -0.017181396484375, -0.01139068603515625, -0.0055999755859375, 0.00019073486328125, 0.0059814453125, 0.01177215576171875, 0.0175628662109375, 0.02335357666015625, 0.029144287109375, 0.03493499755859375, 0.0407257080078125, 0.04651641845703125, 0.05230712890625, 0.05809783935546875, 0.0638885498046875, 0.06967926025390625, 0.075469970703125, 0.08126068115234375, 0.0870513916015625, 0.09284210205078125, 0.0986328125, 0.10442352294921875, 0.1102142333984375, 0.11600494384765625, 0.121795654296875, 0.12758636474609375, 0.1333770751953125, 0.13916778564453125, 0.14495849609375, 0.15074920654296875, 0.1565399169921875, 0.16233062744140625, 0.168121337890625, 0.17391204833984375, 0.1797027587890625, 0.18549346923828125, 0.1912841796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 43.0, 74.0, 173.0, 453.0, 2218.0, 625.0, 207.0, 93.0, 57.0, 21.0, 28.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.078125, -0.07615423202514648, -0.07418346405029297, -0.07221269607543945, -0.07024192810058594, -0.06827116012573242, -0.0663003921508789, -0.06432962417602539, -0.062358856201171875, -0.06038808822631836, -0.058417320251464844, -0.05644655227661133, -0.05447578430175781, -0.0525050163269043, -0.05053424835205078, -0.048563480377197266, -0.04659271240234375, -0.044621944427490234, -0.04265117645263672, -0.0406804084777832, -0.03870964050292969, -0.03673887252807617, -0.034768104553222656, -0.03279733657836914, -0.030826568603515625, -0.02885580062866211, -0.026885032653808594, -0.024914264678955078, -0.022943496704101562, -0.020972728729248047, -0.01900196075439453, -0.017031192779541016, -0.0150604248046875, -0.013089656829833984, -0.011118888854980469, -0.009148120880126953, -0.0071773529052734375, -0.005206584930419922, -0.0032358169555664062, -0.0012650489807128906, 0.000705718994140625, 0.0026764869689941406, 0.004647254943847656, 0.006618022918701172, 0.008588790893554688, 0.010559558868408203, 0.012530326843261719, 0.014501094818115234, 0.01647186279296875, 0.018442630767822266, 0.02041339874267578, 0.022384166717529297, 0.024354934692382812, 0.026325702667236328, 0.028296470642089844, 0.03026723861694336, 0.032238006591796875, 0.03420877456665039, 0.036179542541503906, 0.03815031051635742, 0.04012107849121094, 0.04209184646606445, 0.04406261444091797, 0.046033382415771484, 0.048004150390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 4.0, 12.0, 6.0, 16.0, 26.0, 43.0, 59.0, 93.0, 128.0, 134.0, 123.0, 94.0, 88.0, 73.0, 39.0, 29.0, 10.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1828184276819229, -0.17528069019317627, -0.16774295270442963, -0.16020521521568298, -0.15266746282577515, -0.1451297402381897, -0.13759198784828186, -0.13005425035953522, -0.12251651287078857, -0.11497877538204193, -0.10744103789329529, -0.09990329295396805, -0.0923655554652214, -0.08482781797647476, -0.07729007303714752, -0.06975233554840088, -0.062214598059654236, -0.05467686057090759, -0.04713911935687065, -0.03960137814283371, -0.03206364065408707, -0.024525903165340424, -0.016988161951303482, -0.00945042073726654, -0.0019126832485198975, 0.005625056102871895, 0.013162795454263687, 0.02070053480565548, 0.02823827415704727, 0.035776011645793915, 0.043313752859830856, 0.0508514940738678, 0.058389246463775635, 0.06592698395252228, 0.07346472144126892, 0.08100246638059616, 0.0885402038693428, 0.09607794135808945, 0.10361568629741669, 0.11115342378616333, 0.11869116127490997, 0.12622889876365662, 0.13376663625240326, 0.1413043737411499, 0.14884212613105774, 0.1563798487186432, 0.16391760110855103, 0.17145533859729767, 0.1789930760860443, 0.18653081357479095, 0.1940685510635376, 0.20160628855228424, 0.20914402604103088, 0.21668177843093872, 0.22421951591968536, 0.231757253408432, 0.23929499089717865, 0.2468327283859253, 0.25437048077583313, 0.2619082033634186, 0.2694459557533264, 0.27698367834091187, 0.2845214307308197, 0.29205918312072754, 0.299596905708313]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 2.0, 5.0, 11.0, 15.0, 17.0, 10.0, 20.0, 24.0, 23.0, 21.0, 23.0, 31.0, 30.0, 33.0, 36.0, 39.0, 29.0, 33.0, 43.0, 38.0, 34.0, 44.0, 34.0, 32.0, 30.0, 27.0, 25.0, 26.0, 19.0, 28.0, 21.0, 29.0, 24.0, 21.0, 26.0, 14.0, 9.0, 13.0, 9.0, 5.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1259007453918457, -0.12195496261119843, -0.11800917983055115, -0.11406338959932327, -0.110117606818676, -0.10617182403802872, -0.10222603380680084, -0.09828025102615356, -0.09433446824550629, -0.09038868546485901, -0.08644290268421173, -0.08249711245298386, -0.07855132967233658, -0.0746055468916893, -0.07065975666046143, -0.06671397387981415, -0.06276819109916687, -0.05882240831851959, -0.054876621812582016, -0.05093083530664444, -0.04698505252599716, -0.043039269745349884, -0.03909348323941231, -0.03514769673347473, -0.031201913952827454, -0.027256129309535027, -0.0233103446662426, -0.019364560022950172, -0.015418775379657745, -0.011472990736365318, -0.007527206093072891, -0.003581421449780464, 0.0003643631935119629, 0.00431014783680439, 0.008255932480096817, 0.012201717123389244, 0.01614750176668167, 0.020093286409974098, 0.024039071053266525, 0.027984855696558952, 0.03193064033985138, 0.03587642312049866, 0.039822209626436234, 0.04376799613237381, 0.04771377891302109, 0.051659561693668365, 0.05560534819960594, 0.05955113470554352, 0.0634969174861908, 0.06744270026683807, 0.07138848304748535, 0.07533427327871323, 0.0792800560593605, 0.08322583884000778, 0.08717162907123566, 0.09111741185188293, 0.09506319463253021, 0.09900897741317749, 0.10295476019382477, 0.10690055042505264, 0.11084633320569992, 0.1147921159863472, 0.11873790621757507, 0.12268368899822235, 0.12662947177886963]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 7.0, 9.0, 15.0, 17.0, 26.0, 30.0, 43.0, 80.0, 103.0, 160.0, 201.0, 332.0, 528.0, 903.0, 1438.0, 2802.0, 5378.0, 10782.0, 23174.0, 52400.0, 120483.0, 258893.0, 298215.0, 150503.0, 65724.0, 28819.0, 13349.0, 6346.0, 3173.0, 1782.0, 993.0, 630.0, 360.0, 257.0, 177.0, 117.0, 84.0, 45.0, 44.0, 43.0, 23.0, 17.0, 7.0, 8.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.079345703125, -0.07708740234375, -0.0748291015625, -0.07257080078125, -0.0703125, -0.06805419921875, -0.0657958984375, -0.06353759765625, -0.061279296875, -0.05902099609375, -0.0567626953125, -0.05450439453125, -0.05224609375, -0.04998779296875, -0.0477294921875, -0.04547119140625, -0.043212890625, -0.04095458984375, -0.0386962890625, -0.03643798828125, -0.0341796875, -0.03192138671875, -0.0296630859375, -0.02740478515625, -0.025146484375, -0.02288818359375, -0.0206298828125, -0.01837158203125, -0.01611328125, -0.01385498046875, -0.0115966796875, -0.00933837890625, -0.007080078125, -0.00482177734375, -0.0025634765625, -0.00030517578125, 0.001953125, 0.00421142578125, 0.0064697265625, 0.00872802734375, 0.010986328125, 0.01324462890625, 0.0155029296875, 0.01776123046875, 0.02001953125, 0.02227783203125, 0.0245361328125, 0.02679443359375, 0.029052734375, 0.03131103515625, 0.0335693359375, 0.03582763671875, 0.0380859375, 0.04034423828125, 0.0426025390625, 0.04486083984375, 0.047119140625, 0.04937744140625, 0.0516357421875, 0.05389404296875, 0.05615234375, 0.05841064453125, 0.0606689453125, 0.06292724609375, 0.065185546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 13.0, 12.0, 22.0, 26.0, 42.0, 47.0, 50.0, 82.0, 69.0, 91.0, 83.0, 81.0, 63.0, 68.0, 56.0, 45.0, 35.0, 39.0, 18.0, 14.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.027905941009521484, -0.02704906463623047, -0.026192188262939453, -0.025335311889648438, -0.024478435516357422, -0.023621559143066406, -0.02276468276977539, -0.021907806396484375, -0.02105093002319336, -0.020194053649902344, -0.019337177276611328, -0.018480300903320312, -0.017623424530029297, -0.01676654815673828, -0.015909671783447266, -0.01505279541015625, -0.014195919036865234, -0.013339042663574219, -0.012482166290283203, -0.011625289916992188, -0.010768413543701172, -0.009911537170410156, -0.00905466079711914, -0.008197784423828125, -0.007340908050537109, -0.006484031677246094, -0.005627155303955078, -0.0047702789306640625, -0.003913402557373047, -0.0030565261840820312, -0.0021996498107910156, -0.0013427734375, -0.0004858970642089844, 0.00037097930908203125, 0.0012278556823730469, 0.0020847320556640625, 0.002941608428955078, 0.0037984848022460938, 0.004655361175537109, 0.005512237548828125, 0.006369113922119141, 0.007225990295410156, 0.008082866668701172, 0.008939743041992188, 0.009796619415283203, 0.010653495788574219, 0.011510372161865234, 0.01236724853515625, 0.013224124908447266, 0.014081001281738281, 0.014937877655029297, 0.015794754028320312, 0.016651630401611328, 0.017508506774902344, 0.01836538314819336, 0.019222259521484375, 0.02007913589477539, 0.020936012268066406, 0.021792888641357422, 0.022649765014648438, 0.023506641387939453, 0.02436351776123047, 0.025220394134521484, 0.0260772705078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 7.0, 5.0, 10.0, 8.0, 16.0, 21.0, 18.0, 41.0, 48.0, 69.0, 81.0, 130.0, 184.0, 223.0, 322.0, 536.0, 810.0, 1290.0, 2461.0, 5613.0, 13960.0, 41784.0, 133899.0, 370809.0, 316134.0, 105077.0, 33268.0, 11459.0, 4637.0, 2169.0, 1178.0, 735.0, 463.0, 312.0, 230.0, 139.0, 118.0, 63.0, 54.0, 38.0, 43.0, 25.0, 24.0, 14.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.097412109375, -0.0944509506225586, -0.09148979187011719, -0.08852863311767578, -0.08556747436523438, -0.08260631561279297, -0.07964515686035156, -0.07668399810791016, -0.07372283935546875, -0.07076168060302734, -0.06780052185058594, -0.06483936309814453, -0.061878204345703125, -0.05891704559326172, -0.05595588684082031, -0.052994728088378906, -0.0500335693359375, -0.047072410583496094, -0.04411125183105469, -0.04115009307861328, -0.038188934326171875, -0.03522777557373047, -0.03226661682128906, -0.029305458068847656, -0.02634429931640625, -0.023383140563964844, -0.020421981811523438, -0.01746082305908203, -0.014499664306640625, -0.011538505554199219, -0.008577346801757812, -0.005616188049316406, -0.002655029296875, 0.00030612945556640625, 0.0032672882080078125, 0.006228446960449219, 0.009189605712890625, 0.012150764465332031, 0.015111923217773438, 0.018073081970214844, 0.02103424072265625, 0.023995399475097656, 0.026956558227539062, 0.02991771697998047, 0.032878875732421875, 0.03584003448486328, 0.03880119323730469, 0.041762351989746094, 0.0447235107421875, 0.047684669494628906, 0.05064582824707031, 0.05360698699951172, 0.056568145751953125, 0.05952930450439453, 0.06249046325683594, 0.06545162200927734, 0.06841278076171875, 0.07137393951416016, 0.07433509826660156, 0.07729625701904297, 0.08025741577148438, 0.08321857452392578, 0.08617973327636719, 0.0891408920288086, 0.09210205078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 19.0, 23.0, 30.0, 21.0, 35.0, 30.0, 42.0, 44.0, 45.0, 55.0, 65.0, 58.0, 49.0, 43.0, 61.0, 52.0, 52.0, 30.0, 23.0, 34.0, 22.0, 22.0, 21.0, 18.0, 13.0, 16.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11798095703125, -0.11449813842773438, -0.11101531982421875, -0.10753250122070312, -0.1040496826171875, -0.10056686401367188, -0.09708404541015625, -0.09360122680664062, -0.090118408203125, -0.08663558959960938, -0.08315277099609375, -0.07966995239257812, -0.0761871337890625, -0.07270431518554688, -0.06922149658203125, -0.06573867797851562, -0.062255859375, -0.058773040771484375, -0.05529022216796875, -0.051807403564453125, -0.0483245849609375, -0.044841766357421875, -0.04135894775390625, -0.037876129150390625, -0.034393310546875, -0.030910491943359375, -0.02742767333984375, -0.023944854736328125, -0.0204620361328125, -0.016979217529296875, -0.01349639892578125, -0.010013580322265625, -0.00653076171875, -0.003047943115234375, 0.00043487548828125, 0.003917694091796875, 0.0074005126953125, 0.010883331298828125, 0.01436614990234375, 0.017848968505859375, 0.021331787109375, 0.024814605712890625, 0.02829742431640625, 0.031780242919921875, 0.0352630615234375, 0.038745880126953125, 0.04222869873046875, 0.045711517333984375, 0.0491943359375, 0.052677154541015625, 0.05615997314453125, 0.059642791748046875, 0.0631256103515625, 0.06660842895507812, 0.07009124755859375, 0.07357406616210938, 0.077056884765625, 0.08053970336914062, 0.08402252197265625, 0.08750534057617188, 0.0909881591796875, 0.09447097778320312, 0.09795379638671875, 0.10143661499023438, 0.10491943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 15.0, 11.0, 13.0, 22.0, 42.0, 63.0, 94.0, 125.0, 219.0, 377.0, 704.0, 1184.0, 2353.0, 4775.0, 10342.0, 25200.0, 72515.0, 296114.0, 460401.0, 111637.0, 35675.0, 13895.0, 6163.0, 2990.0, 1569.0, 830.0, 447.0, 266.0, 180.0, 104.0, 70.0, 57.0, 29.0, 21.0, 20.0, 6.0, 11.0, 7.0, 1.0, 0.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.0547032356262207, -0.052613258361816406, -0.05052328109741211, -0.04843330383300781, -0.046343326568603516, -0.04425334930419922, -0.04216337203979492, -0.040073394775390625, -0.03798341751098633, -0.03589344024658203, -0.033803462982177734, -0.03171348571777344, -0.02962350845336914, -0.027533531188964844, -0.025443553924560547, -0.02335357666015625, -0.021263599395751953, -0.019173622131347656, -0.01708364486694336, -0.014993667602539062, -0.012903690338134766, -0.010813713073730469, -0.008723735809326172, -0.006633758544921875, -0.004543781280517578, -0.0024538040161132812, -0.0003638267517089844, 0.0017261505126953125, 0.0038161277770996094, 0.005906105041503906, 0.007996082305908203, 0.0100860595703125, 0.012176036834716797, 0.014266014099121094, 0.01635599136352539, 0.018445968627929688, 0.020535945892333984, 0.02262592315673828, 0.024715900421142578, 0.026805877685546875, 0.028895854949951172, 0.03098583221435547, 0.033075809478759766, 0.03516578674316406, 0.03725576400756836, 0.039345741271972656, 0.04143571853637695, 0.04352569580078125, 0.04561567306518555, 0.047705650329589844, 0.04979562759399414, 0.05188560485839844, 0.053975582122802734, 0.05606555938720703, 0.05815553665161133, 0.060245513916015625, 0.06233549118041992, 0.06442546844482422, 0.06651544570922852, 0.06860542297363281, 0.07069540023803711, 0.0727853775024414, 0.0748753547668457, 0.07696533203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 17.0, 22.0, 32.0, 47.0, 72.0, 63.0, 78.0, 97.0, 114.0, 103.0, 78.0, 71.0, 61.0, 39.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.043988883495331e-05, -3.856047987937927e-05, -3.668107092380524e-05, -3.48016619682312e-05, -3.2922253012657166e-05, -3.104284405708313e-05, -2.9163435101509094e-05, -2.728402614593506e-05, -2.5404617190361023e-05, -2.3525208234786987e-05, -2.164579927921295e-05, -1.9766390323638916e-05, -1.788698136806488e-05, -1.6007572412490845e-05, -1.4128163456916809e-05, -1.2248754501342773e-05, -1.0369345545768738e-05, -8.489936590194702e-06, -6.6105276346206665e-06, -4.731118679046631e-06, -2.8517097234725952e-06, -9.723007678985596e-07, 9.071081876754761e-07, 2.7865171432495117e-06, 4.665926098823547e-06, 6.545335054397583e-06, 8.424744009971619e-06, 1.0304152965545654e-05, 1.218356192111969e-05, 1.4062970876693726e-05, 1.594237983226776e-05, 1.7821788787841797e-05, 1.9701197743415833e-05, 2.1580606698989868e-05, 2.3460015654563904e-05, 2.533942461013794e-05, 2.7218833565711975e-05, 2.909824252128601e-05, 3.0977651476860046e-05, 3.285706043243408e-05, 3.473646938800812e-05, 3.661587834358215e-05, 3.849528729915619e-05, 4.0374696254730225e-05, 4.225410521030426e-05, 4.4133514165878296e-05, 4.601292312145233e-05, 4.789233207702637e-05, 4.97717410326004e-05, 5.165114998817444e-05, 5.3530558943748474e-05, 5.540996789932251e-05, 5.7289376854896545e-05, 5.916878581047058e-05, 6.104819476604462e-05, 6.292760372161865e-05, 6.480701267719269e-05, 6.668642163276672e-05, 6.856583058834076e-05, 7.04452395439148e-05, 7.232464849948883e-05, 7.420405745506287e-05, 7.60834664106369e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 11.0, 13.0, 10.0, 12.0, 22.0, 26.0, 38.0, 56.0, 77.0, 114.0, 180.0, 266.0, 520.0, 847.0, 1827.0, 4155.0, 10959.0, 33791.0, 141930.0, 610947.0, 181656.0, 39563.0, 12376.0, 4771.0, 1966.0, 987.0, 495.0, 305.0, 180.0, 113.0, 71.0, 77.0, 51.0, 26.0, 24.0, 26.0, 14.0, 7.0, 6.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.0732269287109375, -0.070831298828125, -0.0684356689453125, -0.0660400390625, -0.0636444091796875, -0.061248779296875, -0.0588531494140625, -0.05645751953125, -0.0540618896484375, -0.051666259765625, -0.0492706298828125, -0.046875, -0.0444793701171875, -0.042083740234375, -0.0396881103515625, -0.03729248046875, -0.0348968505859375, -0.032501220703125, -0.0301055908203125, -0.0277099609375, -0.0253143310546875, -0.022918701171875, -0.0205230712890625, -0.01812744140625, -0.0157318115234375, -0.013336181640625, -0.0109405517578125, -0.008544921875, -0.0061492919921875, -0.003753662109375, -0.0013580322265625, 0.00103759765625, 0.0034332275390625, 0.005828857421875, 0.0082244873046875, 0.0106201171875, 0.0130157470703125, 0.015411376953125, 0.0178070068359375, 0.02020263671875, 0.0225982666015625, 0.024993896484375, 0.0273895263671875, 0.02978515625, 0.0321807861328125, 0.034576416015625, 0.0369720458984375, 0.03936767578125, 0.0417633056640625, 0.044158935546875, 0.0465545654296875, 0.0489501953125, 0.0513458251953125, 0.053741455078125, 0.0561370849609375, 0.05853271484375, 0.0609283447265625, 0.063323974609375, 0.0657196044921875, 0.068115234375, 0.0705108642578125, 0.072906494140625, 0.0753021240234375, 0.07769775390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 6.0, 11.0, 8.0, 10.0, 14.0, 21.0, 23.0, 30.0, 31.0, 46.0, 57.0, 85.0, 94.0, 92.0, 98.0, 71.0, 76.0, 50.0, 34.0, 22.0, 16.0, 20.0, 14.0, 11.0, 4.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0531005859375, -0.051512718200683594, -0.04992485046386719, -0.04833698272705078, -0.046749114990234375, -0.04516124725341797, -0.04357337951660156, -0.041985511779785156, -0.04039764404296875, -0.038809776306152344, -0.03722190856933594, -0.03563404083251953, -0.034046173095703125, -0.03245830535888672, -0.030870437622070312, -0.029282569885253906, -0.0276947021484375, -0.026106834411621094, -0.024518966674804688, -0.02293109893798828, -0.021343231201171875, -0.01975536346435547, -0.018167495727539062, -0.016579627990722656, -0.01499176025390625, -0.013403892517089844, -0.011816024780273438, -0.010228157043457031, -0.008640289306640625, -0.007052421569824219, -0.0054645538330078125, -0.0038766860961914062, -0.002288818359375, -0.0007009506225585938, 0.0008869171142578125, 0.0024747848510742188, 0.004062652587890625, 0.005650520324707031, 0.0072383880615234375, 0.008826255798339844, 0.01041412353515625, 0.012001991271972656, 0.013589859008789062, 0.015177726745605469, 0.016765594482421875, 0.01835346221923828, 0.019941329956054688, 0.021529197692871094, 0.0231170654296875, 0.024704933166503906, 0.026292800903320312, 0.02788066864013672, 0.029468536376953125, 0.03105640411376953, 0.03264427185058594, 0.034232139587402344, 0.03582000732421875, 0.037407875061035156, 0.03899574279785156, 0.04058361053466797, 0.042171478271484375, 0.04375934600830078, 0.04534721374511719, 0.046935081481933594, 0.04852294921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 17.0, 37.0, 60.0, 130.0, 164.0, 197.0, 179.0, 111.0, 61.0, 23.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36662888526916504, -0.3313409984111786, -0.29605311155319214, -0.2607652544975281, -0.22547736763954163, -0.19018948078155518, -0.15490160882472992, -0.11961373686790466, -0.08432585000991821, -0.04903797060251236, -0.013750091195106506, 0.021537788212299347, 0.0568256676197052, 0.09211355447769165, 0.1274014264345169, 0.16268929839134216, 0.1979771852493286, 0.23326507210731506, 0.2685529589653015, 0.3038408160209656, 0.339128702878952, 0.3744165897369385, 0.40970444679260254, 0.444992333650589, 0.48028022050857544, 0.5155680775642395, 0.5508559942245483, 0.5861438512802124, 0.6214317083358765, 0.6567196249961853, 0.6920074820518494, 0.7272953987121582, 0.7625832557678223, 0.7978711128234863, 0.8331590294837952, 0.8684468865394592, 0.9037348031997681, 0.9390226602554321, 0.9743105173110962, 1.0095983743667603, 1.0448863506317139, 1.080174207687378, 1.115462064743042, 1.1507500410079956, 1.1860378980636597, 1.2213257551193237, 1.2566136121749878, 1.2919014692306519, 1.327189326286316, 1.36247718334198, 1.397765040397644, 1.4330530166625977, 1.4683408737182617, 1.5036287307739258, 1.5389165878295898, 1.574204444885254, 1.609492301940918, 1.644780158996582, 1.680068016052246, 1.7153559923171997, 1.7506438493728638, 1.7859317064285278, 1.821219563484192, 1.856507420539856, 1.8917953968048096]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 12.0, 8.0, 27.0, 20.0, 23.0, 26.0, 40.0, 36.0, 49.0, 50.0, 69.0, 54.0, 61.0, 65.0, 62.0, 56.0, 44.0, 48.0, 49.0, 43.0, 27.0, 25.0, 22.0, 18.0, 10.0, 11.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6638667583465576, -0.6416358947753906, -0.6194049715995789, -0.5971741080284119, -0.5749431848526001, -0.5527123212814331, -0.5304814577102661, -0.5082505345344543, -0.48601964116096497, -0.4637887477874756, -0.4415578544139862, -0.4193269610404968, -0.39709609746932983, -0.37486517429351807, -0.3526343107223511, -0.3304034173488617, -0.3081725239753723, -0.28594163060188293, -0.26371073722839355, -0.24147985875606537, -0.219248965382576, -0.1970180720090866, -0.17478719353675842, -0.15255630016326904, -0.13032540678977966, -0.10809451341629028, -0.0858636274933815, -0.06363274157047272, -0.04140184819698334, -0.019170954823493958, 0.0030599236488342285, 0.02529081702232361, 0.047521770000457764, 0.06975266337394714, 0.09198354929685593, 0.11421443521976471, 0.1364453285932541, 0.15867622196674347, 0.18090710043907166, 0.20313799381256104, 0.22536888718605042, 0.2475997805595398, 0.2698306739330292, 0.29206156730651855, 0.31429243087768555, 0.3365233540534973, 0.3587542176246643, 0.3809851109981537, 0.40321600437164307, 0.42544689774513245, 0.4476777911186218, 0.4699086546897888, 0.4921395778656006, 0.5143704414367676, 0.5366013050079346, 0.5588322281837463, 0.5810631513595581, 0.6032940149307251, 0.6255249381065369, 0.6477558016777039, 0.6699867248535156, 0.6922175884246826, 0.7144484519958496, 0.7366793751716614, 0.7589102387428284]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 8.0, 11.0, 23.0, 32.0, 54.0, 93.0, 194.0, 348.0, 739.0, 1737.0, 5003.0, 21371.0, 176554.0, 3826009.0, 135625.0, 18810.0, 4659.0, 1604.0, 707.0, 332.0, 146.0, 105.0, 40.0, 33.0, 14.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17201614379882812, -0.16617584228515625, -0.16033554077148438, -0.1544952392578125, -0.14865493774414062, -0.14281463623046875, -0.13697433471679688, -0.131134033203125, -0.12529373168945312, -0.11945343017578125, -0.11361312866210938, -0.1077728271484375, -0.10193252563476562, -0.09609222412109375, -0.09025192260742188, -0.08441162109375, -0.07857131958007812, -0.07273101806640625, -0.06689071655273438, -0.0610504150390625, -0.055210113525390625, -0.04936981201171875, -0.043529510498046875, -0.037689208984375, -0.031848907470703125, -0.02600860595703125, -0.020168304443359375, -0.0143280029296875, -0.008487701416015625, -0.00264739990234375, 0.003192901611328125, 0.009033203125, 0.014873504638671875, 0.02071380615234375, 0.026554107666015625, 0.0323944091796875, 0.038234710693359375, 0.04407501220703125, 0.049915313720703125, 0.055755615234375, 0.061595916748046875, 0.06743621826171875, 0.07327651977539062, 0.0791168212890625, 0.08495712280273438, 0.09079742431640625, 0.09663772583007812, 0.10247802734375, 0.10831832885742188, 0.11415863037109375, 0.11999893188476562, 0.1258392333984375, 0.13167953491210938, 0.13751983642578125, 0.14336013793945312, 0.149200439453125, 0.15504074096679688, 0.16088104248046875, 0.16672134399414062, 0.1725616455078125, 0.17840194702148438, 0.18424224853515625, 0.19008255004882812, 0.1959228515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 9.0, 23.0, 23.0, 27.0, 27.0, 53.0, 62.0, 63.0, 58.0, 82.0, 75.0, 83.0, 54.0, 61.0, 42.0, 62.0, 38.0, 38.0, 25.0, 22.0, 14.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02801513671875, -0.027231693267822266, -0.02644824981689453, -0.025664806365966797, -0.024881362915039062, -0.024097919464111328, -0.023314476013183594, -0.02253103256225586, -0.021747589111328125, -0.02096414566040039, -0.020180702209472656, -0.019397258758544922, -0.018613815307617188, -0.017830371856689453, -0.01704692840576172, -0.016263484954833984, -0.01548004150390625, -0.014696598052978516, -0.013913154602050781, -0.013129711151123047, -0.012346267700195312, -0.011562824249267578, -0.010779380798339844, -0.00999593734741211, -0.009212493896484375, -0.00842905044555664, -0.007645606994628906, -0.006862163543701172, -0.0060787200927734375, -0.005295276641845703, -0.004511833190917969, -0.0037283897399902344, -0.0029449462890625, -0.0021615028381347656, -0.0013780593872070312, -0.0005946159362792969, 0.0001888275146484375, 0.0009722709655761719, 0.0017557144165039062, 0.0025391578674316406, 0.003322601318359375, 0.004106044769287109, 0.004889488220214844, 0.005672931671142578, 0.0064563751220703125, 0.007239818572998047, 0.008023262023925781, 0.008806705474853516, 0.00959014892578125, 0.010373592376708984, 0.011157035827636719, 0.011940479278564453, 0.012723922729492188, 0.013507366180419922, 0.014290809631347656, 0.01507425308227539, 0.015857696533203125, 0.01664113998413086, 0.017424583435058594, 0.018208026885986328, 0.018991470336914062, 0.019774913787841797, 0.02055835723876953, 0.021341800689697266, 0.022125244140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 11.0, 8.0, 21.0, 18.0, 33.0, 32.0, 38.0, 37.0, 54.0, 82.0, 157.0, 344.0, 1037.0, 4337.0, 31020.0, 2887850.0, 1235929.0, 27547.0, 3995.0, 987.0, 344.0, 117.0, 74.0, 47.0, 24.0, 22.0, 25.0, 13.0, 13.0, 13.0, 10.0, 5.0, 6.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317626953125, -0.3073692321777344, -0.29711151123046875, -0.2868537902832031, -0.2765960693359375, -0.2663383483886719, -0.25608062744140625, -0.24582290649414062, -0.235565185546875, -0.22530746459960938, -0.21504974365234375, -0.20479202270507812, -0.1945343017578125, -0.18427658081054688, -0.17401885986328125, -0.16376113891601562, -0.15350341796875, -0.14324569702148438, -0.13298797607421875, -0.12273025512695312, -0.1124725341796875, -0.10221481323242188, -0.09195709228515625, -0.08169937133789062, -0.071441650390625, -0.061183929443359375, -0.05092620849609375, -0.040668487548828125, -0.0304107666015625, -0.020153045654296875, -0.00989532470703125, 0.000362396240234375, 0.0106201171875, 0.020877838134765625, 0.03113555908203125, 0.041393280029296875, 0.0516510009765625, 0.061908721923828125, 0.07216644287109375, 0.08242416381835938, 0.092681884765625, 0.10293960571289062, 0.11319732666015625, 0.12345504760742188, 0.1337127685546875, 0.14397048950195312, 0.15422821044921875, 0.16448593139648438, 0.17474365234375, 0.18500137329101562, 0.19525909423828125, 0.20551681518554688, 0.2157745361328125, 0.22603225708007812, 0.23628997802734375, 0.24654769897460938, 0.256805419921875, 0.2670631408691406, 0.27732086181640625, 0.2875785827636719, 0.2978363037109375, 0.3080940246582031, 0.31835174560546875, 0.3286094665527344, 0.3388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 20.0, 25.0, 91.0, 188.0, 715.0, 2356.0, 381.0, 149.0, 48.0, 39.0, 23.0, 13.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1393880844116211, -0.1364421844482422, -0.13349628448486328, -0.13055038452148438, -0.12760448455810547, -0.12465858459472656, -0.12171268463134766, -0.11876678466796875, -0.11582088470458984, -0.11287498474121094, -0.10992908477783203, -0.10698318481445312, -0.10403728485107422, -0.10109138488769531, -0.0981454849243164, -0.0951995849609375, -0.0922536849975586, -0.08930778503417969, -0.08636188507080078, -0.08341598510742188, -0.08047008514404297, -0.07752418518066406, -0.07457828521728516, -0.07163238525390625, -0.06868648529052734, -0.06574058532714844, -0.06279468536376953, -0.059848785400390625, -0.05690288543701172, -0.05395698547363281, -0.051011085510253906, -0.048065185546875, -0.045119285583496094, -0.04217338562011719, -0.03922748565673828, -0.036281585693359375, -0.03333568572998047, -0.030389785766601562, -0.027443885803222656, -0.02449798583984375, -0.021552085876464844, -0.018606185913085938, -0.01566028594970703, -0.012714385986328125, -0.009768486022949219, -0.0068225860595703125, -0.0038766860961914062, -0.0009307861328125, 0.0020151138305664062, 0.0049610137939453125, 0.007906913757324219, 0.010852813720703125, 0.013798713684082031, 0.016744613647460938, 0.019690513610839844, 0.02263641357421875, 0.025582313537597656, 0.028528213500976562, 0.03147411346435547, 0.034420013427734375, 0.03736591339111328, 0.04031181335449219, 0.043257713317871094, 0.04620361328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 14.0, 30.0, 61.0, 88.0, 140.0, 168.0, 161.0, 133.0, 93.0, 65.0, 24.0, 11.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18401604890823364, -0.17166294157505035, -0.15930983424186707, -0.14695671200752258, -0.1346036046743393, -0.122250497341156, -0.10989739000797272, -0.09754427522420883, -0.08519116789102554, -0.07283806055784225, -0.06048494577407837, -0.04813183844089508, -0.035778727382421494, -0.023425616323947906, -0.011072508990764618, 0.0012806057929992676, 0.013633713126182556, 0.025986824184656143, 0.03833993524312973, 0.05069304257631302, 0.0630461573600769, 0.07539926469326019, 0.08775237202644348, 0.10010548681020737, 0.11245859414339066, 0.12481170147657394, 0.13716481626033783, 0.14951792359352112, 0.1618710309267044, 0.1742241382598877, 0.18657726049423218, 0.19893036782741547, 0.21128347516059875, 0.22363658249378204, 0.23598968982696533, 0.24834281206130981, 0.2606959044933319, 0.2730490267276764, 0.2854021191596985, 0.29775524139404297, 0.31010836362838745, 0.32246148586273193, 0.33481457829475403, 0.3471677005290985, 0.3595207929611206, 0.3718739151954651, 0.38422703742980957, 0.39658012986183167, 0.40893322229385376, 0.42128634452819824, 0.43363943696022034, 0.4459925591945648, 0.4583456516265869, 0.4706987738609314, 0.4830518960952759, 0.495404988527298, 0.5077581405639648, 0.5201112627983093, 0.5324643850326538, 0.5448174476623535, 0.557170569896698, 0.5695236921310425, 0.581876814365387, 0.5942299365997314, 0.6065829992294312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 11.0, 5.0, 18.0, 23.0, 24.0, 28.0, 30.0, 28.0, 23.0, 35.0, 50.0, 46.0, 40.0, 36.0, 32.0, 51.0, 42.0, 34.0, 44.0, 37.0, 45.0, 35.0, 41.0, 29.0, 19.0, 25.0, 20.0, 21.0, 12.0, 19.0, 9.0, 7.0, 14.0, 6.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.16341900825500488, -0.1584937572479248, -0.15356852114200592, -0.14864327013492584, -0.14371801912784576, -0.13879278302192688, -0.1338675320148468, -0.12894228100776672, -0.12401703745126724, -0.11909179389476776, -0.11416654288768768, -0.1092412993311882, -0.10431605577468872, -0.09939080476760864, -0.09446556121110916, -0.08954031765460968, -0.0846150666475296, -0.07968982309103012, -0.07476457208395004, -0.06983932852745056, -0.06491407752037048, -0.059988833963871, -0.05506359040737152, -0.05013834312558174, -0.04521309584379196, -0.04028784856200218, -0.0353626012802124, -0.03043735772371292, -0.02551211044192314, -0.020586863160133362, -0.01566161774098873, -0.010736372321844101, -0.005811125040054321, -0.0008858786895871162, 0.004039367660880089, 0.008964614011347294, 0.013889860361814499, 0.01881510764360428, 0.02374035306274891, 0.02866559848189354, 0.03359084576368332, 0.0385160930454731, 0.04344134032726288, 0.04836658388376236, 0.05329183116555214, 0.05821707844734192, 0.0631423220038414, 0.06806756556034088, 0.07299281656742096, 0.07791806012392044, 0.08284331113100052, 0.0877685546875, 0.09269380569458008, 0.09761904925107956, 0.10254429280757904, 0.10746954381465912, 0.1123947873711586, 0.11732003092765808, 0.12224528193473816, 0.12717053294181824, 0.13209576904773712, 0.1370210200548172, 0.14194627106189728, 0.14687150716781616, 0.15179675817489624]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 9.0, 9.0, 18.0, 23.0, 33.0, 43.0, 80.0, 133.0, 191.0, 314.0, 570.0, 972.0, 1916.0, 3876.0, 7944.0, 17487.0, 41180.0, 97913.0, 230820.0, 340556.0, 174744.0, 72925.0, 30731.0, 13254.0, 6154.0, 3024.0, 1556.0, 838.0, 513.0, 248.0, 187.0, 80.0, 77.0, 50.0, 31.0, 18.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0860595703125, -0.08362388610839844, -0.08118820190429688, -0.07875251770019531, -0.07631683349609375, -0.07388114929199219, -0.07144546508789062, -0.06900978088378906, -0.0665740966796875, -0.06413841247558594, -0.061702728271484375, -0.05926704406738281, -0.05683135986328125, -0.05439567565917969, -0.051959991455078125, -0.04952430725097656, -0.047088623046875, -0.04465293884277344, -0.042217254638671875, -0.03978157043457031, -0.03734588623046875, -0.03491020202636719, -0.032474517822265625, -0.030038833618164062, -0.0276031494140625, -0.025167465209960938, -0.022731781005859375, -0.020296096801757812, -0.01786041259765625, -0.015424728393554688, -0.012989044189453125, -0.010553359985351562, -0.00811767578125, -0.0056819915771484375, -0.003246307373046875, -0.0008106231689453125, 0.00162506103515625, 0.0040607452392578125, 0.006496429443359375, 0.008932113647460938, 0.0113677978515625, 0.013803482055664062, 0.016239166259765625, 0.018674850463867188, 0.02111053466796875, 0.023546218872070312, 0.025981903076171875, 0.028417587280273438, 0.030853271484375, 0.03328895568847656, 0.035724639892578125, 0.03816032409667969, 0.04059600830078125, 0.04303169250488281, 0.045467376708984375, 0.04790306091308594, 0.0503387451171875, 0.05277442932128906, 0.055210113525390625, 0.05764579772949219, 0.06008148193359375, 0.06251716613769531, 0.06495285034179688, 0.06738853454589844, 0.06982421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 5.0, 13.0, 11.0, 31.0, 22.0, 40.0, 39.0, 48.0, 48.0, 55.0, 68.0, 90.0, 69.0, 62.0, 49.0, 62.0, 49.0, 51.0, 36.0, 32.0, 36.0, 18.0, 17.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028775691986083984, -0.02796459197998047, -0.027153491973876953, -0.026342391967773438, -0.025531291961669922, -0.024720191955566406, -0.02390909194946289, -0.023097991943359375, -0.02228689193725586, -0.021475791931152344, -0.020664691925048828, -0.019853591918945312, -0.019042491912841797, -0.01823139190673828, -0.017420291900634766, -0.01660919189453125, -0.015798091888427734, -0.014986991882324219, -0.014175891876220703, -0.013364791870117188, -0.012553691864013672, -0.011742591857910156, -0.01093149185180664, -0.010120391845703125, -0.00930929183959961, -0.008498191833496094, -0.007687091827392578, -0.0068759918212890625, -0.006064891815185547, -0.005253791809082031, -0.004442691802978516, -0.003631591796875, -0.0028204917907714844, -0.0020093917846679688, -0.0011982917785644531, -0.0003871917724609375, 0.0004239082336425781, 0.0012350082397460938, 0.0020461082458496094, 0.002857208251953125, 0.0036683082580566406, 0.004479408264160156, 0.005290508270263672, 0.0061016082763671875, 0.006912708282470703, 0.007723808288574219, 0.008534908294677734, 0.00934600830078125, 0.010157108306884766, 0.010968208312988281, 0.011779308319091797, 0.012590408325195312, 0.013401508331298828, 0.014212608337402344, 0.01502370834350586, 0.015834808349609375, 0.01664590835571289, 0.017457008361816406, 0.018268108367919922, 0.019079208374023438, 0.019890308380126953, 0.02070140838623047, 0.021512508392333984, 0.0223236083984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 11.0, 11.0, 17.0, 40.0, 51.0, 76.0, 136.0, 231.0, 354.0, 774.0, 1513.0, 3769.0, 14688.0, 87902.0, 525238.0, 347483.0, 51292.0, 9468.0, 2770.0, 1209.0, 610.0, 338.0, 211.0, 122.0, 88.0, 51.0, 30.0, 18.0, 13.0, 11.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.1348094940185547, -0.12997055053710938, -0.12513160705566406, -0.12029266357421875, -0.11545372009277344, -0.11061477661132812, -0.10577583312988281, -0.1009368896484375, -0.09609794616699219, -0.09125900268554688, -0.08642005920410156, -0.08158111572265625, -0.07674217224121094, -0.07190322875976562, -0.06706428527832031, -0.062225341796875, -0.05738639831542969, -0.052547454833984375, -0.04770851135253906, -0.04286956787109375, -0.03803062438964844, -0.033191680908203125, -0.028352737426757812, -0.0235137939453125, -0.018674850463867188, -0.013835906982421875, -0.008996963500976562, -0.00415802001953125, 0.0006809234619140625, 0.005519866943359375, 0.010358810424804688, 0.01519775390625, 0.020036697387695312, 0.024875640869140625, 0.029714584350585938, 0.03455352783203125, 0.03939247131347656, 0.044231414794921875, 0.04907035827636719, 0.0539093017578125, 0.05874824523925781, 0.06358718872070312, 0.06842613220214844, 0.07326507568359375, 0.07810401916503906, 0.08294296264648438, 0.08778190612792969, 0.092620849609375, 0.09745979309082031, 0.10229873657226562, 0.10713768005371094, 0.11197662353515625, 0.11681556701660156, 0.12165451049804688, 0.1264934539794922, 0.1313323974609375, 0.1361713409423828, 0.14101028442382812, 0.14584922790527344, 0.15068817138671875, 0.15552711486816406, 0.16036605834960938, 0.1652050018310547, 0.1700439453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 3.0, 11.0, 14.0, 24.0, 20.0, 25.0, 36.0, 48.0, 26.0, 43.0, 29.0, 44.0, 74.0, 56.0, 59.0, 57.0, 48.0, 47.0, 47.0, 46.0, 29.0, 43.0, 27.0, 37.0, 16.0, 15.0, 12.0, 15.0, 15.0, 5.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10943603515625, -0.10591697692871094, -0.10239791870117188, -0.09887886047363281, -0.09535980224609375, -0.09184074401855469, -0.08832168579101562, -0.08480262756347656, -0.0812835693359375, -0.07776451110839844, -0.07424545288085938, -0.07072639465332031, -0.06720733642578125, -0.06368827819824219, -0.060169219970703125, -0.05665016174316406, -0.053131103515625, -0.04961204528808594, -0.046092987060546875, -0.04257392883300781, -0.03905487060546875, -0.03553581237792969, -0.032016754150390625, -0.028497695922851562, -0.0249786376953125, -0.021459579467773438, -0.017940521240234375, -0.014421463012695312, -0.01090240478515625, -0.0073833465576171875, -0.003864288330078125, -0.0003452301025390625, 0.003173828125, 0.0066928863525390625, 0.010211944580078125, 0.013731002807617188, 0.01725006103515625, 0.020769119262695312, 0.024288177490234375, 0.027807235717773438, 0.0313262939453125, 0.03484535217285156, 0.038364410400390625, 0.04188346862792969, 0.04540252685546875, 0.04892158508300781, 0.052440643310546875, 0.05595970153808594, 0.059478759765625, 0.06299781799316406, 0.06651687622070312, 0.07003593444824219, 0.07355499267578125, 0.07707405090332031, 0.08059310913085938, 0.08411216735839844, 0.0876312255859375, 0.09115028381347656, 0.09466934204101562, 0.09818840026855469, 0.10170745849609375, 0.10522651672363281, 0.10874557495117188, 0.11226463317871094, 0.11578369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 15.0, 17.0, 23.0, 26.0, 51.0, 70.0, 119.0, 177.0, 309.0, 480.0, 880.0, 1657.0, 3136.0, 6487.0, 14612.0, 41046.0, 180104.0, 594953.0, 143502.0, 35331.0, 13194.0, 5841.0, 2952.0, 1511.0, 809.0, 457.0, 284.0, 148.0, 118.0, 86.0, 49.0, 40.0, 18.0, 13.0, 13.0, 4.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.085205078125, -0.08286666870117188, -0.08052825927734375, -0.07818984985351562, -0.0758514404296875, -0.07351303100585938, -0.07117462158203125, -0.06883621215820312, -0.066497802734375, -0.06415939331054688, -0.06182098388671875, -0.059482574462890625, -0.0571441650390625, -0.054805755615234375, -0.05246734619140625, -0.050128936767578125, -0.04779052734375, -0.045452117919921875, -0.04311370849609375, -0.040775299072265625, -0.0384368896484375, -0.036098480224609375, -0.03376007080078125, -0.031421661376953125, -0.029083251953125, -0.026744842529296875, -0.02440643310546875, -0.022068023681640625, -0.0197296142578125, -0.017391204833984375, -0.01505279541015625, -0.012714385986328125, -0.0103759765625, -0.008037567138671875, -0.00569915771484375, -0.003360748291015625, -0.0010223388671875, 0.001316070556640625, 0.00365447998046875, 0.005992889404296875, 0.008331298828125, 0.010669708251953125, 0.01300811767578125, 0.015346527099609375, 0.0176849365234375, 0.020023345947265625, 0.02236175537109375, 0.024700164794921875, 0.02703857421875, 0.029376983642578125, 0.03171539306640625, 0.034053802490234375, 0.0363922119140625, 0.038730621337890625, 0.04106903076171875, 0.043407440185546875, 0.045745849609375, 0.048084259033203125, 0.05042266845703125, 0.052761077880859375, 0.0550994873046875, 0.057437896728515625, 0.05977630615234375, 0.062114715576171875, 0.064453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 13.0, 19.0, 33.0, 60.0, 101.0, 128.0, 184.0, 164.0, 116.0, 75.0, 41.0, 14.0, 18.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.091594696044922e-05, -5.781091749668121e-05, -5.470588803291321e-05, -5.16008585691452e-05, -4.84958291053772e-05, -4.539079964160919e-05, -4.2285770177841187e-05, -3.918074071407318e-05, -3.6075711250305176e-05, -3.297068178653717e-05, -2.9865652322769165e-05, -2.676062285900116e-05, -2.3655593395233154e-05, -2.055056393146515e-05, -1.7445534467697144e-05, -1.4340505003929138e-05, -1.1235475540161133e-05, -8.130446076393127e-06, -5.025416612625122e-06, -1.9203871488571167e-06, 1.1846423149108887e-06, 4.289671778678894e-06, 7.394701242446899e-06, 1.0499730706214905e-05, 1.360476016998291e-05, 1.6709789633750916e-05, 1.981481909751892e-05, 2.2919848561286926e-05, 2.602487802505493e-05, 2.9129907488822937e-05, 3.223493695259094e-05, 3.533996641635895e-05, 3.844499588012695e-05, 4.155002534389496e-05, 4.4655054807662964e-05, 4.776008427143097e-05, 5.0865113735198975e-05, 5.397014319896698e-05, 5.7075172662734985e-05, 6.018020212650299e-05, 6.3285231590271e-05, 6.6390261054039e-05, 6.949529051780701e-05, 7.260031998157501e-05, 7.570534944534302e-05, 7.881037890911102e-05, 8.191540837287903e-05, 8.502043783664703e-05, 8.812546730041504e-05, 9.123049676418304e-05, 9.433552622795105e-05, 9.744055569171906e-05, 0.00010054558515548706, 0.00010365061461925507, 0.00010675564408302307, 0.00010986067354679108, 0.00011296570301055908, 0.00011607073247432709, 0.00011917576193809509, 0.0001222807914018631, 0.0001253858208656311, 0.0001284908503293991, 0.00013159587979316711, 0.00013470090925693512, 0.00013780593872070312]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 11.0, 14.0, 14.0, 14.0, 26.0, 36.0, 53.0, 85.0, 154.0, 256.0, 463.0, 985.0, 2175.0, 5539.0, 17410.0, 82048.0, 652068.0, 237791.0, 33767.0, 9375.0, 3332.0, 1381.0, 670.0, 345.0, 181.0, 103.0, 73.0, 54.0, 29.0, 25.0, 16.0, 18.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08928298950195312, -0.08628082275390625, -0.08327865600585938, -0.0802764892578125, -0.07727432250976562, -0.07427215576171875, -0.07126998901367188, -0.068267822265625, -0.06526565551757812, -0.06226348876953125, -0.059261322021484375, -0.0562591552734375, -0.053256988525390625, -0.05025482177734375, -0.047252655029296875, -0.04425048828125, -0.041248321533203125, -0.03824615478515625, -0.035243988037109375, -0.0322418212890625, -0.029239654541015625, -0.02623748779296875, -0.023235321044921875, -0.020233154296875, -0.017230987548828125, -0.01422882080078125, -0.011226654052734375, -0.0082244873046875, -0.005222320556640625, -0.00222015380859375, 0.000782012939453125, 0.0037841796875, 0.006786346435546875, 0.00978851318359375, 0.012790679931640625, 0.0157928466796875, 0.018795013427734375, 0.02179718017578125, 0.024799346923828125, 0.027801513671875, 0.030803680419921875, 0.03380584716796875, 0.036808013916015625, 0.0398101806640625, 0.042812347412109375, 0.04581451416015625, 0.048816680908203125, 0.05181884765625, 0.054821014404296875, 0.05782318115234375, 0.060825347900390625, 0.0638275146484375, 0.06682968139648438, 0.06983184814453125, 0.07283401489257812, 0.075836181640625, 0.07883834838867188, 0.08184051513671875, 0.08484268188476562, 0.0878448486328125, 0.09084701538085938, 0.09384918212890625, 0.09685134887695312, 0.099853515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 21.0, 14.0, 18.0, 38.0, 55.0, 65.0, 119.0, 110.0, 112.0, 109.0, 70.0, 50.0, 42.0, 41.0, 19.0, 20.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.08099365234375, -0.0790705680847168, -0.0771474838256836, -0.07522439956665039, -0.07330131530761719, -0.07137823104858398, -0.06945514678955078, -0.06753206253051758, -0.06560897827148438, -0.06368589401245117, -0.06176280975341797, -0.059839725494384766, -0.05791664123535156, -0.05599355697631836, -0.054070472717285156, -0.05214738845825195, -0.05022430419921875, -0.04830121994018555, -0.046378135681152344, -0.04445505142211914, -0.04253196716308594, -0.040608882904052734, -0.03868579864501953, -0.03676271438598633, -0.034839630126953125, -0.03291654586791992, -0.03099346160888672, -0.029070377349853516, -0.027147293090820312, -0.02522420883178711, -0.023301124572753906, -0.021378040313720703, -0.0194549560546875, -0.017531871795654297, -0.015608787536621094, -0.01368570327758789, -0.011762619018554688, -0.009839534759521484, -0.007916450500488281, -0.005993366241455078, -0.004070281982421875, -0.002147197723388672, -0.00022411346435546875, 0.0016989707946777344, 0.0036220550537109375, 0.005545139312744141, 0.007468223571777344, 0.009391307830810547, 0.01131439208984375, 0.013237476348876953, 0.015160560607910156, 0.01708364486694336, 0.019006729125976562, 0.020929813385009766, 0.02285289764404297, 0.024775981903076172, 0.026699066162109375, 0.028622150421142578, 0.03054523468017578, 0.032468318939208984, 0.03439140319824219, 0.03631448745727539, 0.038237571716308594, 0.0401606559753418, 0.042083740234375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 13.0, 29.0, 73.0, 141.0, 238.0, 213.0, 161.0, 73.0, 48.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3839235305786133, -0.3415030539035797, -0.29908257722854614, -0.25666213035583496, -0.2142416536808014, -0.17182117700576782, -0.12940073013305664, -0.08698025345802307, -0.0445597767829895, -0.0021393075585365295, 0.04028116166591644, 0.08270162343978882, 0.1251221001148224, 0.16754257678985596, 0.20996302366256714, 0.2523835003376007, 0.2948039770126343, 0.33722445368766785, 0.3796449303627014, 0.4220653772354126, 0.46448585391044617, 0.5069063305854797, 0.5493267774581909, 0.5917472839355469, 0.6341677308082581, 0.6765881776809692, 0.7190086841583252, 0.7614291310310364, 0.8038495779037476, 0.8462700843811035, 0.8886905312538147, 0.9311109781265259, 0.9735314846038818, 1.0159519910812378, 1.0583723783493042, 1.1007928848266602, 1.1432133913040161, 1.185633897781372, 1.2280542850494385, 1.2704747915267944, 1.3128952980041504, 1.3553158044815063, 1.3977361917495728, 1.4401566982269287, 1.4825772047042847, 1.5249977111816406, 1.567418098449707, 1.609838604927063, 1.6522589921951294, 1.6946794986724854, 1.7370998859405518, 1.7795203924179077, 1.8219408988952637, 1.86436128616333, 1.906781792640686, 1.949202299118042, 1.9916226863861084, 2.034043073654175, 2.0764636993408203, 2.1188840866088867, 2.161304473876953, 2.2037250995635986, 2.246145486831665, 2.2885658740997314, 2.330986499786377]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 6.0, 10.0, 9.0, 21.0, 16.0, 19.0, 37.0, 29.0, 31.0, 26.0, 46.0, 29.0, 32.0, 48.0, 52.0, 37.0, 38.0, 57.0, 38.0, 46.0, 47.0, 41.0, 38.0, 35.0, 17.0, 31.0, 25.0, 22.0, 19.0, 18.0, 14.0, 9.0, 5.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47896742820739746, -0.46249446272850037, -0.44602149724960327, -0.4295485019683838, -0.4130755364894867, -0.3966025710105896, -0.3801296055316925, -0.3636566400527954, -0.3471836447715759, -0.33071067929267883, -0.31423771381378174, -0.29776471853256226, -0.28129175305366516, -0.26481878757476807, -0.24834582209587097, -0.23187285661697388, -0.21539989113807678, -0.1989269256591797, -0.1824539452791214, -0.1659809798002243, -0.14950799942016602, -0.13303503394126892, -0.11656206846237183, -0.10008909553289413, -0.08361612260341644, -0.06714314967393875, -0.05067018046975136, -0.034197211265563965, -0.017724238336086273, -0.0012512654066085815, 0.015221700072288513, 0.031694673001766205, 0.048167645931243896, 0.06464061886072159, 0.08111359179019928, 0.09758655726909637, 0.11405953019857407, 0.13053250312805176, 0.14700546860694885, 0.16347843408584595, 0.17995141446590424, 0.19642437994480133, 0.21289736032485962, 0.2293703258037567, 0.2458432912826538, 0.2623162865638733, 0.278789222240448, 0.2952622175216675, 0.3117351830005646, 0.32820814847946167, 0.34468111395835876, 0.36115407943725586, 0.37762707471847534, 0.39410004019737244, 0.41057300567626953, 0.4270459711551666, 0.4435189366340637, 0.4599919021129608, 0.4764648675918579, 0.4929378628730774, 0.5094107985496521, 0.5258837938308716, 0.5423567295074463, 0.5588297247886658, 0.5753027200698853]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 10.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 63.0, 97.0, 160.0, 253.0, 381.0, 577.0, 997.0, 1750.0, 3053.0, 5866.0, 12166.0, 28015.0, 81229.0, 398437.0, 3217664.0, 321066.0, 71780.0, 25910.0, 11417.0, 5647.0, 3115.0, 1716.0, 1019.0, 617.0, 385.0, 249.0, 155.0, 118.0, 61.0, 49.0, 39.0, 15.0, 16.0, 11.0, 2.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08563232421875, -0.08290958404541016, -0.08018684387207031, -0.07746410369873047, -0.07474136352539062, -0.07201862335205078, -0.06929588317871094, -0.0665731430053711, -0.06385040283203125, -0.061127662658691406, -0.05840492248535156, -0.05568218231201172, -0.052959442138671875, -0.05023670196533203, -0.04751396179199219, -0.044791221618652344, -0.0420684814453125, -0.039345741271972656, -0.03662300109863281, -0.03390026092529297, -0.031177520751953125, -0.02845478057861328, -0.025732040405273438, -0.023009300231933594, -0.02028656005859375, -0.017563819885253906, -0.014841079711914062, -0.012118339538574219, -0.009395599365234375, -0.006672859191894531, -0.0039501190185546875, -0.0012273788452148438, 0.001495361328125, 0.004218101501464844, 0.0069408416748046875, 0.009663581848144531, 0.012386322021484375, 0.015109062194824219, 0.017831802368164062, 0.020554542541503906, 0.02327728271484375, 0.026000022888183594, 0.028722763061523438, 0.03144550323486328, 0.034168243408203125, 0.03689098358154297, 0.03961372375488281, 0.042336463928222656, 0.0450592041015625, 0.047781944274902344, 0.05050468444824219, 0.05322742462158203, 0.055950164794921875, 0.05867290496826172, 0.06139564514160156, 0.0641183853149414, 0.06684112548828125, 0.0695638656616211, 0.07228660583496094, 0.07500934600830078, 0.07773208618164062, 0.08045482635498047, 0.08317756652832031, 0.08590030670166016, 0.088623046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 12.0, 12.0, 15.0, 28.0, 35.0, 33.0, 49.0, 39.0, 69.0, 63.0, 58.0, 79.0, 74.0, 49.0, 57.0, 57.0, 56.0, 49.0, 31.0, 28.0, 24.0, 20.0, 10.0, 9.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264434814453125, -0.02564382553100586, -0.02484416961669922, -0.024044513702392578, -0.023244857788085938, -0.022445201873779297, -0.021645545959472656, -0.020845890045166016, -0.020046234130859375, -0.019246578216552734, -0.018446922302246094, -0.017647266387939453, -0.016847610473632812, -0.016047954559326172, -0.015248298645019531, -0.01444864273071289, -0.01364898681640625, -0.01284933090209961, -0.012049674987792969, -0.011250019073486328, -0.010450363159179688, -0.009650707244873047, -0.008851051330566406, -0.008051395416259766, -0.007251739501953125, -0.006452083587646484, -0.005652427673339844, -0.004852771759033203, -0.0040531158447265625, -0.003253459930419922, -0.0024538040161132812, -0.0016541481018066406, -0.0008544921875, -5.4836273193359375e-05, 0.0007448196411132812, 0.0015444755554199219, 0.0023441314697265625, 0.003143787384033203, 0.003943443298339844, 0.004743099212646484, 0.005542755126953125, 0.006342411041259766, 0.007142066955566406, 0.007941722869873047, 0.008741378784179688, 0.009541034698486328, 0.010340690612792969, 0.01114034652709961, 0.01194000244140625, 0.01273965835571289, 0.013539314270019531, 0.014338970184326172, 0.015138626098632812, 0.015938282012939453, 0.016737937927246094, 0.017537593841552734, 0.018337249755859375, 0.019136905670166016, 0.019936561584472656, 0.020736217498779297, 0.021535873413085938, 0.022335529327392578, 0.02313518524169922, 0.02393484115600586, 0.0247344970703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 6.0, 9.0, 14.0, 26.0, 22.0, 27.0, 42.0, 47.0, 80.0, 115.0, 226.0, 436.0, 928.0, 2623.0, 9960.0, 62440.0, 1356542.0, 2660067.0, 82842.0, 12506.0, 3115.0, 1095.0, 440.0, 242.0, 154.0, 87.0, 47.0, 36.0, 31.0, 24.0, 15.0, 8.0, 10.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17898178100585938, -0.17302703857421875, -0.16707229614257812, -0.1611175537109375, -0.15516281127929688, -0.14920806884765625, -0.14325332641601562, -0.137298583984375, -0.13134384155273438, -0.12538909912109375, -0.11943435668945312, -0.1134796142578125, -0.10752487182617188, -0.10157012939453125, -0.09561538696289062, -0.08966064453125, -0.08370590209960938, -0.07775115966796875, -0.07179641723632812, -0.0658416748046875, -0.059886932373046875, -0.05393218994140625, -0.047977447509765625, -0.042022705078125, -0.036067962646484375, -0.03011322021484375, -0.024158477783203125, -0.0182037353515625, -0.012248992919921875, -0.00629425048828125, -0.000339508056640625, 0.005615234375, 0.011569976806640625, 0.01752471923828125, 0.023479461669921875, 0.0294342041015625, 0.035388946533203125, 0.04134368896484375, 0.047298431396484375, 0.053253173828125, 0.059207916259765625, 0.06516265869140625, 0.07111740112304688, 0.0770721435546875, 0.08302688598632812, 0.08898162841796875, 0.09493637084960938, 0.10089111328125, 0.10684585571289062, 0.11280059814453125, 0.11875534057617188, 0.1247100830078125, 0.13066482543945312, 0.13661956787109375, 0.14257431030273438, 0.148529052734375, 0.15448379516601562, 0.16043853759765625, 0.16639328002929688, 0.1723480224609375, 0.17830276489257812, 0.18425750732421875, 0.19021224975585938, 0.1961669921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 12.0, 32.0, 51.0, 96.0, 208.0, 527.0, 1680.0, 842.0, 298.0, 124.0, 78.0, 35.0, 35.0, 8.0, 11.0, 7.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.10387325286865234, -0.10111808776855469, -0.09836292266845703, -0.09560775756835938, -0.09285259246826172, -0.09009742736816406, -0.0873422622680664, -0.08458709716796875, -0.0818319320678711, -0.07907676696777344, -0.07632160186767578, -0.07356643676757812, -0.07081127166748047, -0.06805610656738281, -0.06530094146728516, -0.0625457763671875, -0.059790611267089844, -0.05703544616699219, -0.05428028106689453, -0.051525115966796875, -0.04876995086669922, -0.04601478576660156, -0.043259620666503906, -0.04050445556640625, -0.037749290466308594, -0.03499412536621094, -0.03223896026611328, -0.029483795166015625, -0.02672863006591797, -0.023973464965820312, -0.021218299865722656, -0.018463134765625, -0.015707969665527344, -0.012952804565429688, -0.010197639465332031, -0.007442474365234375, -0.004687309265136719, -0.0019321441650390625, 0.0008230209350585938, 0.00357818603515625, 0.006333351135253906, 0.009088516235351562, 0.011843681335449219, 0.014598846435546875, 0.01735401153564453, 0.020109176635742188, 0.022864341735839844, 0.0256195068359375, 0.028374671936035156, 0.031129837036132812, 0.03388500213623047, 0.036640167236328125, 0.03939533233642578, 0.04215049743652344, 0.044905662536621094, 0.04766082763671875, 0.050415992736816406, 0.05317115783691406, 0.05592632293701172, 0.058681488037109375, 0.06143665313720703, 0.06419181823730469, 0.06694698333740234, 0.0697021484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 16.0, 76.0, 146.0, 265.0, 271.0, 135.0, 59.0, 25.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453777015209198, -0.42830225825309753, -0.40282750129699707, -0.377352774143219, -0.35187798738479614, -0.32640326023101807, -0.3009285032749176, -0.27545374631881714, -0.24997898936271667, -0.2245042324066162, -0.19902947545051575, -0.17355473339557648, -0.148079976439476, -0.12260521948337555, -0.09713047742843628, -0.07165572047233582, -0.04618096351623535, -0.020706210285425186, 0.004768542945384979, 0.030243292450904846, 0.05571804940700531, 0.08119280636310577, 0.10666754841804504, 0.1321423053741455, 0.15761706233024597, 0.18309181928634644, 0.2085665762424469, 0.23404131829738617, 0.25951606035232544, 0.2849908471107483, 0.31046557426452637, 0.33594033122062683, 0.3614150285720825, 0.386889785528183, 0.41236454248428345, 0.4378392696380615, 0.4633140563964844, 0.48878878355026245, 0.5142635107040405, 0.5397382974624634, 0.5652130842208862, 0.5906878113746643, 0.6161625981330872, 0.6416373252868652, 0.6671121120452881, 0.6925868391990662, 0.7180615663528442, 0.7435363531112671, 0.7690110802650452, 0.7944858074188232, 0.8199605941772461, 0.8454353213310242, 0.870910108089447, 0.8963848352432251, 0.921859622001648, 0.947334349155426, 0.9728090763092041, 0.9982838034629822, 1.0237585306167603, 1.049233317375183, 1.074708104133606, 1.1001828908920288, 1.125657558441162, 1.151132345199585, 1.1766071319580078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 0.0, 7.0, 8.0, 13.0, 16.0, 21.0, 22.0, 22.0, 19.0, 31.0, 45.0, 28.0, 34.0, 49.0, 53.0, 40.0, 53.0, 35.0, 34.0, 51.0, 37.0, 31.0, 43.0, 45.0, 46.0, 36.0, 25.0, 29.0, 27.0, 24.0, 16.0, 13.0, 10.0, 13.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20565760135650635, -0.19885583221912384, -0.19205406308174133, -0.18525227904319763, -0.17845050990581512, -0.17164874076843262, -0.16484695672988892, -0.1580451875925064, -0.1512434184551239, -0.1444416493177414, -0.1376398801803589, -0.13083809614181519, -0.12403632700443268, -0.11723455786705017, -0.11043278127908707, -0.10363100469112396, -0.09682923555374146, -0.09002746641635895, -0.08322568982839584, -0.07642391324043274, -0.06962214410305023, -0.06282037496566772, -0.05601859837770462, -0.049216825515031815, -0.04241505265235901, -0.0356132797896862, -0.028811506927013397, -0.02200973406434059, -0.015207961201667786, -0.00840618833899498, -0.001604415476322174, 0.005197357386350632, 0.011999130249023438, 0.018800903111696243, 0.02560267597436905, 0.032404448837041855, 0.03920622169971466, 0.046007994562387466, 0.05280976742506027, 0.05961154028773308, 0.06641331315040588, 0.07321508228778839, 0.0800168588757515, 0.0868186354637146, 0.0936204046010971, 0.10042217373847961, 0.10722395032644272, 0.11402572691440582, 0.12082749605178833, 0.12762926518917084, 0.13443103432655334, 0.14123281836509705, 0.14803458750247955, 0.15483635663986206, 0.16163814067840576, 0.16843990981578827, 0.17524167895317078, 0.18204344809055328, 0.1888452172279358, 0.1956470012664795, 0.202448770403862, 0.2092505395412445, 0.2160523235797882, 0.22285409271717072, 0.22965586185455322]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 16.0, 23.0, 33.0, 57.0, 87.0, 133.0, 186.0, 353.0, 624.0, 1080.0, 1971.0, 3932.0, 8020.0, 17929.0, 39986.0, 94038.0, 258315.0, 376774.0, 139915.0, 57486.0, 25152.0, 11153.0, 5298.0, 2611.0, 1439.0, 775.0, 441.0, 246.0, 175.0, 89.0, 76.0, 45.0, 29.0, 18.0, 11.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.095703125, -0.0926370620727539, -0.08957099914550781, -0.08650493621826172, -0.08343887329101562, -0.08037281036376953, -0.07730674743652344, -0.07424068450927734, -0.07117462158203125, -0.06810855865478516, -0.06504249572753906, -0.06197643280029297, -0.058910369873046875, -0.05584430694580078, -0.05277824401855469, -0.049712181091308594, -0.0466461181640625, -0.043580055236816406, -0.04051399230957031, -0.03744792938232422, -0.034381866455078125, -0.03131580352783203, -0.028249740600585938, -0.025183677673339844, -0.02211761474609375, -0.019051551818847656, -0.015985488891601562, -0.012919425964355469, -0.009853363037109375, -0.006787300109863281, -0.0037212371826171875, -0.0006551742553710938, 0.002410888671875, 0.005476951599121094, 0.008543014526367188, 0.011609077453613281, 0.014675140380859375, 0.01774120330810547, 0.020807266235351562, 0.023873329162597656, 0.02693939208984375, 0.030005455017089844, 0.03307151794433594, 0.03613758087158203, 0.039203643798828125, 0.04226970672607422, 0.04533576965332031, 0.048401832580566406, 0.0514678955078125, 0.054533958435058594, 0.05760002136230469, 0.06066608428955078, 0.06373214721679688, 0.06679821014404297, 0.06986427307128906, 0.07293033599853516, 0.07599639892578125, 0.07906246185302734, 0.08212852478027344, 0.08519458770751953, 0.08826065063476562, 0.09132671356201172, 0.09439277648925781, 0.0974588394165039, 0.10052490234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 8.0, 17.0, 19.0, 23.0, 31.0, 22.0, 36.0, 39.0, 39.0, 56.0, 45.0, 55.0, 66.0, 75.0, 66.0, 51.0, 56.0, 55.0, 36.0, 37.0, 37.0, 29.0, 19.0, 14.0, 16.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244903564453125, -0.02372908592224121, -0.022967815399169922, -0.022206544876098633, -0.021445274353027344, -0.020684003829956055, -0.019922733306884766, -0.019161462783813477, -0.018400192260742188, -0.0176389217376709, -0.01687765121459961, -0.01611638069152832, -0.015355110168457031, -0.014593839645385742, -0.013832569122314453, -0.013071298599243164, -0.012310028076171875, -0.011548757553100586, -0.010787487030029297, -0.010026216506958008, -0.009264945983886719, -0.00850367546081543, -0.007742404937744141, -0.0069811344146728516, -0.0062198638916015625, -0.0054585933685302734, -0.004697322845458984, -0.003936052322387695, -0.0031747817993164062, -0.002413511276245117, -0.0016522407531738281, -0.0008909702301025391, -0.00012969970703125, 0.0006315708160400391, 0.0013928413391113281, 0.002154111862182617, 0.0029153823852539062, 0.0036766529083251953, 0.004437923431396484, 0.0051991939544677734, 0.0059604644775390625, 0.0067217350006103516, 0.007483005523681641, 0.00824427604675293, 0.009005546569824219, 0.009766817092895508, 0.010528087615966797, 0.011289358139038086, 0.012050628662109375, 0.012811899185180664, 0.013573169708251953, 0.014334440231323242, 0.015095710754394531, 0.01585698127746582, 0.01661825180053711, 0.0173795223236084, 0.018140792846679688, 0.018902063369750977, 0.019663333892822266, 0.020424604415893555, 0.021185874938964844, 0.021947145462036133, 0.022708415985107422, 0.02346968650817871, 0.02423095703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 12.0, 12.0, 21.0, 34.0, 41.0, 52.0, 76.0, 109.0, 174.0, 233.0, 318.0, 524.0, 954.0, 1895.0, 3884.0, 9881.0, 27873.0, 88781.0, 356294.0, 404812.0, 101579.0, 31174.0, 10726.0, 4361.0, 2016.0, 983.0, 578.0, 378.0, 241.0, 159.0, 93.0, 74.0, 73.0, 37.0, 21.0, 20.0, 21.0, 8.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.120025634765625, -0.11639404296875, -0.112762451171875, -0.109130859375, -0.105499267578125, -0.10186767578125, -0.098236083984375, -0.0946044921875, -0.090972900390625, -0.08734130859375, -0.083709716796875, -0.080078125, -0.076446533203125, -0.07281494140625, -0.069183349609375, -0.0655517578125, -0.061920166015625, -0.05828857421875, -0.054656982421875, -0.051025390625, -0.047393798828125, -0.04376220703125, -0.040130615234375, -0.0364990234375, -0.032867431640625, -0.02923583984375, -0.025604248046875, -0.02197265625, -0.018341064453125, -0.01470947265625, -0.011077880859375, -0.0074462890625, -0.003814697265625, -0.00018310546875, 0.003448486328125, 0.007080078125, 0.010711669921875, 0.01434326171875, 0.017974853515625, 0.0216064453125, 0.025238037109375, 0.02886962890625, 0.032501220703125, 0.0361328125, 0.039764404296875, 0.04339599609375, 0.047027587890625, 0.0506591796875, 0.054290771484375, 0.05792236328125, 0.061553955078125, 0.065185546875, 0.068817138671875, 0.07244873046875, 0.076080322265625, 0.0797119140625, 0.083343505859375, 0.08697509765625, 0.090606689453125, 0.09423828125, 0.097869873046875, 0.10150146484375, 0.105133056640625, 0.1087646484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 17.0, 21.0, 27.0, 29.0, 30.0, 42.0, 36.0, 44.0, 47.0, 40.0, 48.0, 52.0, 54.0, 47.0, 46.0, 43.0, 47.0, 52.0, 38.0, 42.0, 26.0, 17.0, 16.0, 14.0, 15.0, 16.0, 11.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09312629699707031, -0.08957290649414062, -0.08601951599121094, -0.08246612548828125, -0.07891273498535156, -0.07535934448242188, -0.07180595397949219, -0.0682525634765625, -0.06469917297363281, -0.061145782470703125, -0.05759239196777344, -0.05403900146484375, -0.05048561096191406, -0.046932220458984375, -0.04337882995605469, -0.039825439453125, -0.03627204895019531, -0.032718658447265625, -0.029165267944335938, -0.02561187744140625, -0.022058486938476562, -0.018505096435546875, -0.014951705932617188, -0.0113983154296875, -0.007844924926757812, -0.004291534423828125, -0.0007381439208984375, 0.00281524658203125, 0.0063686370849609375, 0.009922027587890625, 0.013475418090820312, 0.01702880859375, 0.020582199096679688, 0.024135589599609375, 0.027688980102539062, 0.03124237060546875, 0.03479576110839844, 0.038349151611328125, 0.04190254211425781, 0.0454559326171875, 0.04900932312011719, 0.052562713623046875, 0.05611610412597656, 0.05966949462890625, 0.06322288513183594, 0.06677627563476562, 0.07032966613769531, 0.073883056640625, 0.07743644714355469, 0.08098983764648438, 0.08454322814941406, 0.08809661865234375, 0.09165000915527344, 0.09520339965820312, 0.09875679016113281, 0.1023101806640625, 0.10586357116699219, 0.10941696166992188, 0.11297035217285156, 0.11652374267578125, 0.12007713317871094, 0.12363052368164062, 0.1271839141845703, 0.1307373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 11.0, 14.0, 34.0, 48.0, 68.0, 95.0, 191.0, 239.0, 531.0, 1054.0, 2345.0, 6162.0, 22586.0, 126141.0, 690588.0, 159301.0, 27021.0, 7087.0, 2612.0, 1129.0, 527.0, 307.0, 148.0, 98.0, 61.0, 46.0, 31.0, 14.0, 21.0, 4.0, 9.0, 5.0, 5.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10290718078613281, -0.09888076782226562, -0.09485435485839844, -0.09082794189453125, -0.08680152893066406, -0.08277511596679688, -0.07874870300292969, -0.0747222900390625, -0.07069587707519531, -0.06666946411132812, -0.06264305114746094, -0.05861663818359375, -0.05459022521972656, -0.050563812255859375, -0.04653739929199219, -0.042510986328125, -0.03848457336425781, -0.034458160400390625, -0.030431747436523438, -0.02640533447265625, -0.022378921508789062, -0.018352508544921875, -0.014326095581054688, -0.0102996826171875, -0.0062732696533203125, -0.002246856689453125, 0.0017795562744140625, 0.00580596923828125, 0.009832382202148438, 0.013858795166015625, 0.017885208129882812, 0.02191162109375, 0.025938034057617188, 0.029964447021484375, 0.03399085998535156, 0.03801727294921875, 0.04204368591308594, 0.046070098876953125, 0.05009651184082031, 0.0541229248046875, 0.05814933776855469, 0.062175750732421875, 0.06620216369628906, 0.07022857666015625, 0.07425498962402344, 0.07828140258789062, 0.08230781555175781, 0.086334228515625, 0.09036064147949219, 0.09438705444335938, 0.09841346740722656, 0.10243988037109375, 0.10646629333496094, 0.11049270629882812, 0.11451911926269531, 0.1185455322265625, 0.12257194519042969, 0.12659835815429688, 0.13062477111816406, 0.13465118408203125, 0.13867759704589844, 0.14270401000976562, 0.1467304229736328, 0.1507568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 10.0, 15.0, 13.0, 12.0, 22.0, 35.0, 45.0, 48.0, 50.0, 59.0, 71.0, 61.0, 78.0, 75.0, 67.0, 82.0, 39.0, 42.0, 25.0, 29.0, 16.0, 14.0, 12.0, 16.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.8689933717250824e-05, -3.7087127566337585e-05, -3.548432141542435e-05, -3.388151526451111e-05, -3.227870911359787e-05, -3.067590296268463e-05, -2.9073096811771393e-05, -2.7470290660858154e-05, -2.5867484509944916e-05, -2.4264678359031677e-05, -2.266187220811844e-05, -2.10590660572052e-05, -1.945625990629196e-05, -1.7853453755378723e-05, -1.6250647604465485e-05, -1.4647841453552246e-05, -1.3045035302639008e-05, -1.1442229151725769e-05, -9.83942300081253e-06, -8.236616849899292e-06, -6.6338106989860535e-06, -5.031004548072815e-06, -3.4281983971595764e-06, -1.8253922462463379e-06, -2.2258609533309937e-07, 1.3802200555801392e-06, 2.9830262064933777e-06, 4.585832357406616e-06, 6.188638508319855e-06, 7.791444659233093e-06, 9.394250810146332e-06, 1.099705696105957e-05, 1.2599863111972809e-05, 1.4202669262886047e-05, 1.5805475413799286e-05, 1.7408281564712524e-05, 1.9011087715625763e-05, 2.0613893866539e-05, 2.221670001745224e-05, 2.381950616836548e-05, 2.5422312319278717e-05, 2.7025118470191956e-05, 2.8627924621105194e-05, 3.0230730772018433e-05, 3.183353692293167e-05, 3.343634307384491e-05, 3.503914922475815e-05, 3.664195537567139e-05, 3.8244761526584625e-05, 3.9847567677497864e-05, 4.14503738284111e-05, 4.305317997932434e-05, 4.465598613023758e-05, 4.625879228115082e-05, 4.7861598432064056e-05, 4.9464404582977295e-05, 5.1067210733890533e-05, 5.267001688480377e-05, 5.427282303571701e-05, 5.587562918663025e-05, 5.747843533754349e-05, 5.9081241488456726e-05, 6.0684047639369965e-05, 6.22868537902832e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 30.0, 55.0, 59.0, 106.0, 121.0, 190.0, 300.0, 518.0, 943.0, 1970.0, 4132.0, 9323.0, 24855.0, 81671.0, 370543.0, 417370.0, 90700.0, 26846.0, 9908.0, 4311.0, 1945.0, 1055.0, 528.0, 321.0, 212.0, 135.0, 85.0, 63.0, 43.0, 33.0, 22.0, 16.0, 12.0, 18.0, 7.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.071044921875, -0.0686798095703125, -0.066314697265625, -0.0639495849609375, -0.06158447265625, -0.0592193603515625, -0.056854248046875, -0.0544891357421875, -0.0521240234375, -0.0497589111328125, -0.047393798828125, -0.0450286865234375, -0.04266357421875, -0.0402984619140625, -0.037933349609375, -0.0355682373046875, -0.033203125, -0.0308380126953125, -0.028472900390625, -0.0261077880859375, -0.02374267578125, -0.0213775634765625, -0.019012451171875, -0.0166473388671875, -0.0142822265625, -0.0119171142578125, -0.009552001953125, -0.0071868896484375, -0.00482177734375, -0.0024566650390625, -9.1552734375e-05, 0.0022735595703125, 0.004638671875, 0.0070037841796875, 0.009368896484375, 0.0117340087890625, 0.01409912109375, 0.0164642333984375, 0.018829345703125, 0.0211944580078125, 0.0235595703125, 0.0259246826171875, 0.028289794921875, 0.0306549072265625, 0.03302001953125, 0.0353851318359375, 0.037750244140625, 0.0401153564453125, 0.04248046875, 0.0448455810546875, 0.047210693359375, 0.0495758056640625, 0.05194091796875, 0.0543060302734375, 0.056671142578125, 0.0590362548828125, 0.0614013671875, 0.0637664794921875, 0.066131591796875, 0.0684967041015625, 0.07086181640625, 0.0732269287109375, 0.075592041015625, 0.0779571533203125, 0.080322265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 5.0, 7.0, 3.0, 9.0, 10.0, 7.0, 11.0, 23.0, 31.0, 32.0, 33.0, 40.0, 58.0, 87.0, 116.0, 113.0, 82.0, 74.0, 62.0, 35.0, 32.0, 23.0, 20.0, 15.0, 8.0, 11.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05446052551269531, -0.052585601806640625, -0.05071067810058594, -0.04883575439453125, -0.04696083068847656, -0.045085906982421875, -0.04321098327636719, -0.0413360595703125, -0.03946113586425781, -0.037586212158203125, -0.03571128845214844, -0.03383636474609375, -0.03196144104003906, -0.030086517333984375, -0.028211593627929688, -0.026336669921875, -0.024461746215820312, -0.022586822509765625, -0.020711898803710938, -0.01883697509765625, -0.016962051391601562, -0.015087127685546875, -0.013212203979492188, -0.0113372802734375, -0.009462356567382812, -0.007587432861328125, -0.0057125091552734375, -0.00383758544921875, -0.0019626617431640625, -8.7738037109375e-05, 0.0017871856689453125, 0.003662109375, 0.0055370330810546875, 0.007411956787109375, 0.009286880493164062, 0.01116180419921875, 0.013036727905273438, 0.014911651611328125, 0.016786575317382812, 0.0186614990234375, 0.020536422729492188, 0.022411346435546875, 0.024286270141601562, 0.02616119384765625, 0.028036117553710938, 0.029911041259765625, 0.03178596496582031, 0.033660888671875, 0.03553581237792969, 0.037410736083984375, 0.03928565979003906, 0.04116058349609375, 0.04303550720214844, 0.044910430908203125, 0.04678535461425781, 0.0486602783203125, 0.05053520202636719, 0.052410125732421875, 0.05428504943847656, 0.05615997314453125, 0.05803489685058594, 0.059909820556640625, 0.06178474426269531, 0.06365966796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 13.0, 17.0, 32.0, 42.0, 64.0, 101.0, 136.0, 126.0, 137.0, 99.0, 100.0, 54.0, 32.0, 12.0, 13.0, 10.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45304882526397705, -0.4243328273296356, -0.3956168293952942, -0.36690086126327515, -0.3381848633289337, -0.3094688653945923, -0.28075286746025085, -0.2520368695259094, -0.2233208864927292, -0.19460488855838776, -0.16588890552520752, -0.1371729075908661, -0.10845691710710526, -0.07974092662334442, -0.05102492868900299, -0.022308945655822754, 0.006407052278518677, 0.03512304276227951, 0.06383903324604034, 0.09255503118038177, 0.12127102166414261, 0.14998701214790344, 0.17870301008224487, 0.2074189931154251, 0.23613499104976654, 0.2648509740829468, 0.2935669720172882, 0.32228296995162964, 0.35099896788597107, 0.3797149658203125, 0.40843093395233154, 0.437146931886673, 0.4658629298210144, 0.49457892775535583, 0.5232949256896973, 0.5520108938217163, 0.5807269215583801, 0.6094428896903992, 0.638158917427063, 0.666874885559082, 0.6955908536911011, 0.7243068218231201, 0.7530228495597839, 0.781738817691803, 0.8104548454284668, 0.8391708135604858, 0.8678867816925049, 0.8966028094291687, 0.9253188371658325, 0.9540348052978516, 0.9827508330345154, 1.0114668607711792, 1.0401828289031982, 1.0688987970352173, 1.0976147651672363, 1.1263307332992554, 1.1550467014312744, 1.1837626695632935, 1.2124786376953125, 1.241194725036621, 1.2699106931686401, 1.2986266613006592, 1.3273426294326782, 1.3560585975646973, 1.3847746849060059]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 4.0, 4.0, 15.0, 3.0, 14.0, 5.0, 26.0, 17.0, 22.0, 22.0, 32.0, 34.0, 26.0, 43.0, 25.0, 43.0, 41.0, 42.0, 46.0, 42.0, 46.0, 29.0, 43.0, 40.0, 50.0, 35.0, 38.0, 31.0, 24.0, 21.0, 25.0, 20.0, 17.0, 18.0, 6.0, 10.0, 5.0, 7.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.6243494153022766, -0.6065165400505066, -0.5886836647987366, -0.5708507895469666, -0.5530179142951965, -0.5351850390434265, -0.5173521637916565, -0.4995192885398865, -0.48168641328811646, -0.46385353803634644, -0.4460206627845764, -0.4281877875328064, -0.4103549122810364, -0.39252203702926636, -0.37468916177749634, -0.3568562865257263, -0.3390234410762787, -0.32119056582450867, -0.30335769057273865, -0.28552481532096863, -0.2676919400691986, -0.2498590648174286, -0.23202620446681976, -0.21419332921504974, -0.19636045396327972, -0.1785275787115097, -0.16069470345973969, -0.14286184310913086, -0.12502896785736084, -0.10719608515501022, -0.0893632173538208, -0.07153034210205078, -0.05369746685028076, -0.03586459159851074, -0.01803172007203102, -0.00019884854555130005, 0.01763402670621872, 0.03546690195798874, 0.05329976975917816, 0.07113264501094818, 0.0889655202627182, 0.10679839551448822, 0.12463127076625824, 0.14246413111686707, 0.16029700636863708, 0.1781298816204071, 0.19596275687217712, 0.21379563212394714, 0.23162850737571716, 0.24946138262748718, 0.2672942578792572, 0.2851271331310272, 0.30296000838279724, 0.32079288363456726, 0.3386257290840149, 0.3564586043357849, 0.37429147958755493, 0.39212435483932495, 0.40995723009109497, 0.427790105342865, 0.445622980594635, 0.46345585584640503, 0.48128873109817505, 0.49912160634994507, 0.5169544816017151]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 10.0, 5.0, 7.0, 8.0, 9.0, 19.0, 26.0, 36.0, 55.0, 95.0, 121.0, 201.0, 324.0, 453.0, 749.0, 1308.0, 2158.0, 3917.0, 7088.0, 14270.0, 31409.0, 82453.0, 347514.0, 3228096.0, 332643.0, 80347.0, 30450.0, 13848.0, 7079.0, 3866.0, 2226.0, 1307.0, 794.0, 518.0, 305.0, 196.0, 122.0, 81.0, 57.0, 34.0, 26.0, 13.0, 12.0, 14.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07579898834228516, -0.07322883605957031, -0.07065868377685547, -0.06808853149414062, -0.06551837921142578, -0.06294822692871094, -0.060378074645996094, -0.05780792236328125, -0.055237770080566406, -0.05266761779785156, -0.05009746551513672, -0.047527313232421875, -0.04495716094970703, -0.04238700866699219, -0.039816856384277344, -0.0372467041015625, -0.034676551818847656, -0.03210639953613281, -0.02953624725341797, -0.026966094970703125, -0.02439594268798828, -0.021825790405273438, -0.019255638122558594, -0.01668548583984375, -0.014115333557128906, -0.011545181274414062, -0.008975028991699219, -0.006404876708984375, -0.0038347244262695312, -0.0012645721435546875, 0.0013055801391601562, 0.003875732421875, 0.006445884704589844, 0.009016036987304688, 0.011586189270019531, 0.014156341552734375, 0.01672649383544922, 0.019296646118164062, 0.021866798400878906, 0.02443695068359375, 0.027007102966308594, 0.029577255249023438, 0.03214740753173828, 0.034717559814453125, 0.03728771209716797, 0.03985786437988281, 0.042428016662597656, 0.0449981689453125, 0.047568321228027344, 0.05013847351074219, 0.05270862579345703, 0.055278778076171875, 0.05784893035888672, 0.06041908264160156, 0.0629892349243164, 0.06555938720703125, 0.0681295394897461, 0.07069969177246094, 0.07326984405517578, 0.07583999633789062, 0.07841014862060547, 0.08098030090332031, 0.08355045318603516, 0.08612060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 4.0, 14.0, 14.0, 14.0, 19.0, 29.0, 31.0, 23.0, 29.0, 33.0, 39.0, 45.0, 51.0, 55.0, 55.0, 45.0, 46.0, 42.0, 61.0, 47.0, 41.0, 35.0, 32.0, 25.0, 39.0, 16.0, 17.0, 13.0, 17.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0236358642578125, -0.022953510284423828, -0.022271156311035156, -0.021588802337646484, -0.020906448364257812, -0.02022409439086914, -0.01954174041748047, -0.018859386444091797, -0.018177032470703125, -0.017494678497314453, -0.01681232452392578, -0.01612997055053711, -0.015447616577148438, -0.014765262603759766, -0.014082908630371094, -0.013400554656982422, -0.01271820068359375, -0.012035846710205078, -0.011353492736816406, -0.010671138763427734, -0.009988784790039062, -0.00930643081665039, -0.008624076843261719, -0.007941722869873047, -0.007259368896484375, -0.006577014923095703, -0.005894660949707031, -0.005212306976318359, -0.0045299530029296875, -0.0038475990295410156, -0.0031652450561523438, -0.002482891082763672, -0.001800537109375, -0.0011181831359863281, -0.00043582916259765625, 0.0002465248107910156, 0.0009288787841796875, 0.0016112327575683594, 0.0022935867309570312, 0.002975940704345703, 0.003658294677734375, 0.004340648651123047, 0.005023002624511719, 0.005705356597900391, 0.0063877105712890625, 0.007070064544677734, 0.007752418518066406, 0.008434772491455078, 0.00911712646484375, 0.009799480438232422, 0.010481834411621094, 0.011164188385009766, 0.011846542358398438, 0.01252889633178711, 0.013211250305175781, 0.013893604278564453, 0.014575958251953125, 0.015258312225341797, 0.01594066619873047, 0.01662302017211914, 0.017305374145507812, 0.017987728118896484, 0.018670082092285156, 0.019352436065673828, 0.0200347900390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 6.0, 3.0, 13.0, 19.0, 32.0, 32.0, 51.0, 68.0, 122.0, 172.0, 235.0, 375.0, 602.0, 962.0, 1728.0, 3417.0, 7404.0, 19207.0, 58651.0, 264351.0, 3190667.0, 510964.0, 88674.0, 26631.0, 10131.0, 4415.0, 2155.0, 1184.0, 652.0, 426.0, 303.0, 206.0, 126.0, 95.0, 63.0, 40.0, 30.0, 21.0, 19.0, 11.0, 5.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.15625, -0.15174102783203125, -0.1472320556640625, -0.14272308349609375, -0.138214111328125, -0.13370513916015625, -0.1291961669921875, -0.12468719482421875, -0.12017822265625, -0.11566925048828125, -0.1111602783203125, -0.10665130615234375, -0.102142333984375, -0.09763336181640625, -0.0931243896484375, -0.08861541748046875, -0.0841064453125, -0.07959747314453125, -0.0750885009765625, -0.07057952880859375, -0.066070556640625, -0.06156158447265625, -0.0570526123046875, -0.05254364013671875, -0.04803466796875, -0.04352569580078125, -0.0390167236328125, -0.03450775146484375, -0.029998779296875, -0.02548980712890625, -0.0209808349609375, -0.01647186279296875, -0.011962890625, -0.00745391845703125, -0.0029449462890625, 0.00156402587890625, 0.006072998046875, 0.01058197021484375, 0.0150909423828125, 0.01959991455078125, 0.02410888671875, 0.02861785888671875, 0.0331268310546875, 0.03763580322265625, 0.042144775390625, 0.04665374755859375, 0.0511627197265625, 0.05567169189453125, 0.0601806640625, 0.06468963623046875, 0.0691986083984375, 0.07370758056640625, 0.078216552734375, 0.08272552490234375, 0.0872344970703125, 0.09174346923828125, 0.09625244140625, 0.10076141357421875, 0.1052703857421875, 0.10977935791015625, 0.114288330078125, 0.11879730224609375, 0.1233062744140625, 0.12781524658203125, 0.13232421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 11.0, 7.0, 6.0, 20.0, 27.0, 43.0, 48.0, 97.0, 203.0, 442.0, 1797.0, 689.0, 286.0, 135.0, 100.0, 55.0, 43.0, 17.0, 15.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.08368206024169922, -0.08112144470214844, -0.07856082916259766, -0.07600021362304688, -0.0734395980834961, -0.07087898254394531, -0.06831836700439453, -0.06575775146484375, -0.06319713592529297, -0.06063652038574219, -0.058075904846191406, -0.055515289306640625, -0.052954673767089844, -0.05039405822753906, -0.04783344268798828, -0.0452728271484375, -0.04271221160888672, -0.04015159606933594, -0.037590980529785156, -0.035030364990234375, -0.032469749450683594, -0.029909133911132812, -0.02734851837158203, -0.02478790283203125, -0.02222728729248047, -0.019666671752929688, -0.017106056213378906, -0.014545440673828125, -0.011984825134277344, -0.009424209594726562, -0.006863594055175781, -0.004302978515625, -0.0017423629760742188, 0.0008182525634765625, 0.0033788681030273438, 0.005939483642578125, 0.008500099182128906, 0.011060714721679688, 0.013621330261230469, 0.01618194580078125, 0.01874256134033203, 0.021303176879882812, 0.023863792419433594, 0.026424407958984375, 0.028985023498535156, 0.03154563903808594, 0.03410625457763672, 0.0366668701171875, 0.03922748565673828, 0.04178810119628906, 0.044348716735839844, 0.046909332275390625, 0.049469947814941406, 0.05203056335449219, 0.05459117889404297, 0.05715179443359375, 0.05971240997314453, 0.06227302551269531, 0.0648336410522461, 0.06739425659179688, 0.06995487213134766, 0.07251548767089844, 0.07507610321044922, 0.07763671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 31.0, 87.0, 192.0, 267.0, 242.0, 112.0, 48.0, 8.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5530012249946594, -0.5230609178543091, -0.49312061071395874, -0.4631803035736084, -0.43323999643325806, -0.4032996892929077, -0.3733593821525574, -0.34341907501220703, -0.3134787678718567, -0.28353846073150635, -0.253598153591156, -0.22365784645080566, -0.19371753931045532, -0.16377723217010498, -0.13383692502975464, -0.1038966178894043, -0.07395631074905396, -0.04401600360870361, -0.014075696468353271, 0.01586461067199707, 0.04580491781234741, 0.07574522495269775, 0.1056855320930481, 0.13562583923339844, 0.16556614637374878, 0.19550645351409912, 0.22544676065444946, 0.2553870677947998, 0.28532737493515015, 0.3152676820755005, 0.34520798921585083, 0.37514829635620117, 0.4050886631011963, 0.43502897024154663, 0.464969277381897, 0.4949095845222473, 0.5248498916625977, 0.554790198802948, 0.5847305059432983, 0.6146708130836487, 0.644611120223999, 0.6745514273643494, 0.7044917345046997, 0.73443204164505, 0.7643723487854004, 0.7943126559257507, 0.8242529630661011, 0.8541932702064514, 0.8841335773468018, 0.9140738844871521, 0.9440141916275024, 0.9739544987678528, 1.0038948059082031, 1.0338351726531982, 1.0637754201889038, 1.0937156677246094, 1.1236560344696045, 1.1535964012145996, 1.1835366487503052, 1.2134768962860107, 1.2434172630310059, 1.273357629776001, 1.3032978773117065, 1.333238124847412, 1.3631784915924072]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 6.0, 11.0, 10.0, 10.0, 15.0, 28.0, 14.0, 21.0, 37.0, 32.0, 42.0, 38.0, 34.0, 35.0, 36.0, 40.0, 46.0, 47.0, 45.0, 38.0, 38.0, 42.0, 31.0, 35.0, 36.0, 19.0, 31.0, 22.0, 22.0, 19.0, 10.0, 12.0, 12.0, 14.0, 12.0, 8.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20667040348052979, -0.19992177188396454, -0.1931731402873993, -0.18642450869083405, -0.1796758770942688, -0.17292724549770355, -0.1661786139011383, -0.15942999720573425, -0.1526813507080078, -0.14593271911144257, -0.13918408751487732, -0.13243545591831207, -0.12568682432174683, -0.11893819272518158, -0.11218956857919693, -0.10544093698263168, -0.09869231283664703, -0.09194368124008179, -0.08519504964351654, -0.0784464180469513, -0.07169778645038605, -0.0649491548538208, -0.05820053070783615, -0.051451899111270905, -0.04470326751470566, -0.03795463591814041, -0.031206006184220314, -0.024457376450300217, -0.01770874485373497, -0.010960113257169724, -0.004211485385894775, 0.002537146210670471, 0.009285777807235718, 0.016034409403800964, 0.02278303913772106, 0.02953166887164116, 0.036280300468206406, 0.04302893206477165, 0.0497775599360466, 0.05652619153261185, 0.0632748231291771, 0.07002345472574234, 0.07677208632230759, 0.08352071046829224, 0.09026934206485748, 0.09701797366142273, 0.10376660525798798, 0.11051523685455322, 0.11726386845111847, 0.12401250004768372, 0.13076113164424896, 0.1375097632408142, 0.14425839483737946, 0.1510070264339447, 0.15775564312934875, 0.1645042896270752, 0.17125290632247925, 0.1780015379190445, 0.18475016951560974, 0.191498801112175, 0.19824743270874023, 0.20499606430530548, 0.21174469590187073, 0.21849331259727478, 0.22524195909500122]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 11.0, 28.0, 25.0, 46.0, 62.0, 111.0, 175.0, 251.0, 347.0, 602.0, 939.0, 1554.0, 2488.0, 4323.0, 7165.0, 12326.0, 21456.0, 36904.0, 64043.0, 115578.0, 229409.0, 253454.0, 128815.0, 70663.0, 40944.0, 23226.0, 13731.0, 7911.0, 4626.0, 2834.0, 1695.0, 1036.0, 646.0, 408.0, 252.0, 158.0, 96.0, 88.0, 26.0, 25.0, 22.0, 12.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.071533203125, -0.06915569305419922, -0.06677818298339844, -0.06440067291259766, -0.062023162841796875, -0.059645652770996094, -0.05726814270019531, -0.05489063262939453, -0.05251312255859375, -0.05013561248779297, -0.04775810241699219, -0.045380592346191406, -0.043003082275390625, -0.040625572204589844, -0.03824806213378906, -0.03587055206298828, -0.0334930419921875, -0.03111553192138672, -0.028738021850585938, -0.026360511779785156, -0.023983001708984375, -0.021605491638183594, -0.019227981567382812, -0.01685047149658203, -0.01447296142578125, -0.012095451354980469, -0.009717941284179688, -0.007340431213378906, -0.004962921142578125, -0.0025854110717773438, -0.0002079010009765625, 0.0021696090698242188, 0.004547119140625, 0.006924629211425781, 0.009302139282226562, 0.011679649353027344, 0.014057159423828125, 0.016434669494628906, 0.018812179565429688, 0.02118968963623047, 0.02356719970703125, 0.02594470977783203, 0.028322219848632812, 0.030699729919433594, 0.033077239990234375, 0.035454750061035156, 0.03783226013183594, 0.04020977020263672, 0.0425872802734375, 0.04496479034423828, 0.04734230041503906, 0.049719810485839844, 0.052097320556640625, 0.054474830627441406, 0.05685234069824219, 0.05922985076904297, 0.06160736083984375, 0.06398487091064453, 0.06636238098144531, 0.0687398910522461, 0.07111740112304688, 0.07349491119384766, 0.07587242126464844, 0.07824993133544922, 0.08062744140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 5.0, 12.0, 5.0, 13.0, 18.0, 23.0, 15.0, 19.0, 22.0, 18.0, 35.0, 31.0, 36.0, 35.0, 38.0, 43.0, 43.0, 43.0, 42.0, 52.0, 33.0, 53.0, 41.0, 36.0, 30.0, 32.0, 29.0, 22.0, 26.0, 27.0, 18.0, 17.0, 10.0, 9.0, 9.0, 6.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0221099853515625, -0.021448612213134766, -0.02078723907470703, -0.020125865936279297, -0.019464492797851562, -0.018803119659423828, -0.018141746520996094, -0.01748037338256836, -0.016819000244140625, -0.01615762710571289, -0.015496253967285156, -0.014834880828857422, -0.014173507690429688, -0.013512134552001953, -0.012850761413574219, -0.012189388275146484, -0.01152801513671875, -0.010866641998291016, -0.010205268859863281, -0.009543895721435547, -0.008882522583007812, -0.008221149444580078, -0.007559776306152344, -0.006898403167724609, -0.006237030029296875, -0.005575656890869141, -0.004914283752441406, -0.004252910614013672, -0.0035915374755859375, -0.002930164337158203, -0.0022687911987304688, -0.0016074180603027344, -0.000946044921875, -0.0002846717834472656, 0.00037670135498046875, 0.0010380744934082031, 0.0016994476318359375, 0.002360820770263672, 0.0030221939086914062, 0.0036835670471191406, 0.004344940185546875, 0.005006313323974609, 0.005667686462402344, 0.006329059600830078, 0.0069904327392578125, 0.007651805877685547, 0.008313179016113281, 0.008974552154541016, 0.00963592529296875, 0.010297298431396484, 0.010958671569824219, 0.011620044708251953, 0.012281417846679688, 0.012942790985107422, 0.013604164123535156, 0.01426553726196289, 0.014926910400390625, 0.01558828353881836, 0.016249656677246094, 0.016911029815673828, 0.017572402954101562, 0.018233776092529297, 0.01889514923095703, 0.019556522369384766, 0.0202178955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 8.0, 14.0, 21.0, 27.0, 44.0, 55.0, 101.0, 176.0, 308.0, 455.0, 819.0, 1565.0, 3591.0, 10891.0, 44515.0, 255486.0, 601776.0, 97470.0, 20538.0, 5886.0, 2225.0, 1076.0, 535.0, 338.0, 216.0, 132.0, 103.0, 56.0, 44.0, 20.0, 16.0, 13.0, 8.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.21923828125, -0.21264266967773438, -0.20604705810546875, -0.19945144653320312, -0.1928558349609375, -0.18626022338867188, -0.17966461181640625, -0.17306900024414062, -0.166473388671875, -0.15987777709960938, -0.15328216552734375, -0.14668655395507812, -0.1400909423828125, -0.13349533081054688, -0.12689971923828125, -0.12030410766601562, -0.11370849609375, -0.10711288452148438, -0.10051727294921875, -0.09392166137695312, -0.0873260498046875, -0.08073043823242188, -0.07413482666015625, -0.06753921508789062, -0.060943603515625, -0.054347991943359375, -0.04775238037109375, -0.041156768798828125, -0.0345611572265625, -0.027965545654296875, -0.02136993408203125, -0.014774322509765625, -0.0081787109375, -0.001583099365234375, 0.00501251220703125, 0.011608123779296875, 0.0182037353515625, 0.024799346923828125, 0.03139495849609375, 0.037990570068359375, 0.044586181640625, 0.051181793212890625, 0.05777740478515625, 0.06437301635742188, 0.0709686279296875, 0.07756423950195312, 0.08415985107421875, 0.09075546264648438, 0.09735107421875, 0.10394668579101562, 0.11054229736328125, 0.11713790893554688, 0.1237335205078125, 0.13032913208007812, 0.13692474365234375, 0.14352035522460938, 0.150115966796875, 0.15671157836914062, 0.16330718994140625, 0.16990280151367188, 0.1764984130859375, 0.18309402465820312, 0.18968963623046875, 0.19628524780273438, 0.202880859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 13.0, 17.0, 12.0, 15.0, 24.0, 29.0, 26.0, 45.0, 41.0, 41.0, 52.0, 55.0, 54.0, 62.0, 52.0, 60.0, 52.0, 51.0, 49.0, 35.0, 40.0, 24.0, 24.0, 27.0, 13.0, 19.0, 13.0, 16.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1402587890625, -0.13572311401367188, -0.13118743896484375, -0.12665176391601562, -0.1221160888671875, -0.11758041381835938, -0.11304473876953125, -0.10850906372070312, -0.103973388671875, -0.09943771362304688, -0.09490203857421875, -0.09036636352539062, -0.0858306884765625, -0.08129501342773438, -0.07675933837890625, -0.07222366333007812, -0.06768798828125, -0.06315231323242188, -0.05861663818359375, -0.054080963134765625, -0.0495452880859375, -0.045009613037109375, -0.04047393798828125, -0.035938262939453125, -0.031402587890625, -0.026866912841796875, -0.02233123779296875, -0.017795562744140625, -0.0132598876953125, -0.008724212646484375, -0.00418853759765625, 0.000347137451171875, 0.0048828125, 0.009418487548828125, 0.01395416259765625, 0.018489837646484375, 0.0230255126953125, 0.027561187744140625, 0.03209686279296875, 0.036632537841796875, 0.041168212890625, 0.045703887939453125, 0.05023956298828125, 0.054775238037109375, 0.0593109130859375, 0.06384658813476562, 0.06838226318359375, 0.07291793823242188, 0.07745361328125, 0.08198928833007812, 0.08652496337890625, 0.09106063842773438, 0.0955963134765625, 0.10013198852539062, 0.10466766357421875, 0.10920333862304688, 0.113739013671875, 0.11827468872070312, 0.12281036376953125, 0.12734603881835938, 0.1318817138671875, 0.13641738891601562, 0.14095306396484375, 0.14548873901367188, 0.1500244140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 46.0, 46.0, 91.0, 182.0, 400.0, 1393.0, 8778.0, 374379.0, 649929.0, 10607.0, 1606.0, 519.0, 197.0, 93.0, 51.0, 34.0, 31.0, 21.0, 22.0, 16.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4764823913574219, -0.46248626708984375, -0.4484901428222656, -0.4344940185546875, -0.4204978942871094, -0.40650177001953125, -0.3925056457519531, -0.378509521484375, -0.3645133972167969, -0.35051727294921875, -0.3365211486816406, -0.3225250244140625, -0.3085289001464844, -0.29453277587890625, -0.2805366516113281, -0.26654052734375, -0.2525444030761719, -0.23854827880859375, -0.22455215454101562, -0.2105560302734375, -0.19655990600585938, -0.18256378173828125, -0.16856765747070312, -0.154571533203125, -0.14057540893554688, -0.12657928466796875, -0.11258316040039062, -0.0985870361328125, -0.08459091186523438, -0.07059478759765625, -0.056598663330078125, -0.0426025390625, -0.028606414794921875, -0.01461029052734375, -0.000614166259765625, 0.0133819580078125, 0.027378082275390625, 0.04137420654296875, 0.055370330810546875, 0.069366455078125, 0.08336257934570312, 0.09735870361328125, 0.11135482788085938, 0.1253509521484375, 0.13934707641601562, 0.15334320068359375, 0.16733932495117188, 0.18133544921875, 0.19533157348632812, 0.20932769775390625, 0.22332382202148438, 0.2373199462890625, 0.2513160705566406, 0.26531219482421875, 0.2793083190917969, 0.293304443359375, 0.3073005676269531, 0.32129669189453125, 0.3352928161621094, 0.3492889404296875, 0.3632850646972656, 0.37728118896484375, 0.3912773132324219, 0.4052734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 5.0, 18.0, 22.0, 28.0, 44.0, 62.0, 79.0, 100.0, 85.0, 100.0, 65.0, 90.0, 74.0, 56.0, 42.0, 25.0, 30.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.429983139038086e-05, -5.22444024682045e-05, -5.018897354602814e-05, -4.8133544623851776e-05, -4.6078115701675415e-05, -4.4022686779499054e-05, -4.196725785732269e-05, -3.991182893514633e-05, -3.785640001296997e-05, -3.580097109079361e-05, -3.374554216861725e-05, -3.169011324644089e-05, -2.9634684324264526e-05, -2.7579255402088165e-05, -2.5523826479911804e-05, -2.3468397557735443e-05, -2.1412968635559082e-05, -1.935753971338272e-05, -1.730211079120636e-05, -1.5246681869029999e-05, -1.3191252946853638e-05, -1.1135824024677277e-05, -9.080395102500916e-06, -7.0249661803245544e-06, -4.969537258148193e-06, -2.9141083359718323e-06, -8.586794137954712e-07, 1.1967495083808899e-06, 3.252178430557251e-06, 5.307607352733612e-06, 7.363036274909973e-06, 9.418465197086334e-06, 1.1473894119262695e-05, 1.3529323041439056e-05, 1.5584751963615417e-05, 1.764018088579178e-05, 1.969560980796814e-05, 2.17510387301445e-05, 2.3806467652320862e-05, 2.5861896574497223e-05, 2.7917325496673584e-05, 2.9972754418849945e-05, 3.2028183341026306e-05, 3.408361226320267e-05, 3.613904118537903e-05, 3.819447010755539e-05, 4.024989902973175e-05, 4.230532795190811e-05, 4.436075687408447e-05, 4.6416185796260834e-05, 4.8471614718437195e-05, 5.0527043640613556e-05, 5.258247256278992e-05, 5.463790148496628e-05, 5.669333040714264e-05, 5.8748759329319e-05, 6.080418825149536e-05, 6.285961717367172e-05, 6.491504609584808e-05, 6.697047501802444e-05, 6.90259039402008e-05, 7.108133286237717e-05, 7.313676178455353e-05, 7.519219070672989e-05, 7.724761962890625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 18.0, 11.0, 23.0, 33.0, 49.0, 50.0, 86.0, 132.0, 217.0, 460.0, 871.0, 1874.0, 5280.0, 27694.0, 739424.0, 250553.0, 15071.0, 3631.0, 1421.0, 652.0, 339.0, 216.0, 133.0, 84.0, 45.0, 47.0, 28.0, 19.0, 21.0, 13.0, 7.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20402145385742188, -0.19612884521484375, -0.18823623657226562, -0.1803436279296875, -0.17245101928710938, -0.16455841064453125, -0.15666580200195312, -0.148773193359375, -0.14088058471679688, -0.13298797607421875, -0.12509536743164062, -0.1172027587890625, -0.10931015014648438, -0.10141754150390625, -0.09352493286132812, -0.08563232421875, -0.07773971557617188, -0.06984710693359375, -0.061954498291015625, -0.0540618896484375, -0.046169281005859375, -0.03827667236328125, -0.030384063720703125, -0.022491455078125, -0.014598846435546875, -0.00670623779296875, 0.001186370849609375, 0.0090789794921875, 0.016971588134765625, 0.02486419677734375, 0.032756805419921875, 0.0406494140625, 0.048542022705078125, 0.05643463134765625, 0.06432723999023438, 0.0722198486328125, 0.08011245727539062, 0.08800506591796875, 0.09589767456054688, 0.103790283203125, 0.11168289184570312, 0.11957550048828125, 0.12746810913085938, 0.1353607177734375, 0.14325332641601562, 0.15114593505859375, 0.15903854370117188, 0.16693115234375, 0.17482376098632812, 0.18271636962890625, 0.19060897827148438, 0.1985015869140625, 0.20639419555664062, 0.21428680419921875, 0.22217941284179688, 0.230072021484375, 0.23796463012695312, 0.24585723876953125, 0.2537498474121094, 0.2616424560546875, 0.2695350646972656, 0.27742767333984375, 0.2853202819824219, 0.293212890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 9.0, 37.0, 38.0, 84.0, 121.0, 208.0, 205.0, 112.0, 63.0, 30.0, 19.0, 12.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2017822265625, -0.19672775268554688, -0.19167327880859375, -0.18661880493164062, -0.1815643310546875, -0.17650985717773438, -0.17145538330078125, -0.16640090942382812, -0.161346435546875, -0.15629196166992188, -0.15123748779296875, -0.14618301391601562, -0.1411285400390625, -0.13607406616210938, -0.13101959228515625, -0.12596511840820312, -0.12091064453125, -0.11585617065429688, -0.11080169677734375, -0.10574722290039062, -0.1006927490234375, -0.09563827514648438, -0.09058380126953125, -0.08552932739257812, -0.080474853515625, -0.07542037963867188, -0.07036590576171875, -0.06531143188476562, -0.0602569580078125, -0.055202484130859375, -0.05014801025390625, -0.045093536376953125, -0.0400390625, -0.034984588623046875, -0.02993011474609375, -0.024875640869140625, -0.0198211669921875, -0.014766693115234375, -0.00971221923828125, -0.004657745361328125, 0.000396728515625, 0.005451202392578125, 0.01050567626953125, 0.015560150146484375, 0.0206146240234375, 0.025669097900390625, 0.03072357177734375, 0.035778045654296875, 0.04083251953125, 0.045886993408203125, 0.05094146728515625, 0.055995941162109375, 0.0610504150390625, 0.06610488891601562, 0.07115936279296875, 0.07621383666992188, 0.081268310546875, 0.08632278442382812, 0.09137725830078125, 0.09643173217773438, 0.1014862060546875, 0.10654067993164062, 0.11159515380859375, 0.11664962768554688, 0.1217041015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 9.0, 20.0, 26.0, 55.0, 86.0, 144.0, 191.0, 166.0, 151.0, 69.0, 40.0, 22.0, 14.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904351830482483, -1.8404170274734497, -1.776482343673706, -1.7125475406646729, -1.6486128568649292, -1.584678053855896, -1.5207433700561523, -1.4568085670471191, -1.392873764038086, -1.3289389610290527, -1.265004277229309, -1.2010694742202759, -1.1371347904205322, -1.073199987411499, -1.0092651844024658, -0.9453305006027222, -0.8813958168029785, -0.8174610733985901, -0.7535263299942017, -0.6895915269851685, -0.6256568431854248, -0.5617220401763916, -0.4977872967720032, -0.43385255336761475, -0.3699178099632263, -0.3059830665588379, -0.24204830825328827, -0.17811354994773865, -0.11417880654335022, -0.05024406313896179, 0.013690710067749023, 0.07762545347213745, 0.14156031608581543, 0.20549505949020386, 0.2694298028945923, 0.3333645761013031, 0.39729931950569153, 0.46123406291007996, 0.5251688361167908, 0.5891035795211792, 0.6530383229255676, 0.716973066329956, 0.7809078097343445, 0.8448425531387329, 0.9087773561477661, 0.9727120399475098, 1.036646842956543, 1.1005816459655762, 1.1645163297653198, 1.228451132774353, 1.2923858165740967, 1.3563206195831299, 1.4202553033828735, 1.4841901063919067, 1.5481247901916504, 1.6120595932006836, 1.6759943962097168, 1.73992919921875, 1.8038638830184937, 1.8677986860275269, 1.9317333698272705, 1.9956681728363037, 2.059602975845337, 2.123537540435791, 2.187472343444824]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 1.0, 11.0, 8.0, 15.0, 12.0, 14.0, 23.0, 18.0, 26.0, 32.0, 40.0, 43.0, 48.0, 46.0, 55.0, 51.0, 76.0, 58.0, 55.0, 46.0, 37.0, 46.0, 32.0, 34.0, 34.0, 29.0, 18.0, 22.0, 16.0, 17.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.694084107875824, -0.6658458113670349, -0.6376074552536011, -0.609369158744812, -0.581130862236023, -0.5528925061225891, -0.5246542096138, -0.4964158833026886, -0.46817755699157715, -0.4399392306804657, -0.41170090436935425, -0.3834626078605652, -0.35522428154945374, -0.3269859552383423, -0.2987476587295532, -0.2705093324184418, -0.24227100610733032, -0.21403267979621887, -0.18579436838626862, -0.15755605697631836, -0.1293177306652069, -0.10107940435409546, -0.0728410929441452, -0.044602781534194946, -0.016364455223083496, 0.011873863637447357, 0.04011218249797821, 0.06835050135850906, 0.09658882021903992, 0.12482714653015137, 0.15306545794010162, 0.18130376935005188, 0.20954203605651855, 0.23778036236763, 0.26601868867874146, 0.2942569851875305, 0.32249531149864197, 0.3507336378097534, 0.3789719343185425, 0.40721026062965393, 0.4354485869407654, 0.46368691325187683, 0.4919252395629883, 0.5201635360717773, 0.5484018325805664, 0.5766401886940002, 0.6048784852027893, 0.6331168413162231, 0.6613551378250122, 0.6895934343338013, 0.7178317904472351, 0.7460700869560242, 0.774308443069458, 0.8025467395782471, 0.8307850360870361, 0.8590233325958252, 0.887261688709259, 0.9154999852180481, 0.9437383413314819, 0.971976637840271, 1.00021493434906, 1.0284533500671387, 1.0566916465759277, 1.0849299430847168, 1.1131682395935059]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 15.0, 26.0, 42.0, 47.0, 80.0, 114.0, 209.0, 342.0, 544.0, 959.0, 1677.0, 3120.0, 6173.0, 13961.0, 34089.0, 101128.0, 525630.0, 3132314.0, 259427.0, 67353.0, 24888.0, 10825.0, 5152.0, 2608.0, 1434.0, 826.0, 487.0, 285.0, 162.0, 121.0, 68.0, 64.0, 33.0, 19.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11365509033203125, -0.1102447509765625, -0.10683441162109375, -0.103424072265625, -0.10001373291015625, -0.0966033935546875, -0.09319305419921875, -0.08978271484375, -0.08637237548828125, -0.0829620361328125, -0.07955169677734375, -0.076141357421875, -0.07273101806640625, -0.0693206787109375, -0.06591033935546875, -0.0625, -0.05908966064453125, -0.0556793212890625, -0.05226898193359375, -0.048858642578125, -0.04544830322265625, -0.0420379638671875, -0.03862762451171875, -0.03521728515625, -0.03180694580078125, -0.0283966064453125, -0.02498626708984375, -0.021575927734375, -0.01816558837890625, -0.0147552490234375, -0.01134490966796875, -0.0079345703125, -0.00452423095703125, -0.0011138916015625, 0.00229644775390625, 0.005706787109375, 0.00911712646484375, 0.0125274658203125, 0.01593780517578125, 0.01934814453125, 0.02275848388671875, 0.0261688232421875, 0.02957916259765625, 0.032989501953125, 0.03639984130859375, 0.0398101806640625, 0.04322052001953125, 0.046630859375, 0.05004119873046875, 0.0534515380859375, 0.05686187744140625, 0.060272216796875, 0.06368255615234375, 0.0670928955078125, 0.07050323486328125, 0.07391357421875, 0.07732391357421875, 0.0807342529296875, 0.08414459228515625, 0.087554931640625, 0.09096527099609375, 0.0943756103515625, 0.09778594970703125, 0.1011962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 11.0, 13.0, 18.0, 30.0, 29.0, 33.0, 39.0, 44.0, 58.0, 42.0, 71.0, 61.0, 49.0, 56.0, 59.0, 67.0, 53.0, 47.0, 46.0, 41.0, 30.0, 23.0, 14.0, 9.0, 5.0, 11.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.02801823616027832, -0.02699899673461914, -0.02597975730895996, -0.02496051788330078, -0.0239412784576416, -0.022922039031982422, -0.021902799606323242, -0.020883560180664062, -0.019864320755004883, -0.018845081329345703, -0.017825841903686523, -0.016806602478027344, -0.015787363052368164, -0.014768123626708984, -0.013748884201049805, -0.012729644775390625, -0.011710405349731445, -0.010691165924072266, -0.009671926498413086, -0.008652687072753906, -0.0076334476470947266, -0.006614208221435547, -0.005594968795776367, -0.0045757293701171875, -0.003556489944458008, -0.002537250518798828, -0.0015180110931396484, -0.0004987716674804688, 0.0005204677581787109, 0.0015397071838378906, 0.0025589466094970703, 0.00357818603515625, 0.00459742546081543, 0.005616664886474609, 0.006635904312133789, 0.007655143737792969, 0.008674383163452148, 0.009693622589111328, 0.010712862014770508, 0.011732101440429688, 0.012751340866088867, 0.013770580291748047, 0.014789819717407227, 0.015809059143066406, 0.016828298568725586, 0.017847537994384766, 0.018866777420043945, 0.019886016845703125, 0.020905256271362305, 0.021924495697021484, 0.022943735122680664, 0.023962974548339844, 0.024982213973999023, 0.026001453399658203, 0.027020692825317383, 0.028039932250976562, 0.029059171676635742, 0.030078411102294922, 0.0310976505279541, 0.03211688995361328, 0.03313612937927246, 0.03415536880493164, 0.03517460823059082, 0.03619384765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 11.0, 19.0, 19.0, 40.0, 65.0, 55.0, 122.0, 144.0, 253.0, 465.0, 728.0, 1412.0, 3045.0, 7997.0, 25504.0, 107731.0, 893390.0, 2896106.0, 196583.0, 40754.0, 11754.0, 4207.0, 1787.0, 855.0, 463.0, 277.0, 157.0, 97.0, 69.0, 56.0, 29.0, 23.0, 13.0, 4.0, 11.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12170791625976562, -0.11621856689453125, -0.11072921752929688, -0.1052398681640625, -0.09975051879882812, -0.09426116943359375, -0.08877182006835938, -0.083282470703125, -0.07779312133789062, -0.07230377197265625, -0.06681442260742188, -0.0613250732421875, -0.055835723876953125, -0.05034637451171875, -0.044857025146484375, -0.03936767578125, -0.033878326416015625, -0.02838897705078125, -0.022899627685546875, -0.0174102783203125, -0.011920928955078125, -0.00643157958984375, -0.000942230224609375, 0.004547119140625, 0.010036468505859375, 0.01552581787109375, 0.021015167236328125, 0.0265045166015625, 0.031993865966796875, 0.03748321533203125, 0.042972564697265625, 0.0484619140625, 0.053951263427734375, 0.05944061279296875, 0.06492996215820312, 0.0704193115234375, 0.07590866088867188, 0.08139801025390625, 0.08688735961914062, 0.092376708984375, 0.09786605834960938, 0.10335540771484375, 0.10884475708007812, 0.1143341064453125, 0.11982345581054688, 0.12531280517578125, 0.13080215454101562, 0.13629150390625, 0.14178085327148438, 0.14727020263671875, 0.15275955200195312, 0.1582489013671875, 0.16373825073242188, 0.16922760009765625, 0.17471694946289062, 0.180206298828125, 0.18569564819335938, 0.19118499755859375, 0.19667434692382812, 0.2021636962890625, 0.20765304565429688, 0.21314239501953125, 0.21863174438476562, 0.22412109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 27.0, 38.0, 44.0, 80.0, 115.0, 209.0, 446.0, 1300.0, 931.0, 329.0, 211.0, 117.0, 55.0, 44.0, 30.0, 19.0, 20.0, 10.0, 3.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.123565673828125, -0.12054443359375, -0.117523193359375, -0.114501953125, -0.111480712890625, -0.10845947265625, -0.105438232421875, -0.1024169921875, -0.099395751953125, -0.09637451171875, -0.093353271484375, -0.09033203125, -0.087310791015625, -0.08428955078125, -0.081268310546875, -0.0782470703125, -0.075225830078125, -0.07220458984375, -0.069183349609375, -0.066162109375, -0.063140869140625, -0.06011962890625, -0.057098388671875, -0.0540771484375, -0.051055908203125, -0.04803466796875, -0.045013427734375, -0.0419921875, -0.038970947265625, -0.03594970703125, -0.032928466796875, -0.0299072265625, -0.026885986328125, -0.02386474609375, -0.020843505859375, -0.017822265625, -0.014801025390625, -0.01177978515625, -0.008758544921875, -0.0057373046875, -0.002716064453125, 0.00030517578125, 0.003326416015625, 0.00634765625, 0.009368896484375, 0.01239013671875, 0.015411376953125, 0.0184326171875, 0.021453857421875, 0.02447509765625, 0.027496337890625, 0.030517578125, 0.033538818359375, 0.03656005859375, 0.039581298828125, 0.0426025390625, 0.045623779296875, 0.04864501953125, 0.051666259765625, 0.0546875, 0.057708740234375, 0.06072998046875, 0.063751220703125, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 36.0, 88.0, 114.0, 182.0, 180.0, 167.0, 100.0, 74.0, 24.0, 11.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478748679161072, -0.5223398208618164, -0.49680474400520325, -0.4712696671485901, -0.4457346200942993, -0.42019957304000854, -0.3946644961833954, -0.3691294193267822, -0.34359437227249146, -0.3180593252182007, -0.2925242483615875, -0.26698917150497437, -0.2414541244506836, -0.21591906249523163, -0.19038400053977966, -0.1648489385843277, -0.13931387662887573, -0.11377881467342377, -0.0882437527179718, -0.06270869076251984, -0.03717362880706787, -0.011638566851615906, 0.01389649510383606, 0.039431557059288025, 0.06496661901473999, 0.09050168097019196, 0.11603674292564392, 0.1415718048810959, 0.16710686683654785, 0.19264192879199982, 0.21817699074745178, 0.24371205270290375, 0.2692471742630005, 0.29478222131729126, 0.3203172981739044, 0.3458523750305176, 0.37138742208480835, 0.3969224691390991, 0.4224575459957123, 0.44799262285232544, 0.4735276699066162, 0.499062716960907, 0.5245977640151978, 0.5501328706741333, 0.5756679177284241, 0.6012029647827148, 0.6267380714416504, 0.6522731184959412, 0.6778081655502319, 0.7033432126045227, 0.7288782596588135, 0.754413366317749, 0.7799484133720398, 0.8054834604263306, 0.8310185670852661, 0.8565536141395569, 0.8820886611938477, 0.9076237082481384, 0.9331587553024292, 0.9586938619613647, 0.9842289090156555, 1.0097639560699463, 1.0352990627288818, 1.0608340501785278, 1.0863691568374634]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 6.0, 13.0, 16.0, 17.0, 17.0, 25.0, 32.0, 38.0, 30.0, 36.0, 45.0, 53.0, 49.0, 57.0, 43.0, 54.0, 48.0, 60.0, 54.0, 34.0, 44.0, 42.0, 32.0, 28.0, 19.0, 16.0, 23.0, 9.0, 12.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29751962423324585, -0.28751102089881897, -0.2775024473667145, -0.2674938440322876, -0.2574852705001831, -0.24747666716575623, -0.23746807873249054, -0.22745949029922485, -0.21745088696479797, -0.2074422985315323, -0.1974337100982666, -0.18742510676383972, -0.17741651833057404, -0.16740792989730835, -0.15739934146404266, -0.14739075303077698, -0.1373821645975113, -0.1273735761642456, -0.11736498028039932, -0.10735639184713364, -0.09734779596328735, -0.08733920753002167, -0.07733061909675598, -0.0673220232129097, -0.05731343477964401, -0.04730484262108803, -0.03729625046253204, -0.027287662029266357, -0.017279069870710373, -0.007270477712154388, 0.0027381107211112976, 0.01274670660495758, 0.022755295038223267, 0.03276388719677925, 0.042772479355335236, 0.05278106778860092, 0.0627896636724472, 0.07279825210571289, 0.08280684053897858, 0.09281543642282486, 0.10282402485609055, 0.11283261328935623, 0.12284120917320251, 0.1328497976064682, 0.1428583860397339, 0.15286698937416077, 0.16287556290626526, 0.17288416624069214, 0.18289275467395782, 0.1929013431072235, 0.2029099315404892, 0.21291851997375488, 0.22292712330818176, 0.23293571174144745, 0.24294430017471313, 0.25295290350914, 0.2629614770412445, 0.2729700803756714, 0.2829786539077759, 0.29298725724220276, 0.30299583077430725, 0.31300443410873413, 0.3230130076408386, 0.3330216109752655, 0.3430302143096924]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 15.0, 14.0, 16.0, 35.0, 57.0, 77.0, 125.0, 232.0, 392.0, 633.0, 1131.0, 2213.0, 4325.0, 8629.0, 18492.0, 39487.0, 91106.0, 454644.0, 292754.0, 71002.0, 32700.0, 15295.0, 7212.0, 3590.0, 1873.0, 1048.0, 544.0, 325.0, 224.0, 105.0, 98.0, 59.0, 35.0, 19.0, 15.0, 11.0, 5.0, 6.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12711524963378906, -0.12312698364257812, -0.11913871765136719, -0.11515045166015625, -0.11116218566894531, -0.10717391967773438, -0.10318565368652344, -0.0991973876953125, -0.09520912170410156, -0.09122085571289062, -0.08723258972167969, -0.08324432373046875, -0.07925605773925781, -0.07526779174804688, -0.07127952575683594, -0.067291259765625, -0.06330299377441406, -0.059314727783203125, -0.05532646179199219, -0.05133819580078125, -0.04734992980957031, -0.043361663818359375, -0.03937339782714844, -0.0353851318359375, -0.03139686584472656, -0.027408599853515625, -0.023420333862304688, -0.01943206787109375, -0.015443801879882812, -0.011455535888671875, -0.0074672698974609375, -0.00347900390625, 0.0005092620849609375, 0.004497528076171875, 0.008485794067382812, 0.01247406005859375, 0.016462326049804688, 0.020450592041015625, 0.024438858032226562, 0.0284271240234375, 0.03241539001464844, 0.036403656005859375, 0.04039192199707031, 0.04438018798828125, 0.04836845397949219, 0.052356719970703125, 0.05634498596191406, 0.060333251953125, 0.06432151794433594, 0.06830978393554688, 0.07229804992675781, 0.07628631591796875, 0.08027458190917969, 0.08426284790039062, 0.08825111389160156, 0.0922393798828125, 0.09622764587402344, 0.10021591186523438, 0.10420417785644531, 0.10819244384765625, 0.11218070983886719, 0.11616897583007812, 0.12015724182128906, 0.1241455078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 10.0, 15.0, 18.0, 15.0, 30.0, 30.0, 28.0, 27.0, 35.0, 33.0, 46.0, 35.0, 47.0, 34.0, 48.0, 39.0, 44.0, 38.0, 54.0, 40.0, 42.0, 33.0, 31.0, 32.0, 29.0, 24.0, 15.0, 14.0, 15.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02496337890625, -0.024183273315429688, -0.023403167724609375, -0.022623062133789062, -0.02184295654296875, -0.021062850952148438, -0.020282745361328125, -0.019502639770507812, -0.0187225341796875, -0.017942428588867188, -0.017162322998046875, -0.016382217407226562, -0.01560211181640625, -0.014822006225585938, -0.014041900634765625, -0.013261795043945312, -0.012481689453125, -0.011701583862304688, -0.010921478271484375, -0.010141372680664062, -0.00936126708984375, -0.008581161499023438, -0.007801055908203125, -0.0070209503173828125, -0.0062408447265625, -0.0054607391357421875, -0.004680633544921875, -0.0039005279541015625, -0.00312042236328125, -0.0023403167724609375, -0.001560211181640625, -0.0007801055908203125, 0.0, 0.0007801055908203125, 0.001560211181640625, 0.0023403167724609375, 0.00312042236328125, 0.0039005279541015625, 0.004680633544921875, 0.0054607391357421875, 0.0062408447265625, 0.0070209503173828125, 0.007801055908203125, 0.008581161499023438, 0.00936126708984375, 0.010141372680664062, 0.010921478271484375, 0.011701583862304688, 0.012481689453125, 0.013261795043945312, 0.014041900634765625, 0.014822006225585938, 0.01560211181640625, 0.016382217407226562, 0.017162322998046875, 0.017942428588867188, 0.0187225341796875, 0.019502639770507812, 0.020282745361328125, 0.021062850952148438, 0.02184295654296875, 0.022623062133789062, 0.023403167724609375, 0.024183273315429688, 0.02496337890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 13.0, 23.0, 19.0, 31.0, 39.0, 56.0, 58.0, 73.0, 89.0, 146.0, 217.0, 280.0, 367.0, 633.0, 1118.0, 1925.0, 4037.0, 10661.0, 31264.0, 93729.0, 638720.0, 185822.0, 49795.0, 16896.0, 6171.0, 2583.0, 1301.0, 742.0, 431.0, 328.0, 234.0, 170.0, 142.0, 95.0, 74.0, 56.0, 47.0, 36.0, 23.0, 21.0, 21.0, 4.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.156982421875, -0.15218353271484375, -0.1473846435546875, -0.14258575439453125, -0.137786865234375, -0.13298797607421875, -0.1281890869140625, -0.12339019775390625, -0.11859130859375, -0.11379241943359375, -0.1089935302734375, -0.10419464111328125, -0.099395751953125, -0.09459686279296875, -0.0897979736328125, -0.08499908447265625, -0.0802001953125, -0.07540130615234375, -0.0706024169921875, -0.06580352783203125, -0.061004638671875, -0.05620574951171875, -0.0514068603515625, -0.04660797119140625, -0.04180908203125, -0.03701019287109375, -0.0322113037109375, -0.02741241455078125, -0.022613525390625, -0.01781463623046875, -0.0130157470703125, -0.00821685791015625, -0.00341796875, 0.00138092041015625, 0.0061798095703125, 0.01097869873046875, 0.015777587890625, 0.02057647705078125, 0.0253753662109375, 0.03017425537109375, 0.03497314453125, 0.03977203369140625, 0.0445709228515625, 0.04936981201171875, 0.054168701171875, 0.05896759033203125, 0.0637664794921875, 0.06856536865234375, 0.0733642578125, 0.07816314697265625, 0.0829620361328125, 0.08776092529296875, 0.092559814453125, 0.09735870361328125, 0.1021575927734375, 0.10695648193359375, 0.11175537109375, 0.11655426025390625, 0.1213531494140625, 0.12615203857421875, 0.130950927734375, 0.13574981689453125, 0.1405487060546875, 0.14534759521484375, 0.150146484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 19.0, 10.0, 21.0, 28.0, 46.0, 54.0, 55.0, 47.0, 59.0, 58.0, 60.0, 61.0, 52.0, 57.0, 62.0, 58.0, 45.0, 37.0, 28.0, 27.0, 18.0, 15.0, 15.0, 10.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.1627788543701172, -0.15771102905273438, -0.15264320373535156, -0.14757537841796875, -0.14250755310058594, -0.13743972778320312, -0.1323719024658203, -0.1273040771484375, -0.12223625183105469, -0.11716842651367188, -0.11210060119628906, -0.10703277587890625, -0.10196495056152344, -0.09689712524414062, -0.09182929992675781, -0.086761474609375, -0.08169364929199219, -0.07662582397460938, -0.07155799865722656, -0.06649017333984375, -0.06142234802246094, -0.056354522705078125, -0.05128669738769531, -0.0462188720703125, -0.04115104675292969, -0.036083221435546875, -0.031015396118164062, -0.02594757080078125, -0.020879745483398438, -0.015811920166015625, -0.010744094848632812, -0.00567626953125, -0.0006084442138671875, 0.004459381103515625, 0.009527206420898438, 0.01459503173828125, 0.019662857055664062, 0.024730682373046875, 0.029798507690429688, 0.0348663330078125, 0.03993415832519531, 0.045001983642578125, 0.05006980895996094, 0.05513763427734375, 0.06020545959472656, 0.06527328491210938, 0.07034111022949219, 0.075408935546875, 0.08047676086425781, 0.08554458618164062, 0.09061241149902344, 0.09568023681640625, 0.10074806213378906, 0.10581588745117188, 0.11088371276855469, 0.1159515380859375, 0.12101936340332031, 0.12608718872070312, 0.13115501403808594, 0.13622283935546875, 0.14129066467285156, 0.14635848999023438, 0.1514263153076172, 0.156494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 11.0, 10.0, 16.0, 18.0, 26.0, 53.0, 94.0, 189.0, 522.0, 2598.0, 29158.0, 941765.0, 68602.0, 4183.0, 723.0, 261.0, 127.0, 65.0, 49.0, 28.0, 23.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.394134521484375, -0.38275146484375, -0.371368408203125, -0.3599853515625, -0.348602294921875, -0.33721923828125, -0.325836181640625, -0.314453125, -0.303070068359375, -0.29168701171875, -0.280303955078125, -0.2689208984375, -0.257537841796875, -0.24615478515625, -0.234771728515625, -0.223388671875, -0.212005615234375, -0.20062255859375, -0.189239501953125, -0.1778564453125, -0.166473388671875, -0.15509033203125, -0.143707275390625, -0.13232421875, -0.120941162109375, -0.10955810546875, -0.098175048828125, -0.0867919921875, -0.075408935546875, -0.06402587890625, -0.052642822265625, -0.041259765625, -0.029876708984375, -0.01849365234375, -0.007110595703125, 0.0042724609375, 0.015655517578125, 0.02703857421875, 0.038421630859375, 0.0498046875, 0.061187744140625, 0.07257080078125, 0.083953857421875, 0.0953369140625, 0.106719970703125, 0.11810302734375, 0.129486083984375, 0.140869140625, 0.152252197265625, 0.16363525390625, 0.175018310546875, 0.1864013671875, 0.197784423828125, 0.20916748046875, 0.220550537109375, 0.23193359375, 0.243316650390625, 0.25469970703125, 0.266082763671875, 0.2774658203125, 0.288848876953125, 0.30023193359375, 0.311614990234375, 0.322998046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 10.0, 20.0, 31.0, 41.0, 78.0, 129.0, 138.0, 150.0, 142.0, 87.0, 61.0, 31.0, 25.0, 18.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.6224875152111053e-05, -5.3143128752708435e-05, -5.006138235330582e-05, -4.69796359539032e-05, -4.389788955450058e-05, -4.081614315509796e-05, -3.773439675569534e-05, -3.4652650356292725e-05, -3.1570903956890106e-05, -2.8489157557487488e-05, -2.540741115808487e-05, -2.232566475868225e-05, -1.9243918359279633e-05, -1.6162171959877014e-05, -1.3080425560474396e-05, -9.998679161071777e-06, -6.916932761669159e-06, -3.8351863622665405e-06, -7.534399628639221e-07, 2.3283064365386963e-06, 5.410052835941315e-06, 8.491799235343933e-06, 1.1573545634746552e-05, 1.465529203414917e-05, 1.773703843355179e-05, 2.0818784832954407e-05, 2.3900531232357025e-05, 2.6982277631759644e-05, 3.0064024031162262e-05, 3.314577043056488e-05, 3.62275168299675e-05, 3.930926322937012e-05, 4.2391009628772736e-05, 4.5472756028175354e-05, 4.855450242757797e-05, 5.163624882698059e-05, 5.471799522638321e-05, 5.779974162578583e-05, 6.0881488025188446e-05, 6.396323442459106e-05, 6.704498082399368e-05, 7.01267272233963e-05, 7.320847362279892e-05, 7.629022002220154e-05, 7.937196642160416e-05, 8.245371282100677e-05, 8.55354592204094e-05, 8.861720561981201e-05, 9.169895201921463e-05, 9.478069841861725e-05, 9.786244481801987e-05, 0.00010094419121742249, 0.0001040259376168251, 0.00010710768401622772, 0.00011018943041563034, 0.00011327117681503296, 0.00011635292321443558, 0.0001194346696138382, 0.00012251641601324081, 0.00012559816241264343, 0.00012867990881204605, 0.00013176165521144867, 0.0001348434016108513, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 15.0, 20.0, 22.0, 50.0, 62.0, 115.0, 191.0, 328.0, 757.0, 2540.0, 12395.0, 184138.0, 816426.0, 25448.0, 3885.0, 1081.0, 431.0, 238.0, 143.0, 88.0, 58.0, 39.0, 30.0, 10.0, 10.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.23595809936523438, -0.22838592529296875, -0.22081375122070312, -0.2132415771484375, -0.20566940307617188, -0.19809722900390625, -0.19052505493164062, -0.182952880859375, -0.17538070678710938, -0.16780853271484375, -0.16023635864257812, -0.1526641845703125, -0.14509201049804688, -0.13751983642578125, -0.12994766235351562, -0.12237548828125, -0.11480331420898438, -0.10723114013671875, -0.09965896606445312, -0.0920867919921875, -0.08451461791992188, -0.07694244384765625, -0.06937026977539062, -0.061798095703125, -0.054225921630859375, -0.04665374755859375, -0.039081573486328125, -0.0315093994140625, -0.023937225341796875, -0.01636505126953125, -0.008792877197265625, -0.001220703125, 0.006351470947265625, 0.01392364501953125, 0.021495819091796875, 0.0290679931640625, 0.036640167236328125, 0.04421234130859375, 0.051784515380859375, 0.059356689453125, 0.06692886352539062, 0.07450103759765625, 0.08207321166992188, 0.0896453857421875, 0.09721755981445312, 0.10478973388671875, 0.11236190795898438, 0.11993408203125, 0.12750625610351562, 0.13507843017578125, 0.14265060424804688, 0.1502227783203125, 0.15779495239257812, 0.16536712646484375, 0.17293930053710938, 0.180511474609375, 0.18808364868164062, 0.19565582275390625, 0.20322799682617188, 0.2108001708984375, 0.21837234497070312, 0.22594451904296875, 0.23351669311523438, 0.2410888671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 12.0, 12.0, 20.0, 19.0, 25.0, 43.0, 68.0, 163.0, 276.0, 162.0, 60.0, 24.0, 31.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.125762939453125, -0.12200927734375, -0.118255615234375, -0.114501953125, -0.110748291015625, -0.10699462890625, -0.103240966796875, -0.0994873046875, -0.095733642578125, -0.09197998046875, -0.088226318359375, -0.08447265625, -0.080718994140625, -0.07696533203125, -0.073211669921875, -0.0694580078125, -0.065704345703125, -0.06195068359375, -0.058197021484375, -0.054443359375, -0.050689697265625, -0.04693603515625, -0.043182373046875, -0.0394287109375, -0.035675048828125, -0.03192138671875, -0.028167724609375, -0.0244140625, -0.020660400390625, -0.01690673828125, -0.013153076171875, -0.0093994140625, -0.005645751953125, -0.00189208984375, 0.001861572265625, 0.005615234375, 0.009368896484375, 0.01312255859375, 0.016876220703125, 0.0206298828125, 0.024383544921875, 0.02813720703125, 0.031890869140625, 0.03564453125, 0.039398193359375, 0.04315185546875, 0.046905517578125, 0.0506591796875, 0.054412841796875, 0.05816650390625, 0.061920166015625, 0.065673828125, 0.069427490234375, 0.07318115234375, 0.076934814453125, 0.0806884765625, 0.084442138671875, 0.08819580078125, 0.091949462890625, 0.095703125, 0.099456787109375, 0.10321044921875, 0.106964111328125, 0.1107177734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 21.0, 50.0, 123.0, 220.0, 256.0, 199.0, 85.0, 29.0, 13.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1755073070526123, -1.0989019870758057, -1.022296667098999, -0.9456912279129028, -0.8690859079360962, -0.7924805879592896, -0.7158752083778381, -0.6392698287963867, -0.5626645088195801, -0.48605915904045105, -0.409453809261322, -0.332848459482193, -0.25624310970306396, -0.17963775992393494, -0.10303241014480591, -0.026427030563354492, 0.05017828941345215, 0.12678363919258118, 0.2033889889717102, 0.27999433875083923, 0.35659968852996826, 0.4332050383090973, 0.5098103880882263, 0.5864157676696777, 0.6630210876464844, 0.739626407623291, 0.8162317872047424, 0.8928371667861938, 0.9694424867630005, 1.0460478067398071, 1.1226532459259033, 1.19925856590271, 1.2758641242980957, 1.3524694442749023, 1.429074764251709, 1.5056802034378052, 1.5822855234146118, 1.6588908433914185, 1.7354962825775146, 1.8121016025543213, 1.888706922531128, 1.9653122425079346, 2.041917562484741, 2.118522882461548, 2.1951284408569336, 2.2717337608337402, 2.348339080810547, 2.4249444007873535, 2.50154972076416, 2.578155040740967, 2.6547603607177734, 2.73136568069458, 2.8079710006713867, 2.8845765590667725, 2.961181879043579, 3.0377871990203857, 3.1143925189971924, 3.190997838973999, 3.2676031589508057, 3.3442084789276123, 3.420814037322998, 3.4974193572998047, 3.5740246772766113, 3.650629997253418, 3.7272353172302246]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 20.0, 14.0, 16.0, 24.0, 30.0, 23.0, 32.0, 25.0, 36.0, 45.0, 43.0, 44.0, 60.0, 52.0, 55.0, 45.0, 42.0, 56.0, 46.0, 41.0, 24.0, 26.0, 27.0, 20.0, 22.0, 25.0, 9.0, 15.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8387554287910461, -0.8171766996383667, -0.7955979108810425, -0.774019181728363, -0.7524404525756836, -0.7308617234230042, -0.7092829942703247, -0.6877042055130005, -0.666125476360321, -0.6445467472076416, -0.6229679584503174, -0.6013892292976379, -0.5798105001449585, -0.558231770992279, -0.5366530418395996, -0.5150742530822754, -0.49349552392959595, -0.4719167947769165, -0.4503380358219147, -0.42875927686691284, -0.4071805477142334, -0.38560181856155396, -0.3640230596065521, -0.3424443006515503, -0.32086557149887085, -0.2992868423461914, -0.2777080833911896, -0.25612932443618774, -0.2345505952835083, -0.21297185122966766, -0.19139310717582703, -0.1698143631219864, -0.14823567867279053, -0.1266569346189499, -0.10507819056510925, -0.08349944651126862, -0.06192070245742798, -0.04034195840358734, -0.018763214349746704, 0.002815529704093933, 0.02439427375793457, 0.04597301781177521, 0.06755176186561584, 0.08913050591945648, 0.11070924997329712, 0.13228799402713776, 0.1538667380809784, 0.17544548213481903, 0.19702422618865967, 0.2186029702425003, 0.24018171429634094, 0.2617604732513428, 0.2833392024040222, 0.30491793155670166, 0.3264966905117035, 0.3480754494667053, 0.36965417861938477, 0.3912329077720642, 0.41281166672706604, 0.43439042568206787, 0.4559691548347473, 0.47754788398742676, 0.4991266429424286, 0.5207054018974304, 0.5422841310501099]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 26.0, 31.0, 54.0, 100.0, 142.0, 228.0, 389.0, 709.0, 1166.0, 2143.0, 4281.0, 8755.0, 19781.0, 51008.0, 173474.0, 3005724.0, 746496.0, 112258.0, 37534.0, 15310.0, 6829.0, 3472.0, 1798.0, 980.0, 613.0, 348.0, 220.0, 137.0, 74.0, 63.0, 27.0, 21.0, 18.0, 16.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.1324300765991211, -0.1286296844482422, -0.12482929229736328, -0.12102890014648438, -0.11722850799560547, -0.11342811584472656, -0.10962772369384766, -0.10582733154296875, -0.10202693939208984, -0.09822654724121094, -0.09442615509033203, -0.09062576293945312, -0.08682537078857422, -0.08302497863769531, -0.0792245864868164, -0.0754241943359375, -0.0716238021850586, -0.06782341003417969, -0.06402301788330078, -0.060222625732421875, -0.05642223358154297, -0.05262184143066406, -0.048821449279785156, -0.04502105712890625, -0.041220664978027344, -0.03742027282714844, -0.03361988067626953, -0.029819488525390625, -0.02601909637451172, -0.022218704223632812, -0.018418312072753906, -0.014617919921875, -0.010817527770996094, -0.0070171356201171875, -0.0032167434692382812, 0.000583648681640625, 0.004384040832519531, 0.008184432983398438, 0.011984825134277344, 0.01578521728515625, 0.019585609436035156, 0.023386001586914062, 0.02718639373779297, 0.030986785888671875, 0.03478717803955078, 0.03858757019042969, 0.042387962341308594, 0.0461883544921875, 0.049988746643066406, 0.05378913879394531, 0.05758953094482422, 0.061389923095703125, 0.06519031524658203, 0.06899070739746094, 0.07279109954833984, 0.07659149169921875, 0.08039188385009766, 0.08419227600097656, 0.08799266815185547, 0.09179306030273438, 0.09559345245361328, 0.09939384460449219, 0.1031942367553711, 0.10699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 12.0, 8.0, 19.0, 20.0, 25.0, 23.0, 45.0, 40.0, 46.0, 53.0, 42.0, 56.0, 50.0, 63.0, 64.0, 52.0, 57.0, 61.0, 49.0, 42.0, 27.0, 26.0, 24.0, 19.0, 19.0, 11.0, 10.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030792236328125, -0.029666900634765625, -0.02854156494140625, -0.027416229248046875, -0.0262908935546875, -0.025165557861328125, -0.02404022216796875, -0.022914886474609375, -0.02178955078125, -0.020664215087890625, -0.01953887939453125, -0.018413543701171875, -0.0172882080078125, -0.016162872314453125, -0.01503753662109375, -0.013912200927734375, -0.012786865234375, -0.011661529541015625, -0.01053619384765625, -0.009410858154296875, -0.0082855224609375, -0.007160186767578125, -0.00603485107421875, -0.004909515380859375, -0.0037841796875, -0.002658843994140625, -0.00153350830078125, -0.000408172607421875, 0.0007171630859375, 0.001842498779296875, 0.00296783447265625, 0.004093170166015625, 0.005218505859375, 0.006343841552734375, 0.00746917724609375, 0.008594512939453125, 0.0097198486328125, 0.010845184326171875, 0.01197052001953125, 0.013095855712890625, 0.01422119140625, 0.015346527099609375, 0.01647186279296875, 0.017597198486328125, 0.0187225341796875, 0.019847869873046875, 0.02097320556640625, 0.022098541259765625, 0.023223876953125, 0.024349212646484375, 0.02547454833984375, 0.026599884033203125, 0.0277252197265625, 0.028850555419921875, 0.02997589111328125, 0.031101226806640625, 0.0322265625, 0.033351898193359375, 0.03447723388671875, 0.035602569580078125, 0.0367279052734375, 0.037853240966796875, 0.03897857666015625, 0.040103912353515625, 0.041229248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 22.0, 25.0, 27.0, 38.0, 66.0, 87.0, 109.0, 131.0, 222.0, 305.0, 570.0, 992.0, 1992.0, 4874.0, 14218.0, 54503.0, 358490.0, 3460041.0, 235746.0, 41751.0, 11720.0, 4092.0, 1743.0, 927.0, 470.0, 332.0, 195.0, 146.0, 92.0, 78.0, 69.0, 50.0, 25.0, 19.0, 20.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.224853515625, -0.21831893920898438, -0.21178436279296875, -0.20524978637695312, -0.1987152099609375, -0.19218063354492188, -0.18564605712890625, -0.17911148071289062, -0.172576904296875, -0.16604232788085938, -0.15950775146484375, -0.15297317504882812, -0.1464385986328125, -0.13990402221679688, -0.13336944580078125, -0.12683486938476562, -0.12030029296875, -0.11376571655273438, -0.10723114013671875, -0.10069656372070312, -0.0941619873046875, -0.08762741088867188, -0.08109283447265625, -0.07455825805664062, -0.068023681640625, -0.061489105224609375, -0.05495452880859375, -0.048419952392578125, -0.0418853759765625, -0.035350799560546875, -0.02881622314453125, -0.022281646728515625, -0.0157470703125, -0.009212493896484375, -0.00267791748046875, 0.003856658935546875, 0.0103912353515625, 0.016925811767578125, 0.02346038818359375, 0.029994964599609375, 0.036529541015625, 0.043064117431640625, 0.04959869384765625, 0.056133270263671875, 0.0626678466796875, 0.06920242309570312, 0.07573699951171875, 0.08227157592773438, 0.08880615234375, 0.09534072875976562, 0.10187530517578125, 0.10840988159179688, 0.1149444580078125, 0.12147903442382812, 0.12801361083984375, 0.13454818725585938, 0.141082763671875, 0.14761734008789062, 0.15415191650390625, 0.16068649291992188, 0.1672210693359375, 0.17375564575195312, 0.18029022216796875, 0.18682479858398438, 0.193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 21.0, 39.0, 75.0, 134.0, 330.0, 1568.0, 1262.0, 303.0, 141.0, 62.0, 35.0, 21.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11498737335205078, -0.11101722717285156, -0.10704708099365234, -0.10307693481445312, -0.0991067886352539, -0.09513664245605469, -0.09116649627685547, -0.08719635009765625, -0.08322620391845703, -0.07925605773925781, -0.0752859115600586, -0.07131576538085938, -0.06734561920166016, -0.06337547302246094, -0.05940532684326172, -0.0554351806640625, -0.05146503448486328, -0.04749488830566406, -0.043524742126464844, -0.039554595947265625, -0.035584449768066406, -0.03161430358886719, -0.02764415740966797, -0.02367401123046875, -0.01970386505126953, -0.015733718872070312, -0.011763572692871094, -0.007793426513671875, -0.0038232803344726562, 0.0001468658447265625, 0.004117012023925781, 0.008087158203125, 0.012057304382324219, 0.016027450561523438, 0.019997596740722656, 0.023967742919921875, 0.027937889099121094, 0.03190803527832031, 0.03587818145751953, 0.03984832763671875, 0.04381847381591797, 0.04778861999511719, 0.051758766174316406, 0.055728912353515625, 0.059699058532714844, 0.06366920471191406, 0.06763935089111328, 0.0716094970703125, 0.07557964324951172, 0.07954978942871094, 0.08351993560791016, 0.08749008178710938, 0.0914602279663086, 0.09543037414550781, 0.09940052032470703, 0.10337066650390625, 0.10734081268310547, 0.11131095886230469, 0.1152811050415039, 0.11925125122070312, 0.12322139739990234, 0.12719154357910156, 0.13116168975830078, 0.1351318359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 9.0, 24.0, 45.0, 85.0, 124.0, 184.0, 156.0, 133.0, 97.0, 55.0, 42.0, 20.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9729800820350647, -0.9513079524040222, -0.9296358227729797, -0.9079636931419373, -0.8862915635108948, -0.8646194338798523, -0.8429473638534546, -0.8212752342224121, -0.7996031045913696, -0.7779309749603271, -0.7562588453292847, -0.7345867156982422, -0.7129145860671997, -0.6912424564361572, -0.6695703268051147, -0.6478981971740723, -0.6262260675430298, -0.6045539379119873, -0.5828818082809448, -0.5612096786499023, -0.5395375490188599, -0.5178654193878174, -0.4961933195590973, -0.4745211899280548, -0.45284906029701233, -0.43117693066596985, -0.40950480103492737, -0.3878327012062073, -0.3661605715751648, -0.3444884419441223, -0.32281631231307983, -0.30114418268203735, -0.2794719934463501, -0.2577998638153076, -0.23612773418426514, -0.21445561945438385, -0.19278348982334137, -0.1711113601922989, -0.1494392454624176, -0.12776711583137512, -0.10609498620033264, -0.08442285656929016, -0.06275073438882828, -0.041078612208366394, -0.019406482577323914, 0.002265647053718567, 0.023937761783599854, 0.045609891414642334, 0.06728202104568481, 0.0889541506767273, 0.11062627285718918, 0.13229839503765106, 0.15397052466869354, 0.17564265429973602, 0.1973147690296173, 0.2189868986606598, 0.24065902829170227, 0.26233115792274475, 0.28400328755378723, 0.3056753873825073, 0.3273475170135498, 0.3490196466445923, 0.37069177627563477, 0.39236390590667725, 0.4140360355377197]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 7.0, 9.0, 8.0, 16.0, 17.0, 17.0, 18.0, 25.0, 26.0, 28.0, 23.0, 27.0, 27.0, 35.0, 36.0, 44.0, 49.0, 48.0, 34.0, 48.0, 35.0, 33.0, 29.0, 36.0, 41.0, 27.0, 23.0, 32.0, 20.0, 23.0, 23.0, 16.0, 15.0, 17.0, 8.0, 10.0, 10.0, 9.0, 12.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.26798975467681885, -0.26048341393470764, -0.25297704339027405, -0.24547070264816284, -0.23796434700489044, -0.23045799136161804, -0.22295165061950684, -0.21544529497623444, -0.20793893933296204, -0.20043258368968964, -0.19292622804641724, -0.18541988730430603, -0.17791353166103363, -0.17040717601776123, -0.16290083527565002, -0.15539447963237762, -0.14788812398910522, -0.14038176834583282, -0.13287541270256042, -0.12536907196044922, -0.11786271631717682, -0.11035636067390442, -0.10285001248121262, -0.09534366428852081, -0.08783730864524841, -0.08033095300197601, -0.07282460480928421, -0.06531825661659241, -0.05781190097332001, -0.050305549055337906, -0.042799197137355804, -0.0352928452193737, -0.0277864933013916, -0.0202801413834095, -0.012773789465427399, -0.005267437547445297, 0.002238914370536804, 0.009745266288518906, 0.017251618206501007, 0.02475797012448311, 0.03226432204246521, 0.03977067396044731, 0.04727702587842941, 0.054783377796411514, 0.062289729714393616, 0.06979608535766602, 0.07730243355035782, 0.08480878174304962, 0.09231513738632202, 0.09982149302959442, 0.10732784122228622, 0.11483418941497803, 0.12234054505825043, 0.12984690070152283, 0.13735324144363403, 0.14485959708690643, 0.15236595273017883, 0.15987230837345123, 0.16737866401672363, 0.17488500475883484, 0.18239136040210724, 0.18989771604537964, 0.19740405678749084, 0.20491041243076324, 0.21241676807403564]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 8.0, 4.0, 7.0, 10.0, 9.0, 27.0, 22.0, 29.0, 56.0, 72.0, 117.0, 163.0, 342.0, 667.0, 1390.0, 2952.0, 6621.0, 13703.0, 27959.0, 64459.0, 348127.0, 444951.0, 76440.0, 31025.0, 15369.0, 7416.0, 3417.0, 1532.0, 734.0, 371.0, 202.0, 111.0, 63.0, 42.0, 33.0, 33.0, 20.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.119140625, -0.11542606353759766, -0.11171150207519531, -0.10799694061279297, -0.10428237915039062, -0.10056781768798828, -0.09685325622558594, -0.0931386947631836, -0.08942413330078125, -0.0857095718383789, -0.08199501037597656, -0.07828044891357422, -0.07456588745117188, -0.07085132598876953, -0.06713676452636719, -0.06342220306396484, -0.0597076416015625, -0.055993080139160156, -0.05227851867675781, -0.04856395721435547, -0.044849395751953125, -0.04113483428955078, -0.03742027282714844, -0.033705711364746094, -0.02999114990234375, -0.026276588439941406, -0.022562026977539062, -0.01884746551513672, -0.015132904052734375, -0.011418342590332031, -0.0077037811279296875, -0.003989219665527344, -0.000274658203125, 0.0034399032592773438, 0.0071544647216796875, 0.010869026184082031, 0.014583587646484375, 0.01829814910888672, 0.022012710571289062, 0.025727272033691406, 0.02944183349609375, 0.033156394958496094, 0.03687095642089844, 0.04058551788330078, 0.044300079345703125, 0.04801464080810547, 0.05172920227050781, 0.055443763732910156, 0.0591583251953125, 0.06287288665771484, 0.06658744812011719, 0.07030200958251953, 0.07401657104492188, 0.07773113250732422, 0.08144569396972656, 0.0851602554321289, 0.08887481689453125, 0.0925893783569336, 0.09630393981933594, 0.10001850128173828, 0.10373306274414062, 0.10744762420654297, 0.11116218566894531, 0.11487674713134766, 0.11859130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 16.0, 10.0, 15.0, 26.0, 15.0, 21.0, 28.0, 31.0, 24.0, 40.0, 22.0, 43.0, 27.0, 39.0, 43.0, 40.0, 44.0, 47.0, 35.0, 42.0, 33.0, 30.0, 42.0, 29.0, 37.0, 36.0, 18.0, 15.0, 17.0, 15.0, 7.0, 21.0, 6.0, 8.0, 14.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0261993408203125, -0.025350570678710938, -0.024501800537109375, -0.023653030395507812, -0.02280426025390625, -0.021955490112304688, -0.021106719970703125, -0.020257949829101562, -0.0194091796875, -0.018560409545898438, -0.017711639404296875, -0.016862869262695312, -0.01601409912109375, -0.015165328979492188, -0.014316558837890625, -0.013467788696289062, -0.0126190185546875, -0.011770248413085938, -0.010921478271484375, -0.010072708129882812, -0.00922393798828125, -0.008375167846679688, -0.007526397705078125, -0.0066776275634765625, -0.005828857421875, -0.0049800872802734375, -0.004131317138671875, -0.0032825469970703125, -0.00243377685546875, -0.0015850067138671875, -0.000736236572265625, 0.0001125335693359375, 0.0009613037109375, 0.0018100738525390625, 0.002658843994140625, 0.0035076141357421875, 0.00435638427734375, 0.0052051544189453125, 0.006053924560546875, 0.0069026947021484375, 0.00775146484375, 0.008600234985351562, 0.009449005126953125, 0.010297775268554688, 0.01114654541015625, 0.011995315551757812, 0.012844085693359375, 0.013692855834960938, 0.0145416259765625, 0.015390396118164062, 0.016239166259765625, 0.017087936401367188, 0.01793670654296875, 0.018785476684570312, 0.019634246826171875, 0.020483016967773438, 0.021331787109375, 0.022180557250976562, 0.023029327392578125, 0.023878097534179688, 0.02472686767578125, 0.025575637817382812, 0.026424407958984375, 0.027273178100585938, 0.0281219482421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 6.0, 10.0, 13.0, 20.0, 21.0, 36.0, 51.0, 88.0, 162.0, 208.0, 451.0, 941.0, 2422.0, 7056.0, 22383.0, 69406.0, 767240.0, 129440.0, 32029.0, 10460.0, 3450.0, 1285.0, 586.0, 298.0, 163.0, 114.0, 60.0, 40.0, 31.0, 22.0, 9.0, 8.0, 6.0, 12.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.228271484375, -0.2220458984375, -0.2158203125, -0.2095947265625, -0.203369140625, -0.1971435546875, -0.19091796875, -0.1846923828125, -0.178466796875, -0.1722412109375, -0.166015625, -0.1597900390625, -0.153564453125, -0.1473388671875, -0.14111328125, -0.1348876953125, -0.128662109375, -0.1224365234375, -0.1162109375, -0.1099853515625, -0.103759765625, -0.0975341796875, -0.09130859375, -0.0850830078125, -0.078857421875, -0.0726318359375, -0.06640625, -0.0601806640625, -0.053955078125, -0.0477294921875, -0.04150390625, -0.0352783203125, -0.029052734375, -0.0228271484375, -0.0166015625, -0.0103759765625, -0.004150390625, 0.0020751953125, 0.00830078125, 0.0145263671875, 0.020751953125, 0.0269775390625, 0.033203125, 0.0394287109375, 0.045654296875, 0.0518798828125, 0.05810546875, 0.0643310546875, 0.070556640625, 0.0767822265625, 0.0830078125, 0.0892333984375, 0.095458984375, 0.1016845703125, 0.10791015625, 0.1141357421875, 0.120361328125, 0.1265869140625, 0.1328125, 0.1390380859375, 0.145263671875, 0.1514892578125, 0.15771484375, 0.1639404296875, 0.170166015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 6.0, 5.0, 6.0, 17.0, 19.0, 23.0, 28.0, 32.0, 45.0, 53.0, 44.0, 54.0, 61.0, 74.0, 68.0, 71.0, 63.0, 45.0, 48.0, 43.0, 40.0, 28.0, 26.0, 16.0, 14.0, 16.0, 13.0, 6.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.20047950744628906, -0.19478225708007812, -0.1890850067138672, -0.18338775634765625, -0.1776905059814453, -0.17199325561523438, -0.16629600524902344, -0.1605987548828125, -0.15490150451660156, -0.14920425415039062, -0.1435070037841797, -0.13780975341796875, -0.1321125030517578, -0.12641525268554688, -0.12071800231933594, -0.115020751953125, -0.10932350158691406, -0.10362625122070312, -0.09792900085449219, -0.09223175048828125, -0.08653450012207031, -0.08083724975585938, -0.07513999938964844, -0.0694427490234375, -0.06374549865722656, -0.058048248291015625, -0.05235099792480469, -0.04665374755859375, -0.04095649719238281, -0.035259246826171875, -0.029561996459960938, -0.02386474609375, -0.018167495727539062, -0.012470245361328125, -0.0067729949951171875, -0.00107574462890625, 0.0046215057373046875, 0.010318756103515625, 0.016016006469726562, 0.0217132568359375, 0.027410507202148438, 0.033107757568359375, 0.03880500793457031, 0.04450225830078125, 0.05019950866699219, 0.055896759033203125, 0.06159400939941406, 0.067291259765625, 0.07298851013183594, 0.07868576049804688, 0.08438301086425781, 0.09008026123046875, 0.09577751159667969, 0.10147476196289062, 0.10717201232910156, 0.1128692626953125, 0.11856651306152344, 0.12426376342773438, 0.1299610137939453, 0.13565826416015625, 0.1413555145263672, 0.14705276489257812, 0.15275001525878906, 0.158447265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 11.0, 20.0, 23.0, 25.0, 38.0, 47.0, 95.0, 133.0, 203.0, 322.0, 563.0, 922.0, 1628.0, 2963.0, 6025.0, 12620.0, 28002.0, 69142.0, 606507.0, 233118.0, 46447.0, 20245.0, 9336.0, 4541.0, 2352.0, 1279.0, 744.0, 443.0, 265.0, 179.0, 90.0, 51.0, 44.0, 28.0, 31.0, 17.0, 14.0, 7.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0716552734375, -0.0695352554321289, -0.06741523742675781, -0.06529521942138672, -0.06317520141601562, -0.06105518341064453, -0.05893516540527344, -0.056815147399902344, -0.05469512939453125, -0.052575111389160156, -0.05045509338378906, -0.04833507537841797, -0.046215057373046875, -0.04409503936767578, -0.04197502136230469, -0.039855003356933594, -0.0377349853515625, -0.035614967346191406, -0.03349494934082031, -0.03137493133544922, -0.029254913330078125, -0.02713489532470703, -0.025014877319335938, -0.022894859313964844, -0.02077484130859375, -0.018654823303222656, -0.016534805297851562, -0.014414787292480469, -0.012294769287109375, -0.010174751281738281, -0.008054733276367188, -0.005934715270996094, -0.003814697265625, -0.0016946792602539062, 0.0004253387451171875, 0.0025453567504882812, 0.004665374755859375, 0.006785392761230469, 0.008905410766601562, 0.011025428771972656, 0.01314544677734375, 0.015265464782714844, 0.017385482788085938, 0.01950550079345703, 0.021625518798828125, 0.02374553680419922, 0.025865554809570312, 0.027985572814941406, 0.0301055908203125, 0.032225608825683594, 0.03434562683105469, 0.03646564483642578, 0.038585662841796875, 0.04070568084716797, 0.04282569885253906, 0.044945716857910156, 0.04706573486328125, 0.049185752868652344, 0.05130577087402344, 0.05342578887939453, 0.055545806884765625, 0.05766582489013672, 0.05978584289550781, 0.061905860900878906, 0.06402587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 15.0, 14.0, 27.0, 38.0, 44.0, 66.0, 75.0, 93.0, 109.0, 119.0, 107.0, 81.0, 56.0, 29.0, 25.0, 17.0, 19.0, 10.0, 17.0, 1.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.645917892456055e-05, -6.464775651693344e-05, -6.283633410930634e-05, -6.102491170167923e-05, -5.9213489294052124e-05, -5.740206688642502e-05, -5.559064447879791e-05, -5.377922207117081e-05, -5.19677996635437e-05, -5.0156377255916595e-05, -4.834495484828949e-05, -4.6533532440662384e-05, -4.472211003303528e-05, -4.291068762540817e-05, -4.109926521778107e-05, -3.928784281015396e-05, -3.7476420402526855e-05, -3.566499799489975e-05, -3.3853575587272644e-05, -3.204215317964554e-05, -3.0230730772018433e-05, -2.8419308364391327e-05, -2.660788595676422e-05, -2.4796463549137115e-05, -2.298504114151001e-05, -2.1173618733882904e-05, -1.93621963262558e-05, -1.7550773918628693e-05, -1.5739351511001587e-05, -1.3927929103374481e-05, -1.2116506695747375e-05, -1.030508428812027e-05, -8.493661880493164e-06, -6.682239472866058e-06, -4.870817065238953e-06, -3.059394657611847e-06, -1.2479722499847412e-06, 5.634501576423645e-07, 2.3748725652694702e-06, 4.186294972896576e-06, 5.997717380523682e-06, 7.809139788150787e-06, 9.620562195777893e-06, 1.1431984603404999e-05, 1.3243407011032104e-05, 1.505482941865921e-05, 1.6866251826286316e-05, 1.867767423391342e-05, 2.0489096641540527e-05, 2.2300519049167633e-05, 2.411194145679474e-05, 2.5923363864421844e-05, 2.773478627204895e-05, 2.9546208679676056e-05, 3.135763108730316e-05, 3.316905349493027e-05, 3.498047590255737e-05, 3.679189831018448e-05, 3.8603320717811584e-05, 4.041474312543869e-05, 4.2226165533065796e-05, 4.40375879406929e-05, 4.584901034832001e-05, 4.766043275594711e-05, 4.947185516357422e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 9.0, 9.0, 25.0, 42.0, 69.0, 151.0, 259.0, 593.0, 1562.0, 4633.0, 16197.0, 70088.0, 812799.0, 110708.0, 21933.0, 6041.0, 1968.0, 751.0, 342.0, 159.0, 85.0, 44.0, 30.0, 13.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08701324462890625, -0.0833282470703125, -0.07964324951171875, -0.075958251953125, -0.07227325439453125, -0.0685882568359375, -0.06490325927734375, -0.06121826171875, -0.05753326416015625, -0.0538482666015625, -0.05016326904296875, -0.046478271484375, -0.04279327392578125, -0.0391082763671875, -0.03542327880859375, -0.03173828125, -0.02805328369140625, -0.0243682861328125, -0.02068328857421875, -0.016998291015625, -0.01331329345703125, -0.0096282958984375, -0.00594329833984375, -0.00225830078125, 0.00142669677734375, 0.0051116943359375, 0.00879669189453125, 0.012481689453125, 0.01616668701171875, 0.0198516845703125, 0.02353668212890625, 0.0272216796875, 0.03090667724609375, 0.0345916748046875, 0.03827667236328125, 0.041961669921875, 0.04564666748046875, 0.0493316650390625, 0.05301666259765625, 0.05670166015625, 0.06038665771484375, 0.0640716552734375, 0.06775665283203125, 0.071441650390625, 0.07512664794921875, 0.0788116455078125, 0.08249664306640625, 0.086181640625, 0.08986663818359375, 0.0935516357421875, 0.09723663330078125, 0.100921630859375, 0.10460662841796875, 0.1082916259765625, 0.11197662353515625, 0.11566162109375, 0.11934661865234375, 0.1230316162109375, 0.12671661376953125, 0.130401611328125, 0.13408660888671875, 0.1377716064453125, 0.14145660400390625, 0.1451416015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 7.0, 7.0, 6.0, 8.0, 14.0, 26.0, 26.0, 37.0, 96.0, 150.0, 203.0, 146.0, 81.0, 44.0, 25.0, 14.0, 18.0, 11.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055267333984375, -0.0530095100402832, -0.050751686096191406, -0.04849386215209961, -0.04623603820800781, -0.043978214263916016, -0.04172039031982422, -0.03946256637573242, -0.037204742431640625, -0.03494691848754883, -0.03268909454345703, -0.030431270599365234, -0.028173446655273438, -0.02591562271118164, -0.023657798767089844, -0.021399974822998047, -0.01914215087890625, -0.016884326934814453, -0.014626502990722656, -0.01236867904663086, -0.010110855102539062, -0.007853031158447266, -0.005595207214355469, -0.003337383270263672, -0.001079559326171875, 0.0011782646179199219, 0.0034360885620117188, 0.005693912506103516, 0.007951736450195312, 0.01020956039428711, 0.012467384338378906, 0.014725208282470703, 0.0169830322265625, 0.019240856170654297, 0.021498680114746094, 0.02375650405883789, 0.026014328002929688, 0.028272151947021484, 0.03052997589111328, 0.03278779983520508, 0.035045623779296875, 0.03730344772338867, 0.03956127166748047, 0.041819095611572266, 0.04407691955566406, 0.04633474349975586, 0.048592567443847656, 0.05085039138793945, 0.05310821533203125, 0.05536603927612305, 0.057623863220214844, 0.05988168716430664, 0.06213951110839844, 0.06439733505249023, 0.06665515899658203, 0.06891298294067383, 0.07117080688476562, 0.07342863082885742, 0.07568645477294922, 0.07794427871704102, 0.08020210266113281, 0.08245992660522461, 0.0847177505493164, 0.0869755744934082, 0.0892333984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 10.0, 10.0, 28.0, 40.0, 69.0, 95.0, 131.0, 152.0, 149.0, 121.0, 78.0, 47.0, 37.0, 23.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5589745044708252, -1.5216351747512817, -1.4842958450317383, -1.4469563961029053, -1.4096170663833618, -1.3722777366638184, -1.334938406944275, -1.2975990772247314, -1.2602596282958984, -1.222920298576355, -1.1855809688568115, -1.1482415199279785, -1.110902190208435, -1.0735628604888916, -1.0362235307693481, -0.9988842010498047, -0.9615448713302612, -0.9242055416107178, -0.8868661522865295, -0.8495268225669861, -0.8121874332427979, -0.7748481035232544, -0.7375087738037109, -0.7001694440841675, -0.6628300547599792, -0.6254907250404358, -0.5881513357162476, -0.5508120059967041, -0.5134726762771606, -0.4761332869529724, -0.43879395723342896, -0.4014545977115631, -0.3641153573989868, -0.32677599787712097, -0.2894366383552551, -0.25209730863571167, -0.21475794911384583, -0.17741858959197998, -0.14007924497127533, -0.10273990035057068, -0.06540054082870483, -0.028061188757419586, 0.009278163313865662, 0.04661751538515091, 0.08395686745643616, 0.121296226978302, 0.15863557159900665, 0.1959749162197113, 0.23331427574157715, 0.270653635263443, 0.30799299478530884, 0.3453323245048523, 0.38267168402671814, 0.420011043548584, 0.45735037326812744, 0.4946897327899933, 0.5320290923118591, 0.5693684220314026, 0.6067078113555908, 0.6440471410751343, 0.6813864707946777, 0.718725860118866, 0.7560651898384094, 0.7934045791625977, 0.8307439088821411]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 9.0, 8.0, 17.0, 11.0, 20.0, 15.0, 23.0, 30.0, 40.0, 18.0, 38.0, 33.0, 46.0, 47.0, 38.0, 30.0, 46.0, 50.0, 46.0, 50.0, 51.0, 45.0, 42.0, 35.0, 26.0, 22.0, 24.0, 31.0, 17.0, 15.0, 17.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.7214030623435974, -0.7007407546043396, -0.680078387260437, -0.6594160795211792, -0.6387537717819214, -0.6180914044380188, -0.597429096698761, -0.5767667293548584, -0.5561044216156006, -0.5354421138763428, -0.5147797465324402, -0.4941174387931824, -0.4734551012516022, -0.452792763710022, -0.43213045597076416, -0.41146811842918396, -0.39080578088760376, -0.37014344334602356, -0.34948110580444336, -0.32881879806518555, -0.30815646052360535, -0.28749412298202515, -0.26683181524276733, -0.24616947770118713, -0.22550714015960693, -0.20484480261802673, -0.18418247997760773, -0.16352015733718872, -0.14285781979560852, -0.12219548970460892, -0.10153315961360931, -0.08087083697319031, -0.06020849943161011, -0.039546169340610504, -0.0188838392496109, 0.0017784908413887024, 0.022440820932388306, 0.04310315102338791, 0.06376548111438751, 0.08442780375480652, 0.10509014129638672, 0.12575247883796692, 0.14641480147838593, 0.16707712411880493, 0.18773946166038513, 0.20840179920196533, 0.22906412184238434, 0.24972644448280334, 0.27038878202438354, 0.29105111956596375, 0.31171345710754395, 0.33237576484680176, 0.35303810238838196, 0.37370043992996216, 0.39436274766921997, 0.41502508521080017, 0.43568742275238037, 0.45634976029396057, 0.47701209783554077, 0.4976744055747986, 0.5183367729187012, 0.538999080657959, 0.5596613883972168, 0.5803236961364746, 0.6009860634803772]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 10.0, 16.0, 26.0, 34.0, 55.0, 77.0, 144.0, 274.0, 506.0, 865.0, 1728.0, 3601.0, 8113.0, 20184.0, 60820.0, 303292.0, 3490451.0, 221863.0, 51017.0, 17356.0, 7174.0, 3221.0, 1584.0, 820.0, 445.0, 260.0, 141.0, 72.0, 58.0, 31.0, 16.0, 8.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1959228515625, -0.19054412841796875, -0.1851654052734375, -0.17978668212890625, -0.174407958984375, -0.16902923583984375, -0.1636505126953125, -0.15827178955078125, -0.15289306640625, -0.14751434326171875, -0.1421356201171875, -0.13675689697265625, -0.131378173828125, -0.12599945068359375, -0.1206207275390625, -0.11524200439453125, -0.10986328125, -0.10448455810546875, -0.0991058349609375, -0.09372711181640625, -0.088348388671875, -0.08296966552734375, -0.0775909423828125, -0.07221221923828125, -0.06683349609375, -0.06145477294921875, -0.0560760498046875, -0.05069732666015625, -0.045318603515625, -0.03993988037109375, -0.0345611572265625, -0.02918243408203125, -0.0238037109375, -0.01842498779296875, -0.0130462646484375, -0.00766754150390625, -0.002288818359375, 0.00308990478515625, 0.0084686279296875, 0.01384735107421875, 0.01922607421875, 0.02460479736328125, 0.0299835205078125, 0.03536224365234375, 0.040740966796875, 0.04611968994140625, 0.0514984130859375, 0.05687713623046875, 0.062255859375, 0.06763458251953125, 0.0730133056640625, 0.07839202880859375, 0.083770751953125, 0.08914947509765625, 0.0945281982421875, 0.09990692138671875, 0.10528564453125, 0.11066436767578125, 0.1160430908203125, 0.12142181396484375, 0.126800537109375, 0.13217926025390625, 0.1375579833984375, 0.14293670654296875, 0.1483154296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 1.0, 6.0, 3.0, 10.0, 11.0, 11.0, 11.0, 15.0, 26.0, 35.0, 22.0, 29.0, 39.0, 49.0, 50.0, 44.0, 50.0, 60.0, 55.0, 51.0, 68.0, 51.0, 45.0, 36.0, 39.0, 39.0, 18.0, 27.0, 19.0, 28.0, 20.0, 9.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.03185272216796875, -0.0306854248046875, -0.02951812744140625, -0.028350830078125, -0.02718353271484375, -0.0260162353515625, -0.02484893798828125, -0.023681640625, -0.02251434326171875, -0.0213470458984375, -0.02017974853515625, -0.019012451171875, -0.01784515380859375, -0.0166778564453125, -0.01551055908203125, -0.01434326171875, -0.01317596435546875, -0.0120086669921875, -0.01084136962890625, -0.009674072265625, -0.00850677490234375, -0.0073394775390625, -0.00617218017578125, -0.0050048828125, -0.00383758544921875, -0.0026702880859375, -0.00150299072265625, -0.000335693359375, 0.00083160400390625, 0.0019989013671875, 0.00316619873046875, 0.00433349609375, 0.00550079345703125, 0.0066680908203125, 0.00783538818359375, 0.009002685546875, 0.01016998291015625, 0.0113372802734375, 0.01250457763671875, 0.013671875, 0.01483917236328125, 0.0160064697265625, 0.01717376708984375, 0.018341064453125, 0.01950836181640625, 0.0206756591796875, 0.02184295654296875, 0.02301025390625, 0.02417755126953125, 0.0253448486328125, 0.02651214599609375, 0.027679443359375, 0.02884674072265625, 0.0300140380859375, 0.03118133544921875, 0.0323486328125, 0.03351593017578125, 0.0346832275390625, 0.03585052490234375, 0.037017822265625, 0.03818511962890625, 0.0393524169921875, 0.04051971435546875, 0.04168701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 14.0, 19.0, 25.0, 21.0, 41.0, 45.0, 86.0, 128.0, 191.0, 274.0, 452.0, 607.0, 1046.0, 1724.0, 2981.0, 5692.0, 13342.0, 38869.0, 174722.0, 3342947.0, 497887.0, 73593.0, 21231.0, 8518.0, 3925.0, 2166.0, 1324.0, 795.0, 571.0, 345.0, 183.0, 159.0, 119.0, 67.0, 51.0, 38.0, 25.0, 13.0, 8.0, 6.0, 5.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22071266174316406, -0.21303176879882812, -0.2053508758544922, -0.19766998291015625, -0.1899890899658203, -0.18230819702148438, -0.17462730407714844, -0.1669464111328125, -0.15926551818847656, -0.15158462524414062, -0.1439037322998047, -0.13622283935546875, -0.1285419464111328, -0.12086105346679688, -0.11318016052246094, -0.105499267578125, -0.09781837463378906, -0.09013748168945312, -0.08245658874511719, -0.07477569580078125, -0.06709480285644531, -0.059413909912109375, -0.05173301696777344, -0.0440521240234375, -0.03637123107910156, -0.028690338134765625, -0.021009445190429688, -0.01332855224609375, -0.0056476593017578125, 0.002033233642578125, 0.009714126586914062, 0.01739501953125, 0.025075912475585938, 0.032756805419921875, 0.04043769836425781, 0.04811859130859375, 0.05579948425292969, 0.06348037719726562, 0.07116127014160156, 0.0788421630859375, 0.08652305603027344, 0.09420394897460938, 0.10188484191894531, 0.10956573486328125, 0.11724662780761719, 0.12492752075195312, 0.13260841369628906, 0.140289306640625, 0.14797019958496094, 0.15565109252929688, 0.1633319854736328, 0.17101287841796875, 0.1786937713623047, 0.18637466430664062, 0.19405555725097656, 0.2017364501953125, 0.20941734313964844, 0.21709823608398438, 0.2247791290283203, 0.23246002197265625, 0.2401409149169922, 0.24782180786132812, 0.25550270080566406, 0.26318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 5.0, 15.0, 18.0, 21.0, 32.0, 51.0, 101.0, 155.0, 350.0, 2153.0, 596.0, 217.0, 129.0, 71.0, 31.0, 32.0, 18.0, 18.0, 7.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12058067321777344, -0.11677169799804688, -0.11296272277832031, -0.10915374755859375, -0.10534477233886719, -0.10153579711914062, -0.09772682189941406, -0.0939178466796875, -0.09010887145996094, -0.08629989624023438, -0.08249092102050781, -0.07868194580078125, -0.07487297058105469, -0.07106399536132812, -0.06725502014160156, -0.063446044921875, -0.05963706970214844, -0.055828094482421875, -0.05201911926269531, -0.04821014404296875, -0.04440116882324219, -0.040592193603515625, -0.03678321838378906, -0.0329742431640625, -0.029165267944335938, -0.025356292724609375, -0.021547317504882812, -0.01773834228515625, -0.013929367065429688, -0.010120391845703125, -0.0063114166259765625, -0.00250244140625, 0.0013065338134765625, 0.005115509033203125, 0.008924484252929688, 0.01273345947265625, 0.016542434692382812, 0.020351409912109375, 0.024160385131835938, 0.0279693603515625, 0.03177833557128906, 0.035587310791015625, 0.03939628601074219, 0.04320526123046875, 0.04701423645019531, 0.050823211669921875, 0.05463218688964844, 0.058441162109375, 0.06225013732910156, 0.06605911254882812, 0.06986808776855469, 0.07367706298828125, 0.07748603820800781, 0.08129501342773438, 0.08510398864746094, 0.0889129638671875, 0.09272193908691406, 0.09653091430664062, 0.10033988952636719, 0.10414886474609375, 0.10795783996582031, 0.11176681518554688, 0.11557579040527344, 0.119384765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 8.0, 31.0, 69.0, 116.0, 208.0, 217.0, 148.0, 105.0, 44.0, 23.0, 20.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5500032901763916, -0.5155172944068909, -0.48103129863739014, -0.4465453028678894, -0.41205930709838867, -0.37757331132888794, -0.3430872857570648, -0.3086012899875641, -0.27411529421806335, -0.23962929844856262, -0.2051433026790619, -0.17065729200839996, -0.13617129623889923, -0.1016853004693985, -0.06719928979873657, -0.03271329402923584, 0.0017727017402648926, 0.03625870123505592, 0.07074470072984695, 0.10523070394992828, 0.13971669971942902, 0.17420269548892975, 0.20868870615959167, 0.2431747019290924, 0.27766069769859314, 0.31214669346809387, 0.3466326892375946, 0.3811187148094177, 0.41560471057891846, 0.4500907063484192, 0.4845767021179199, 0.5190626978874207, 0.5535486936569214, 0.5880346894264221, 0.6225206851959229, 0.6570066809654236, 0.6914926767349243, 0.725978672504425, 0.7604646682739258, 0.7949507236480713, 0.8294366598129272, 0.863922655582428, 0.8984086513519287, 0.9328946471214294, 0.9673806428909302, 1.0018666982650757, 1.0363526344299316, 1.0708386898040771, 1.1053247451782227, 1.1398108005523682, 1.1742967367172241, 1.2087827920913696, 1.2432687282562256, 1.277754783630371, 1.312240719795227, 1.3467267751693726, 1.3812127113342285, 1.415698766708374, 1.45018470287323, 1.4846707582473755, 1.5191566944122314, 1.553642749786377, 1.588128685951233, 1.6226147413253784, 1.6571006774902344]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 7.0, 20.0, 9.0, 14.0, 12.0, 22.0, 23.0, 31.0, 22.0, 24.0, 24.0, 22.0, 35.0, 22.0, 31.0, 35.0, 45.0, 51.0, 31.0, 41.0, 41.0, 45.0, 34.0, 31.0, 34.0, 27.0, 30.0, 31.0, 26.0, 27.0, 25.0, 20.0, 13.0, 16.0, 9.0, 4.0, 14.0, 5.0, 9.0, 7.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3495801091194153, -0.33873802423477173, -0.32789596915245056, -0.317053884267807, -0.30621182918548584, -0.2953697443008423, -0.28452765941619873, -0.2736855745315552, -0.262843519449234, -0.25200143456459045, -0.2411593794822693, -0.23031729459762573, -0.21947522461414337, -0.208633154630661, -0.19779106974601746, -0.1869489997625351, -0.17610692977905273, -0.16526485979557037, -0.154422789812088, -0.14358070492744446, -0.1327386349439621, -0.12189656496047974, -0.11105448752641678, -0.10021241009235382, -0.08937034010887146, -0.0785282701253891, -0.06768619269132614, -0.05684411898255348, -0.04600204527378082, -0.03515997156500816, -0.024317897856235504, -0.013475820422172546, -0.0026337504386901855, 0.008208323270082474, 0.019050396978855133, 0.029892470687627792, 0.04073454439640045, 0.05157661810517311, 0.06241869181394577, 0.07326076924800873, 0.08410283923149109, 0.09494490921497345, 0.10578698664903641, 0.11662906408309937, 0.12747113406658173, 0.1383132040500641, 0.14915528893470764, 0.15999735891819, 0.17083942890167236, 0.18168149888515472, 0.19252356886863708, 0.20336565375328064, 0.214207723736763, 0.22504979372024536, 0.23589187860488892, 0.24673394858837128, 0.25757601857185364, 0.2684181034564972, 0.27926015853881836, 0.2901022434234619, 0.30094432830810547, 0.31178638339042664, 0.3226284682750702, 0.33347052335739136, 0.3443126082420349]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 15.0, 31.0, 30.0, 41.0, 67.0, 97.0, 145.0, 191.0, 292.0, 469.0, 844.0, 1386.0, 2461.0, 4637.0, 8755.0, 16611.0, 30758.0, 56811.0, 104118.0, 219823.0, 296327.0, 141606.0, 74227.0, 41057.0, 22163.0, 11559.0, 6230.0, 3302.0, 1799.0, 953.0, 617.0, 364.0, 215.0, 172.0, 103.0, 71.0, 57.0, 33.0, 31.0, 25.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.109588623046875, -0.1060791015625, -0.102569580078125, -0.09906005859375, -0.095550537109375, -0.092041015625, -0.088531494140625, -0.08502197265625, -0.081512451171875, -0.0780029296875, -0.074493408203125, -0.07098388671875, -0.067474365234375, -0.06396484375, -0.060455322265625, -0.05694580078125, -0.053436279296875, -0.0499267578125, -0.046417236328125, -0.04290771484375, -0.039398193359375, -0.035888671875, -0.032379150390625, -0.02886962890625, -0.025360107421875, -0.0218505859375, -0.018341064453125, -0.01483154296875, -0.011322021484375, -0.0078125, -0.004302978515625, -0.00079345703125, 0.002716064453125, 0.0062255859375, 0.009735107421875, 0.01324462890625, 0.016754150390625, 0.020263671875, 0.023773193359375, 0.02728271484375, 0.030792236328125, 0.0343017578125, 0.037811279296875, 0.04132080078125, 0.044830322265625, 0.04833984375, 0.051849365234375, 0.05535888671875, 0.058868408203125, 0.0623779296875, 0.065887451171875, 0.06939697265625, 0.072906494140625, 0.076416015625, 0.079925537109375, 0.08343505859375, 0.086944580078125, 0.0904541015625, 0.093963623046875, 0.09747314453125, 0.100982666015625, 0.1044921875, 0.108001708984375, 0.11151123046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 11.0, 6.0, 12.0, 12.0, 8.0, 18.0, 22.0, 17.0, 23.0, 26.0, 33.0, 29.0, 27.0, 23.0, 26.0, 45.0, 55.0, 50.0, 40.0, 33.0, 39.0, 52.0, 47.0, 37.0, 30.0, 46.0, 36.0, 30.0, 15.0, 28.0, 23.0, 16.0, 13.0, 12.0, 14.0, 9.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03515625, -0.0339818000793457, -0.032807350158691406, -0.03163290023803711, -0.030458450317382812, -0.029284000396728516, -0.02810955047607422, -0.026935100555419922, -0.025760650634765625, -0.024586200714111328, -0.02341175079345703, -0.022237300872802734, -0.021062850952148438, -0.01988840103149414, -0.018713951110839844, -0.017539501190185547, -0.01636505126953125, -0.015190601348876953, -0.014016151428222656, -0.01284170150756836, -0.011667251586914062, -0.010492801666259766, -0.009318351745605469, -0.008143901824951172, -0.006969451904296875, -0.005795001983642578, -0.004620552062988281, -0.0034461021423339844, -0.0022716522216796875, -0.0010972023010253906, 7.724761962890625e-05, 0.0012516975402832031, 0.0024261474609375, 0.003600597381591797, 0.004775047302246094, 0.005949497222900391, 0.0071239471435546875, 0.008298397064208984, 0.009472846984863281, 0.010647296905517578, 0.011821746826171875, 0.012996196746826172, 0.014170646667480469, 0.015345096588134766, 0.016519546508789062, 0.01769399642944336, 0.018868446350097656, 0.020042896270751953, 0.02121734619140625, 0.022391796112060547, 0.023566246032714844, 0.02474069595336914, 0.025915145874023438, 0.027089595794677734, 0.02826404571533203, 0.029438495635986328, 0.030612945556640625, 0.03178739547729492, 0.03296184539794922, 0.034136295318603516, 0.03531074523925781, 0.03648519515991211, 0.037659645080566406, 0.0388340950012207, 0.040008544921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 6.0, 13.0, 13.0, 15.0, 17.0, 24.0, 29.0, 52.0, 54.0, 79.0, 114.0, 155.0, 201.0, 280.0, 385.0, 563.0, 947.0, 1887.0, 4643.0, 13557.0, 44187.0, 145017.0, 562026.0, 188848.0, 56891.0, 17170.0, 5752.0, 2321.0, 1138.0, 613.0, 376.0, 311.0, 190.0, 153.0, 131.0, 104.0, 68.0, 55.0, 38.0, 29.0, 26.0, 19.0, 6.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.22412109375, -0.21724700927734375, -0.2103729248046875, -0.20349884033203125, -0.196624755859375, -0.18975067138671875, -0.1828765869140625, -0.17600250244140625, -0.16912841796875, -0.16225433349609375, -0.1553802490234375, -0.14850616455078125, -0.141632080078125, -0.13475799560546875, -0.1278839111328125, -0.12100982666015625, -0.1141357421875, -0.10726165771484375, -0.1003875732421875, -0.09351348876953125, -0.086639404296875, -0.07976531982421875, -0.0728912353515625, -0.06601715087890625, -0.05914306640625, -0.05226898193359375, -0.0453948974609375, -0.03852081298828125, -0.031646728515625, -0.02477264404296875, -0.0178985595703125, -0.01102447509765625, -0.004150390625, 0.00272369384765625, 0.0095977783203125, 0.01647186279296875, 0.023345947265625, 0.03022003173828125, 0.0370941162109375, 0.04396820068359375, 0.05084228515625, 0.05771636962890625, 0.0645904541015625, 0.07146453857421875, 0.078338623046875, 0.08521270751953125, 0.0920867919921875, 0.09896087646484375, 0.1058349609375, 0.11270904541015625, 0.1195831298828125, 0.12645721435546875, 0.133331298828125, 0.14020538330078125, 0.1470794677734375, 0.15395355224609375, 0.16082763671875, 0.16770172119140625, 0.1745758056640625, 0.18144989013671875, 0.188323974609375, 0.19519805908203125, 0.2020721435546875, 0.20894622802734375, 0.2158203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 3.0, 7.0, 7.0, 7.0, 15.0, 12.0, 19.0, 17.0, 17.0, 22.0, 37.0, 33.0, 35.0, 44.0, 35.0, 47.0, 57.0, 51.0, 54.0, 39.0, 57.0, 51.0, 39.0, 40.0, 21.0, 22.0, 32.0, 23.0, 25.0, 26.0, 18.0, 9.0, 11.0, 15.0, 5.0, 12.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.2347412109375, -0.22794151306152344, -0.22114181518554688, -0.2143421173095703, -0.20754241943359375, -0.2007427215576172, -0.19394302368164062, -0.18714332580566406, -0.1803436279296875, -0.17354393005371094, -0.16674423217773438, -0.1599445343017578, -0.15314483642578125, -0.1463451385498047, -0.13954544067382812, -0.13274574279785156, -0.125946044921875, -0.11914634704589844, -0.11234664916992188, -0.10554695129394531, -0.09874725341796875, -0.09194755554199219, -0.08514785766601562, -0.07834815979003906, -0.0715484619140625, -0.06474876403808594, -0.057949066162109375, -0.05114936828613281, -0.04434967041015625, -0.03754997253417969, -0.030750274658203125, -0.023950576782226562, -0.01715087890625, -0.010351181030273438, -0.003551483154296875, 0.0032482147216796875, 0.01004791259765625, 0.016847610473632812, 0.023647308349609375, 0.030447006225585938, 0.0372467041015625, 0.04404640197753906, 0.050846099853515625, 0.05764579772949219, 0.06444549560546875, 0.07124519348144531, 0.07804489135742188, 0.08484458923339844, 0.091644287109375, 0.09844398498535156, 0.10524368286132812, 0.11204338073730469, 0.11884307861328125, 0.1256427764892578, 0.13244247436523438, 0.13924217224121094, 0.1460418701171875, 0.15284156799316406, 0.15964126586914062, 0.1664409637451172, 0.17324066162109375, 0.1800403594970703, 0.18684005737304688, 0.19363975524902344, 0.200439453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 9.0, 7.0, 10.0, 24.0, 29.0, 48.0, 65.0, 127.0, 272.0, 600.0, 1663.0, 7778.0, 111757.0, 869151.0, 49852.0, 4997.0, 1217.0, 423.0, 192.0, 106.0, 69.0, 32.0, 36.0, 30.0, 19.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.426513671875, -0.4159507751464844, -0.40538787841796875, -0.3948249816894531, -0.3842620849609375, -0.3736991882324219, -0.36313629150390625, -0.3525733947753906, -0.342010498046875, -0.3314476013183594, -0.32088470458984375, -0.3103218078613281, -0.2997589111328125, -0.2891960144042969, -0.27863311767578125, -0.2680702209472656, -0.25750732421875, -0.24694442749023438, -0.23638153076171875, -0.22581863403320312, -0.2152557373046875, -0.20469284057617188, -0.19412994384765625, -0.18356704711914062, -0.173004150390625, -0.16244125366210938, -0.15187835693359375, -0.14131546020507812, -0.1307525634765625, -0.12018966674804688, -0.10962677001953125, -0.09906387329101562, -0.0885009765625, -0.07793807983398438, -0.06737518310546875, -0.056812286376953125, -0.0462493896484375, -0.035686492919921875, -0.02512359619140625, -0.014560699462890625, -0.003997802734375, 0.006565093994140625, 0.01712799072265625, 0.027690887451171875, 0.0382537841796875, 0.048816680908203125, 0.05937957763671875, 0.06994247436523438, 0.08050537109375, 0.09106826782226562, 0.10163116455078125, 0.11219406127929688, 0.1227569580078125, 0.13331985473632812, 0.14388275146484375, 0.15444564819335938, 0.165008544921875, 0.17557144165039062, 0.18613433837890625, 0.19669723510742188, 0.2072601318359375, 0.21782302856445312, 0.22838592529296875, 0.23894882202148438, 0.24951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 8.0, 10.0, 19.0, 18.0, 31.0, 50.0, 60.0, 88.0, 102.0, 114.0, 126.0, 99.0, 68.0, 61.0, 39.0, 34.0, 12.0, 18.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.772445678710938e-05, -7.520057260990143e-05, -7.267668843269348e-05, -7.015280425548553e-05, -6.762892007827759e-05, -6.510503590106964e-05, -6.25811517238617e-05, -6.005726754665375e-05, -5.75333833694458e-05, -5.5009499192237854e-05, -5.248561501502991e-05, -4.996173083782196e-05, -4.7437846660614014e-05, -4.491396248340607e-05, -4.239007830619812e-05, -3.986619412899017e-05, -3.7342309951782227e-05, -3.481842577457428e-05, -3.229454159736633e-05, -2.9770657420158386e-05, -2.724677324295044e-05, -2.4722889065742493e-05, -2.2199004888534546e-05, -1.96751207113266e-05, -1.7151236534118652e-05, -1.4627352356910706e-05, -1.2103468179702759e-05, -9.579584002494812e-06, -7.055699825286865e-06, -4.5318156480789185e-06, -2.0079314708709717e-06, 5.159527063369751e-07, 3.039836883544922e-06, 5.563721060752869e-06, 8.087605237960815e-06, 1.0611489415168762e-05, 1.3135373592376709e-05, 1.5659257769584656e-05, 1.8183141946792603e-05, 2.070702612400055e-05, 2.3230910301208496e-05, 2.5754794478416443e-05, 2.827867865562439e-05, 3.0802562832832336e-05, 3.332644701004028e-05, 3.585033118724823e-05, 3.837421536445618e-05, 4.0898099541664124e-05, 4.342198371887207e-05, 4.594586789608002e-05, 4.8469752073287964e-05, 5.099363625049591e-05, 5.351752042770386e-05, 5.6041404604911804e-05, 5.856528878211975e-05, 6.10891729593277e-05, 6.361305713653564e-05, 6.613694131374359e-05, 6.866082549095154e-05, 7.118470966815948e-05, 7.370859384536743e-05, 7.623247802257538e-05, 7.875636219978333e-05, 8.128024637699127e-05, 8.380413055419922e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 17.0, 16.0, 19.0, 22.0, 52.0, 88.0, 121.0, 216.0, 311.0, 580.0, 1134.0, 2575.0, 6361.0, 27516.0, 310319.0, 633411.0, 50336.0, 9045.0, 3175.0, 1482.0, 749.0, 388.0, 240.0, 116.0, 82.0, 57.0, 36.0, 23.0, 11.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.2254962921142578, -0.21869277954101562, -0.21188926696777344, -0.20508575439453125, -0.19828224182128906, -0.19147872924804688, -0.1846752166748047, -0.1778717041015625, -0.1710681915283203, -0.16426467895507812, -0.15746116638183594, -0.15065765380859375, -0.14385414123535156, -0.13705062866210938, -0.1302471160888672, -0.123443603515625, -0.11664009094238281, -0.10983657836914062, -0.10303306579589844, -0.09622955322265625, -0.08942604064941406, -0.08262252807617188, -0.07581901550292969, -0.0690155029296875, -0.06221199035644531, -0.055408477783203125, -0.04860496520996094, -0.04180145263671875, -0.03499794006347656, -0.028194427490234375, -0.021390914916992188, -0.01458740234375, -0.0077838897705078125, -0.000980377197265625, 0.0058231353759765625, 0.01262664794921875, 0.019430160522460938, 0.026233673095703125, 0.03303718566894531, 0.0398406982421875, 0.04664421081542969, 0.053447723388671875, 0.06025123596191406, 0.06705474853515625, 0.07385826110839844, 0.08066177368164062, 0.08746528625488281, 0.094268798828125, 0.10107231140136719, 0.10787582397460938, 0.11467933654785156, 0.12148284912109375, 0.12828636169433594, 0.13508987426757812, 0.1418933868408203, 0.1486968994140625, 0.1555004119873047, 0.16230392456054688, 0.16910743713378906, 0.17591094970703125, 0.18271446228027344, 0.18951797485351562, 0.1963214874267578, 0.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 8.0, 5.0, 4.0, 3.0, 12.0, 15.0, 34.0, 24.0, 43.0, 72.0, 73.0, 135.0, 175.0, 112.0, 83.0, 64.0, 47.0, 30.0, 19.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.17006874084472656, -0.16496658325195312, -0.1598644256591797, -0.15476226806640625, -0.1496601104736328, -0.14455795288085938, -0.13945579528808594, -0.1343536376953125, -0.12925148010253906, -0.12414932250976562, -0.11904716491699219, -0.11394500732421875, -0.10884284973144531, -0.10374069213867188, -0.09863853454589844, -0.093536376953125, -0.08843421936035156, -0.08333206176757812, -0.07822990417480469, -0.07312774658203125, -0.06802558898925781, -0.06292343139648438, -0.05782127380371094, -0.0527191162109375, -0.04761695861816406, -0.042514801025390625, -0.03741264343261719, -0.03231048583984375, -0.027208328247070312, -0.022106170654296875, -0.017004013061523438, -0.01190185546875, -0.0067996978759765625, -0.001697540283203125, 0.0034046173095703125, 0.00850677490234375, 0.013608932495117188, 0.018711090087890625, 0.023813247680664062, 0.0289154052734375, 0.03401756286621094, 0.039119720458984375, 0.04422187805175781, 0.04932403564453125, 0.05442619323730469, 0.059528350830078125, 0.06463050842285156, 0.069732666015625, 0.07483482360839844, 0.07993698120117188, 0.08503913879394531, 0.09014129638671875, 0.09524345397949219, 0.10034561157226562, 0.10544776916503906, 0.1105499267578125, 0.11565208435058594, 0.12075424194335938, 0.1258563995361328, 0.13095855712890625, 0.1360607147216797, 0.14116287231445312, 0.14626502990722656, 0.1513671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 14.0, 38.0, 54.0, 77.0, 115.0, 150.0, 159.0, 131.0, 91.0, 68.0, 43.0, 22.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583528995513916, -1.5179442167282104, -1.4523593187332153, -1.3867745399475098, -1.3211896419525146, -1.255604863166809, -1.1900200843811035, -1.1244351863861084, -1.0588504076004028, -0.9932655692100525, -0.9276807308197021, -0.8620959520339966, -0.7965111136436462, -0.7309262752532959, -0.6653414964675903, -0.59975665807724, -0.5341718196868896, -0.4685869812965393, -0.40300217270851135, -0.3374173641204834, -0.27183252573013306, -0.20624768733978271, -0.14066287875175476, -0.0750780701637268, -0.009493231773376465, 0.05609159171581268, 0.12167641520500183, 0.18726123869419098, 0.2528460621833801, 0.31843090057373047, 0.3840157091617584, 0.4496005177497864, 0.5151851177215576, 0.580769956111908, 0.6463547945022583, 0.7119395732879639, 0.7775244116783142, 0.8431092500686646, 0.9086940288543701, 0.9742788672447205, 1.0398637056350708, 1.1054484844207764, 1.1710333824157715, 1.236618161201477, 1.3022029399871826, 1.3677878379821777, 1.4333726167678833, 1.4989573955535889, 1.564542293548584, 1.6301270723342896, 1.6957119703292847, 1.7612967491149902, 1.8268816471099854, 1.892466425895691, 1.9580512046813965, 2.0236361026763916, 2.0892210006713867, 2.154805898666382, 2.220390558242798, 2.285975456237793, 2.351560354232788, 2.417145252227783, 2.482729911804199, 2.5483148097991943, 2.6138994693756104]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 11.0, 9.0, 9.0, 11.0, 17.0, 19.0, 17.0, 17.0, 22.0, 30.0, 22.0, 29.0, 31.0, 36.0, 35.0, 31.0, 39.0, 47.0, 53.0, 48.0, 37.0, 49.0, 31.0, 43.0, 39.0, 42.0, 38.0, 28.0, 17.0, 21.0, 19.0, 15.0, 10.0, 15.0, 13.0, 8.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-1.1979303359985352, -1.1631454229354858, -1.1283605098724365, -1.0935757160186768, -1.0587908029556274, -1.0240058898925781, -0.9892209768295288, -0.9544361233711243, -0.9196512699127197, -0.8848663568496704, -0.8500815033912659, -0.8152965903282166, -0.780511736869812, -0.7457268238067627, -0.7109419107437134, -0.6761570572853088, -0.6413721442222595, -0.6065872311592102, -0.5718023777008057, -0.5370174646377563, -0.5022326111793518, -0.4674476981163025, -0.43266281485557556, -0.39787793159484863, -0.3630930483341217, -0.3283081650733948, -0.29352328181266785, -0.2587383985519409, -0.2239535003900528, -0.18916861712932587, -0.15438371896743774, -0.11959883570671082, -0.08481395244598389, -0.05002906545996666, -0.015244178473949432, 0.019540712237358093, 0.05432559549808502, 0.08911047875881195, 0.12389537692070007, 0.158680260181427, 0.19346514344215393, 0.22825002670288086, 0.2630349099636078, 0.2978197932243347, 0.33260470628738403, 0.3673895597457886, 0.4021744728088379, 0.4369593560695648, 0.47174423933029175, 0.5065291523933411, 0.5413140058517456, 0.5760989189147949, 0.6108837723731995, 0.6456686854362488, 0.6804535388946533, 0.7152384519577026, 0.750023365020752, 0.7848082780838013, 0.8195931315422058, 0.8543780446052551, 0.8891628980636597, 0.923947811126709, 0.9587327241897583, 0.9935175776481628, 1.0283024311065674]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 30.0, 35.0, 49.0, 96.0, 126.0, 171.0, 280.0, 486.0, 836.0, 1331.0, 2272.0, 4554.0, 8752.0, 18639.0, 43829.0, 125255.0, 669655.0, 2987207.0, 214559.0, 64743.0, 25998.0, 11850.0, 5945.0, 3177.0, 1764.0, 979.0, 583.0, 361.0, 219.0, 142.0, 94.0, 66.0, 42.0, 32.0, 24.0, 16.0, 3.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.1438770294189453, -0.13895034790039062, -0.13402366638183594, -0.12909698486328125, -0.12417030334472656, -0.11924362182617188, -0.11431694030761719, -0.1093902587890625, -0.10446357727050781, -0.09953689575195312, -0.09461021423339844, -0.08968353271484375, -0.08475685119628906, -0.07983016967773438, -0.07490348815917969, -0.069976806640625, -0.06505012512207031, -0.060123443603515625, -0.05519676208496094, -0.05027008056640625, -0.04534339904785156, -0.040416717529296875, -0.03549003601074219, -0.0305633544921875, -0.025636672973632812, -0.020709991455078125, -0.015783309936523438, -0.01085662841796875, -0.0059299468994140625, -0.001003265380859375, 0.0039234161376953125, 0.00885009765625, 0.013776779174804688, 0.018703460693359375, 0.023630142211914062, 0.02855682373046875, 0.03348350524902344, 0.038410186767578125, 0.04333686828613281, 0.0482635498046875, 0.05319023132324219, 0.058116912841796875, 0.06304359436035156, 0.06797027587890625, 0.07289695739746094, 0.07782363891601562, 0.08275032043457031, 0.087677001953125, 0.09260368347167969, 0.09753036499023438, 0.10245704650878906, 0.10738372802734375, 0.11231040954589844, 0.11723709106445312, 0.12216377258300781, 0.1270904541015625, 0.1320171356201172, 0.13694381713867188, 0.14187049865722656, 0.14679718017578125, 0.15172386169433594, 0.15665054321289062, 0.1615772247314453, 0.16650390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 12.0, 8.0, 9.0, 24.0, 21.0, 23.0, 26.0, 27.0, 28.0, 32.0, 40.0, 38.0, 33.0, 57.0, 46.0, 60.0, 46.0, 47.0, 40.0, 39.0, 54.0, 38.0, 31.0, 30.0, 29.0, 30.0, 21.0, 15.0, 19.0, 13.0, 11.0, 8.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.04653644561767578, -0.04512977600097656, -0.043723106384277344, -0.042316436767578125, -0.040909767150878906, -0.03950309753417969, -0.03809642791748047, -0.03668975830078125, -0.03528308868408203, -0.03387641906738281, -0.032469749450683594, -0.031063079833984375, -0.029656410217285156, -0.028249740600585938, -0.02684307098388672, -0.0254364013671875, -0.02402973175048828, -0.022623062133789062, -0.021216392517089844, -0.019809722900390625, -0.018403053283691406, -0.016996383666992188, -0.015589714050292969, -0.01418304443359375, -0.012776374816894531, -0.011369705200195312, -0.009963035583496094, -0.008556365966796875, -0.007149696350097656, -0.0057430267333984375, -0.004336357116699219, -0.0029296875, -0.0015230178833007812, -0.0001163482666015625, 0.0012903213500976562, 0.002696990966796875, 0.004103660583496094, 0.0055103302001953125, 0.006916999816894531, 0.00832366943359375, 0.009730339050292969, 0.011137008666992188, 0.012543678283691406, 0.013950347900390625, 0.015357017517089844, 0.016763687133789062, 0.01817035675048828, 0.0195770263671875, 0.02098369598388672, 0.022390365600585938, 0.023797035217285156, 0.025203704833984375, 0.026610374450683594, 0.028017044067382812, 0.02942371368408203, 0.03083038330078125, 0.03223705291748047, 0.03364372253417969, 0.035050392150878906, 0.036457061767578125, 0.037863731384277344, 0.03927040100097656, 0.04067707061767578, 0.042083740234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 8.0, 14.0, 26.0, 35.0, 31.0, 53.0, 79.0, 132.0, 168.0, 224.0, 371.0, 594.0, 1083.0, 2144.0, 5289.0, 15918.0, 64077.0, 463158.0, 3385403.0, 199435.0, 37699.0, 10504.0, 3797.0, 1637.0, 832.0, 483.0, 331.0, 252.0, 137.0, 98.0, 66.0, 57.0, 33.0, 20.0, 21.0, 16.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2672767639160156, -0.25672149658203125, -0.24616622924804688, -0.2356109619140625, -0.22505569458007812, -0.21450042724609375, -0.20394515991210938, -0.193389892578125, -0.18283462524414062, -0.17227935791015625, -0.16172409057617188, -0.1511688232421875, -0.14061355590820312, -0.13005828857421875, -0.11950302124023438, -0.10894775390625, -0.09839248657226562, -0.08783721923828125, -0.07728195190429688, -0.0667266845703125, -0.056171417236328125, -0.04561614990234375, -0.035060882568359375, -0.024505615234375, -0.013950347900390625, -0.00339508056640625, 0.007160186767578125, 0.0177154541015625, 0.028270721435546875, 0.03882598876953125, 0.049381256103515625, 0.0599365234375, 0.07049179077148438, 0.08104705810546875, 0.09160232543945312, 0.1021575927734375, 0.11271286010742188, 0.12326812744140625, 0.13382339477539062, 0.144378662109375, 0.15493392944335938, 0.16548919677734375, 0.17604446411132812, 0.1865997314453125, 0.19715499877929688, 0.20771026611328125, 0.21826553344726562, 0.22882080078125, 0.23937606811523438, 0.24993133544921875, 0.2604866027832031, 0.2710418701171875, 0.2815971374511719, 0.29215240478515625, 0.3027076721191406, 0.313262939453125, 0.3238182067871094, 0.33437347412109375, 0.3449287414550781, 0.3554840087890625, 0.3660392761230469, 0.37659454345703125, 0.3871498107910156, 0.397705078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 9.0, 9.0, 20.0, 32.0, 32.0, 75.0, 131.0, 256.0, 1021.0, 1721.0, 310.0, 207.0, 90.0, 53.0, 26.0, 27.0, 15.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2645606994628906, -0.25812530517578125, -0.2516899108886719, -0.2452545166015625, -0.23881912231445312, -0.23238372802734375, -0.22594833374023438, -0.219512939453125, -0.21307754516601562, -0.20664215087890625, -0.20020675659179688, -0.1937713623046875, -0.18733596801757812, -0.18090057373046875, -0.17446517944335938, -0.16802978515625, -0.16159439086914062, -0.15515899658203125, -0.14872360229492188, -0.1422882080078125, -0.13585281372070312, -0.12941741943359375, -0.12298202514648438, -0.116546630859375, -0.11011123657226562, -0.10367584228515625, -0.09724044799804688, -0.0908050537109375, -0.08436965942382812, -0.07793426513671875, -0.07149887084960938, -0.0650634765625, -0.058628082275390625, -0.05219268798828125, -0.045757293701171875, -0.0393218994140625, -0.032886505126953125, -0.02645111083984375, -0.020015716552734375, -0.013580322265625, -0.007144927978515625, -0.00070953369140625, 0.005725860595703125, 0.0121612548828125, 0.018596649169921875, 0.02503204345703125, 0.031467437744140625, 0.03790283203125, 0.044338226318359375, 0.05077362060546875, 0.057209014892578125, 0.0636444091796875, 0.07007980346679688, 0.07651519775390625, 0.08295059204101562, 0.089385986328125, 0.09582138061523438, 0.10225677490234375, 0.10869216918945312, 0.1151275634765625, 0.12156295776367188, 0.12799835205078125, 0.13443374633789062, 0.140869140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 13.0, 29.0, 70.0, 204.0, 324.0, 223.0, 101.0, 19.0, 13.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.812553882598877, -3.7325737476348877, -3.6525933742523193, -3.57261323928833, -3.492633104324341, -3.4126529693603516, -3.332672595977783, -3.252692461013794, -3.1727123260498047, -3.0927321910858154, -3.012751817703247, -2.932771682739258, -2.8527915477752686, -2.7728114128112793, -2.692831039428711, -2.6128509044647217, -2.5328707695007324, -2.452890634536743, -2.372910261154175, -2.2929301261901855, -2.2129499912261963, -2.132969856262207, -2.0529894828796387, -1.9730093479156494, -1.893028974533081, -1.8130487203598022, -1.733068585395813, -1.6530883312225342, -1.573108196258545, -1.4931279420852661, -1.4131476879119873, -1.333167552947998, -1.2531875371932983, -1.1732072830200195, -1.0932271480560303, -1.0132468938827515, -0.9332667589187622, -0.8532865047454834, -0.7733063101768494, -0.6933261156082153, -0.6133459210395813, -0.5333657264709473, -0.45338553190231323, -0.3734053075313568, -0.2934251129627228, -0.21344491839408875, -0.13346469402313232, -0.05348449945449829, 0.026495695114135742, 0.10647589713335037, 0.186456099152565, 0.26643630862236023, 0.34641650319099426, 0.4263966977596283, 0.5063769221305847, 0.5863571166992188, 0.6663373112678528, 0.7463175058364868, 0.8262977004051208, 0.9062778949737549, 0.9862581491470337, 1.066238284111023, 1.1462185382843018, 1.226198673248291, 1.3061789274215698]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 15.0, 13.0, 25.0, 32.0, 28.0, 44.0, 28.0, 39.0, 24.0, 37.0, 45.0, 44.0, 54.0, 56.0, 45.0, 39.0, 50.0, 42.0, 35.0, 46.0, 36.0, 36.0, 33.0, 32.0, 21.0, 13.0, 11.0, 14.0, 8.0, 10.0, 9.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5369692444801331, -0.5185194611549377, -0.5000696778297424, -0.4816198945045471, -0.4631701111793518, -0.4447203278541565, -0.4262705147266388, -0.4078207314014435, -0.38937094807624817, -0.37092116475105286, -0.35247138142585754, -0.33402159810066223, -0.31557178497314453, -0.2971220016479492, -0.2786722183227539, -0.2602224349975586, -0.24177265167236328, -0.22332286834716797, -0.20487308502197266, -0.18642328679561615, -0.16797350347042084, -0.14952372014522552, -0.13107392191886902, -0.1126241385936737, -0.0941743552684784, -0.07572457194328308, -0.05727478116750717, -0.03882499411702156, -0.02037520706653595, -0.0019254237413406372, 0.016524367034435272, 0.03497415781021118, 0.05342400074005127, 0.07187378406524658, 0.09032357484102249, 0.1087733656167984, 0.1272231489419937, 0.14567293226718903, 0.16412273049354553, 0.18257251381874084, 0.20102229714393616, 0.21947208046913147, 0.23792186379432678, 0.2563716471195221, 0.2748214602470398, 0.2932712435722351, 0.3117210268974304, 0.33017081022262573, 0.34862059354782104, 0.36707037687301636, 0.38552016019821167, 0.403969943523407, 0.4224197268486023, 0.4408695101737976, 0.4593193233013153, 0.4777691066265106, 0.49621888995170593, 0.5146687030792236, 0.533118486404419, 0.5515682697296143, 0.5700180530548096, 0.5884678363800049, 0.6069176197052002, 0.6253674030303955, 0.6438171863555908]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 1.0, 7.0, 18.0, 26.0, 29.0, 55.0, 78.0, 131.0, 187.0, 260.0, 438.0, 767.0, 1336.0, 2276.0, 4100.0, 7388.0, 14121.0, 27267.0, 53901.0, 109728.0, 213314.0, 271654.0, 169939.0, 83604.0, 41551.0, 21521.0, 10907.0, 5923.0, 3407.0, 1841.0, 1131.0, 614.0, 382.0, 234.0, 148.0, 92.0, 50.0, 42.0, 29.0, 21.0, 6.0, 12.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1276378631591797, -0.12356185913085938, -0.11948585510253906, -0.11540985107421875, -0.11133384704589844, -0.10725784301757812, -0.10318183898925781, -0.0991058349609375, -0.09502983093261719, -0.09095382690429688, -0.08687782287597656, -0.08280181884765625, -0.07872581481933594, -0.07464981079101562, -0.07057380676269531, -0.066497802734375, -0.06242179870605469, -0.058345794677734375, -0.05426979064941406, -0.05019378662109375, -0.04611778259277344, -0.042041778564453125, -0.03796577453613281, -0.0338897705078125, -0.029813766479492188, -0.025737762451171875, -0.021661758422851562, -0.01758575439453125, -0.013509750366210938, -0.009433746337890625, -0.0053577423095703125, -0.00128173828125, 0.0027942657470703125, 0.006870269775390625, 0.010946273803710938, 0.01502227783203125, 0.019098281860351562, 0.023174285888671875, 0.027250289916992188, 0.0313262939453125, 0.03540229797363281, 0.039478302001953125, 0.04355430603027344, 0.04763031005859375, 0.05170631408691406, 0.055782318115234375, 0.05985832214355469, 0.063934326171875, 0.06801033020019531, 0.07208633422851562, 0.07616233825683594, 0.08023834228515625, 0.08431434631347656, 0.08839035034179688, 0.09246635437011719, 0.0965423583984375, 0.10061836242675781, 0.10469436645507812, 0.10877037048339844, 0.11284637451171875, 0.11692237854003906, 0.12099838256835938, 0.1250743865966797, 0.129150390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 23.0, 17.0, 27.0, 11.0, 29.0, 23.0, 36.0, 32.0, 42.0, 43.0, 43.0, 52.0, 42.0, 47.0, 43.0, 41.0, 33.0, 38.0, 40.0, 37.0, 28.0, 29.0, 30.0, 34.0, 21.0, 23.0, 17.0, 12.0, 15.0, 8.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.053375244140625, -0.05192375183105469, -0.050472259521484375, -0.04902076721191406, -0.04756927490234375, -0.04611778259277344, -0.044666290283203125, -0.04321479797363281, -0.0417633056640625, -0.04031181335449219, -0.038860321044921875, -0.03740882873535156, -0.03595733642578125, -0.03450584411621094, -0.033054351806640625, -0.03160285949707031, -0.0301513671875, -0.028699874877929688, -0.027248382568359375, -0.025796890258789062, -0.02434539794921875, -0.022893905639648438, -0.021442413330078125, -0.019990921020507812, -0.0185394287109375, -0.017087936401367188, -0.015636444091796875, -0.014184951782226562, -0.01273345947265625, -0.011281967163085938, -0.009830474853515625, -0.008378982543945312, -0.006927490234375, -0.0054759979248046875, -0.004024505615234375, -0.0025730133056640625, -0.00112152099609375, 0.0003299713134765625, 0.001781463623046875, 0.0032329559326171875, 0.0046844482421875, 0.0061359405517578125, 0.007587432861328125, 0.009038925170898438, 0.01049041748046875, 0.011941909790039062, 0.013393402099609375, 0.014844894409179688, 0.01629638671875, 0.017747879028320312, 0.019199371337890625, 0.020650863647460938, 0.02210235595703125, 0.023553848266601562, 0.025005340576171875, 0.026456832885742188, 0.0279083251953125, 0.029359817504882812, 0.030811309814453125, 0.03226280212402344, 0.03371429443359375, 0.03516578674316406, 0.036617279052734375, 0.03806877136230469, 0.039520263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 6.0, 6.0, 13.0, 10.0, 23.0, 30.0, 35.0, 46.0, 65.0, 97.0, 141.0, 224.0, 377.0, 571.0, 1283.0, 2760.0, 7724.0, 28573.0, 148352.0, 596558.0, 207935.0, 37562.0, 9483.0, 3300.0, 1400.0, 697.0, 430.0, 262.0, 183.0, 139.0, 79.0, 44.0, 38.0, 36.0, 22.0, 12.0, 9.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38037109375, -0.3699760437011719, -0.35958099365234375, -0.3491859436035156, -0.3387908935546875, -0.3283958435058594, -0.31800079345703125, -0.3076057434082031, -0.297210693359375, -0.2868156433105469, -0.27642059326171875, -0.2660255432128906, -0.2556304931640625, -0.24523544311523438, -0.23484039306640625, -0.22444534301757812, -0.21405029296875, -0.20365524291992188, -0.19326019287109375, -0.18286514282226562, -0.1724700927734375, -0.16207504272460938, -0.15167999267578125, -0.14128494262695312, -0.130889892578125, -0.12049484252929688, -0.11009979248046875, -0.09970474243164062, -0.0893096923828125, -0.07891464233398438, -0.06851959228515625, -0.058124542236328125, -0.0477294921875, -0.037334442138671875, -0.02693939208984375, -0.016544342041015625, -0.0061492919921875, 0.004245758056640625, 0.01464080810546875, 0.025035858154296875, 0.035430908203125, 0.045825958251953125, 0.05622100830078125, 0.06661605834960938, 0.0770111083984375, 0.08740615844726562, 0.09780120849609375, 0.10819625854492188, 0.11859130859375, 0.12898635864257812, 0.13938140869140625, 0.14977645874023438, 0.1601715087890625, 0.17056655883789062, 0.18096160888671875, 0.19135665893554688, 0.201751708984375, 0.21214675903320312, 0.22254180908203125, 0.23293685913085938, 0.2433319091796875, 0.2537269592285156, 0.26412200927734375, 0.2745170593261719, 0.284912109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 3.0, 5.0, 5.0, 8.0, 18.0, 12.0, 12.0, 23.0, 20.0, 20.0, 17.0, 33.0, 45.0, 36.0, 37.0, 39.0, 49.0, 55.0, 55.0, 58.0, 52.0, 51.0, 46.0, 41.0, 34.0, 28.0, 33.0, 38.0, 30.0, 19.0, 17.0, 12.0, 12.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.36083984375, -0.3508110046386719, -0.34078216552734375, -0.3307533264160156, -0.3207244873046875, -0.3106956481933594, -0.30066680908203125, -0.2906379699707031, -0.280609130859375, -0.2705802917480469, -0.26055145263671875, -0.2505226135253906, -0.2404937744140625, -0.23046493530273438, -0.22043609619140625, -0.21040725708007812, -0.20037841796875, -0.19034957885742188, -0.18032073974609375, -0.17029190063476562, -0.1602630615234375, -0.15023422241210938, -0.14020538330078125, -0.13017654418945312, -0.120147705078125, -0.11011886596679688, -0.10009002685546875, -0.09006118774414062, -0.0800323486328125, -0.07000350952148438, -0.05997467041015625, -0.049945831298828125, -0.0399169921875, -0.029888153076171875, -0.01985931396484375, -0.009830474853515625, 0.0001983642578125, 0.010227203369140625, 0.02025604248046875, 0.030284881591796875, 0.040313720703125, 0.050342559814453125, 0.06037139892578125, 0.07040023803710938, 0.0804290771484375, 0.09045791625976562, 0.10048675537109375, 0.11051559448242188, 0.12054443359375, 0.13057327270507812, 0.14060211181640625, 0.15063095092773438, 0.1606597900390625, 0.17068862915039062, 0.18071746826171875, 0.19074630737304688, 0.200775146484375, 0.21080398559570312, 0.22083282470703125, 0.23086166381835938, 0.2408905029296875, 0.2509193420410156, 0.26094818115234375, 0.2709770202636719, 0.281005859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 2.0, 3.0, 7.0, 16.0, 13.0, 22.0, 26.0, 34.0, 64.0, 105.0, 176.0, 339.0, 678.0, 1296.0, 2838.0, 7585.0, 22981.0, 98642.0, 461058.0, 354430.0, 70156.0, 17373.0, 5919.0, 2413.0, 1111.0, 556.0, 265.0, 161.0, 106.0, 55.0, 34.0, 25.0, 21.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.14972496032714844, -0.14454269409179688, -0.1393604278564453, -0.13417816162109375, -0.1289958953857422, -0.12381362915039062, -0.11863136291503906, -0.1134490966796875, -0.10826683044433594, -0.10308456420898438, -0.09790229797363281, -0.09272003173828125, -0.08753776550292969, -0.08235549926757812, -0.07717323303222656, -0.071990966796875, -0.06680870056152344, -0.061626434326171875, -0.05644416809082031, -0.05126190185546875, -0.04607963562011719, -0.040897369384765625, -0.03571510314941406, -0.0305328369140625, -0.025350570678710938, -0.020168304443359375, -0.014986038208007812, -0.00980377197265625, -0.0046215057373046875, 0.000560760498046875, 0.0057430267333984375, 0.01092529296875, 0.016107559204101562, 0.021289825439453125, 0.026472091674804688, 0.03165435791015625, 0.03683662414550781, 0.042018890380859375, 0.04720115661621094, 0.0523834228515625, 0.05756568908691406, 0.06274795532226562, 0.06793022155761719, 0.07311248779296875, 0.07829475402832031, 0.08347702026367188, 0.08865928649902344, 0.093841552734375, 0.09902381896972656, 0.10420608520507812, 0.10938835144042969, 0.11457061767578125, 0.11975288391113281, 0.12493515014648438, 0.13011741638183594, 0.1352996826171875, 0.14048194885253906, 0.14566421508789062, 0.1508464813232422, 0.15602874755859375, 0.1612110137939453, 0.16639328002929688, 0.17157554626464844, 0.1767578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 17.0, 12.0, 13.0, 24.0, 33.0, 41.0, 34.0, 47.0, 50.0, 61.0, 59.0, 36.0, 63.0, 60.0, 52.0, 57.0, 44.0, 39.0, 35.0, 33.0, 38.0, 25.0, 17.0, 18.0, 11.0, 11.0, 10.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6372413635253906e-05, -4.494283348321915e-05, -4.351325333118439e-05, -4.208367317914963e-05, -4.065409302711487e-05, -3.922451287508011e-05, -3.779493272304535e-05, -3.636535257101059e-05, -3.493577241897583e-05, -3.350619226694107e-05, -3.207661211490631e-05, -3.064703196287155e-05, -2.9217451810836792e-05, -2.7787871658802032e-05, -2.6358291506767273e-05, -2.4928711354732513e-05, -2.3499131202697754e-05, -2.2069551050662994e-05, -2.0639970898628235e-05, -1.9210390746593475e-05, -1.7780810594558716e-05, -1.6351230442523956e-05, -1.4921650290489197e-05, -1.3492070138454437e-05, -1.2062489986419678e-05, -1.0632909834384918e-05, -9.203329682350159e-06, -7.7737495303154e-06, -6.34416937828064e-06, -4.91458922624588e-06, -3.4850090742111206e-06, -2.055428922176361e-06, -6.258487701416016e-07, 8.03731381893158e-07, 2.2333115339279175e-06, 3.662891685962677e-06, 5.0924718379974365e-06, 6.522051990032196e-06, 7.951632142066956e-06, 9.381212294101715e-06, 1.0810792446136475e-05, 1.2240372598171234e-05, 1.3669952750205994e-05, 1.5099532902240753e-05, 1.6529113054275513e-05, 1.7958693206310272e-05, 1.9388273358345032e-05, 2.081785351037979e-05, 2.224743366241455e-05, 2.367701381444931e-05, 2.510659396648407e-05, 2.653617411851883e-05, 2.796575427055359e-05, 2.939533442258835e-05, 3.082491457462311e-05, 3.225449472665787e-05, 3.368407487869263e-05, 3.5113655030727386e-05, 3.6543235182762146e-05, 3.7972815334796906e-05, 3.9402395486831665e-05, 4.0831975638866425e-05, 4.2261555790901184e-05, 4.3691135942935944e-05, 4.51207160949707e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 0.0, 3.0, 5.0, 6.0, 8.0, 13.0, 17.0, 36.0, 47.0, 70.0, 92.0, 129.0, 216.0, 414.0, 701.0, 1491.0, 3304.0, 8924.0, 30162.0, 142562.0, 547033.0, 244950.0, 47254.0, 12742.0, 4496.0, 1767.0, 860.0, 486.0, 284.0, 174.0, 102.0, 46.0, 55.0, 22.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1761474609375, -0.1709136962890625, -0.165679931640625, -0.1604461669921875, -0.15521240234375, -0.1499786376953125, -0.144744873046875, -0.1395111083984375, -0.13427734375, -0.1290435791015625, -0.123809814453125, -0.1185760498046875, -0.11334228515625, -0.1081085205078125, -0.102874755859375, -0.0976409912109375, -0.0924072265625, -0.0871734619140625, -0.081939697265625, -0.0767059326171875, -0.07147216796875, -0.0662384033203125, -0.061004638671875, -0.0557708740234375, -0.050537109375, -0.0453033447265625, -0.040069580078125, -0.0348358154296875, -0.02960205078125, -0.0243682861328125, -0.019134521484375, -0.0139007568359375, -0.0086669921875, -0.0034332275390625, 0.001800537109375, 0.0070343017578125, 0.01226806640625, 0.0175018310546875, 0.022735595703125, 0.0279693603515625, 0.033203125, 0.0384368896484375, 0.043670654296875, 0.0489044189453125, 0.05413818359375, 0.0593719482421875, 0.064605712890625, 0.0698394775390625, 0.0750732421875, 0.0803070068359375, 0.085540771484375, 0.0907745361328125, 0.09600830078125, 0.1012420654296875, 0.106475830078125, 0.1117095947265625, 0.116943359375, 0.1221771240234375, 0.127410888671875, 0.1326446533203125, 0.13787841796875, 0.1431121826171875, 0.148345947265625, 0.1535797119140625, 0.1588134765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 17.0, 10.0, 21.0, 32.0, 49.0, 62.0, 73.0, 98.0, 88.0, 110.0, 100.0, 93.0, 62.0, 31.0, 27.0, 29.0, 17.0, 14.0, 15.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1875, -0.18230819702148438, -0.17711639404296875, -0.17192459106445312, -0.1667327880859375, -0.16154098510742188, -0.15634918212890625, -0.15115737915039062, -0.145965576171875, -0.14077377319335938, -0.13558197021484375, -0.13039016723632812, -0.1251983642578125, -0.12000656127929688, -0.11481475830078125, -0.10962295532226562, -0.10443115234375, -0.09923934936523438, -0.09404754638671875, -0.08885574340820312, -0.0836639404296875, -0.07847213745117188, -0.07328033447265625, -0.06808853149414062, -0.062896728515625, -0.057704925537109375, -0.05251312255859375, -0.047321319580078125, -0.0421295166015625, -0.036937713623046875, -0.03174591064453125, -0.026554107666015625, -0.0213623046875, -0.016170501708984375, -0.01097869873046875, -0.005786895751953125, -0.0005950927734375, 0.004596710205078125, 0.00978851318359375, 0.014980316162109375, 0.020172119140625, 0.025363922119140625, 0.03055572509765625, 0.035747528076171875, 0.0409393310546875, 0.046131134033203125, 0.05132293701171875, 0.056514739990234375, 0.06170654296875, 0.06689834594726562, 0.07209014892578125, 0.07728195190429688, 0.0824737548828125, 0.08766555786132812, 0.09285736083984375, 0.09804916381835938, 0.103240966796875, 0.10843276977539062, 0.11362457275390625, 0.11881637573242188, 0.1240081787109375, 0.12919998168945312, 0.13439178466796875, 0.13958358764648438, 0.144775390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 16.0, 63.0, 181.0, 290.0, 263.0, 153.0, 27.0, 11.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2634855508804321, -1.082746982574463, -0.9020082950592041, -0.7212697267532349, -0.5405310988426208, -0.35979247093200684, -0.1790539026260376, 0.0016847848892211914, 0.18242335319519043, 0.36316198110580444, 0.5439006090164185, 0.7246391773223877, 0.9053778052330017, 1.0861164331436157, 1.266855001449585, 1.4475936889648438, 1.628332257270813, 1.8090708255767822, 1.989809513092041, 2.1705479621887207, 2.3512866497039795, 2.5320253372192383, 2.712763786315918, 2.893502712249756, 3.0742411613464355, 3.2549798488616943, 3.435718297958374, 3.616456985473633, 3.7971956729888916, 3.9779343605041504, 4.15867280960083, 4.339411735534668, 4.5201497077941895, 4.700888156890869, 4.881627082824707, 5.062365531921387, 5.243103981018066, 5.423842906951904, 5.604581356048584, 5.785320281982422, 5.966058731079102, 6.146797180175781, 6.327536106109619, 6.508274555206299, 6.6890130043029785, 6.869751930236816, 7.050490379333496, 7.231228828430176, 7.4119672775268555, 7.592705726623535, 7.773444652557373, 7.954183101654053, 8.13492202758789, 8.31566047668457, 8.49639892578125, 8.67713737487793, 8.857876777648926, 9.038615226745605, 9.219353675842285, 9.400093078613281, 9.580831527709961, 9.76156997680664, 9.94230842590332, 10.123046875, 10.30378532409668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 7.0, 13.0, 6.0, 24.0, 15.0, 23.0, 17.0, 32.0, 32.0, 32.0, 44.0, 62.0, 45.0, 46.0, 48.0, 47.0, 41.0, 47.0, 43.0, 47.0, 41.0, 39.0, 51.0, 34.0, 29.0, 11.0, 19.0, 16.0, 14.0, 12.0, 9.0, 4.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7388379573822021, -1.6875922679901123, -1.636346459388733, -1.585100769996643, -1.5338549613952637, -1.4826092720031738, -1.431363582611084, -1.3801178932189941, -1.3288720846176147, -1.277626395225525, -1.2263805866241455, -1.1751348972320557, -1.1238892078399658, -1.0726433992385864, -1.0213977098464966, -0.970151960849762, -0.9189062118530273, -0.8676604628562927, -0.8164147138595581, -0.7651690244674683, -0.7139232754707336, -0.662677526473999, -0.6114318370819092, -0.5601860880851746, -0.5089403390884399, -0.4576945900917053, -0.4064488708972931, -0.35520315170288086, -0.30395740270614624, -0.2527116537094116, -0.2014659345149994, -0.15022021532058716, -0.09897446632385254, -0.047728732228279114, 0.0035170018672943115, 0.05476273596286774, 0.10600847005844116, 0.15725421905517578, 0.208499938249588, 0.25974565744400024, 0.31099140644073486, 0.3622371554374695, 0.4134828746318817, 0.46472859382629395, 0.5159743428230286, 0.5672200918197632, 0.618465781211853, 0.6697115302085876, 0.7209572792053223, 0.7722030282020569, 0.8234487771987915, 0.8746944665908813, 0.925940215587616, 0.9771859645843506, 1.0284316539764404, 1.0796773433685303, 1.1309231519699097, 1.1821688413619995, 1.233414649963379, 1.2846603393554688, 1.3359060287475586, 1.387151837348938, 1.4383975267410278, 1.4896433353424072, 1.540889024734497]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 12.0, 9.0, 19.0, 20.0, 36.0, 57.0, 69.0, 85.0, 152.0, 222.0, 366.0, 669.0, 1152.0, 2123.0, 4441.0, 10911.0, 39514.0, 3783656.0, 304383.0, 28948.0, 8917.0, 3840.0, 1998.0, 1020.0, 581.0, 380.0, 232.0, 137.0, 109.0, 56.0, 61.0, 25.0, 23.0, 18.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3593330383300781, -0.34903717041015625, -0.3387413024902344, -0.3284454345703125, -0.3181495666503906, -0.30785369873046875, -0.2975578308105469, -0.287261962890625, -0.2769660949707031, -0.26667022705078125, -0.2563743591308594, -0.2460784912109375, -0.23578262329101562, -0.22548675537109375, -0.21519088745117188, -0.20489501953125, -0.19459915161132812, -0.18430328369140625, -0.17400741577148438, -0.1637115478515625, -0.15341567993164062, -0.14311981201171875, -0.13282394409179688, -0.122528076171875, -0.11223220825195312, -0.10193634033203125, -0.09164047241210938, -0.0813446044921875, -0.07104873657226562, -0.06075286865234375, -0.050457000732421875, -0.0401611328125, -0.029865264892578125, -0.01956939697265625, -0.009273529052734375, 0.0010223388671875, 0.011318206787109375, 0.02161407470703125, 0.031909942626953125, 0.042205810546875, 0.052501678466796875, 0.06279754638671875, 0.07309341430664062, 0.0833892822265625, 0.09368515014648438, 0.10398101806640625, 0.11427688598632812, 0.12457275390625, 0.13486862182617188, 0.14516448974609375, 0.15546035766601562, 0.1657562255859375, 0.17605209350585938, 0.18634796142578125, 0.19664382934570312, 0.206939697265625, 0.21723556518554688, 0.22753143310546875, 0.23782730102539062, 0.2481231689453125, 0.2584190368652344, 0.26871490478515625, 0.2790107727050781, 0.289306640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 5.0, 16.0, 14.0, 9.0, 20.0, 25.0, 20.0, 30.0, 20.0, 32.0, 25.0, 40.0, 39.0, 48.0, 51.0, 46.0, 46.0, 47.0, 50.0, 34.0, 43.0, 47.0, 42.0, 41.0, 25.0, 26.0, 25.0, 22.0, 20.0, 18.0, 17.0, 11.0, 6.0, 2.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.056915283203125, -0.055274009704589844, -0.05363273620605469, -0.05199146270751953, -0.050350189208984375, -0.04870891571044922, -0.04706764221191406, -0.045426368713378906, -0.04378509521484375, -0.042143821716308594, -0.04050254821777344, -0.03886127471923828, -0.037220001220703125, -0.03557872772216797, -0.03393745422363281, -0.032296180725097656, -0.0306549072265625, -0.029013633728027344, -0.027372360229492188, -0.02573108673095703, -0.024089813232421875, -0.02244853973388672, -0.020807266235351562, -0.019165992736816406, -0.01752471923828125, -0.015883445739746094, -0.014242172241210938, -0.012600898742675781, -0.010959625244140625, -0.009318351745605469, -0.0076770782470703125, -0.006035804748535156, -0.00439453125, -0.0027532577514648438, -0.0011119842529296875, 0.0005292892456054688, 0.002170562744140625, 0.0038118362426757812, 0.0054531097412109375, 0.007094383239746094, 0.00873565673828125, 0.010376930236816406, 0.012018203735351562, 0.013659477233886719, 0.015300750732421875, 0.01694202423095703, 0.018583297729492188, 0.020224571228027344, 0.0218658447265625, 0.023507118225097656, 0.025148391723632812, 0.02678966522216797, 0.028430938720703125, 0.03007221221923828, 0.03171348571777344, 0.033354759216308594, 0.03499603271484375, 0.036637306213378906, 0.03827857971191406, 0.03991985321044922, 0.041561126708984375, 0.04320240020751953, 0.04484367370605469, 0.046484947204589844, 0.048126220703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 9.0, 11.0, 15.0, 30.0, 25.0, 43.0, 81.0, 94.0, 184.0, 282.0, 516.0, 1263.0, 4570.0, 51646.0, 4103893.0, 25922.0, 3428.0, 1070.0, 509.0, 248.0, 175.0, 77.0, 64.0, 35.0, 31.0, 19.0, 8.0, 11.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.17449951171875, -1.1370849609375, -1.09967041015625, -1.062255859375, -1.02484130859375, -0.9874267578125, -0.95001220703125, -0.91259765625, -0.87518310546875, -0.8377685546875, -0.80035400390625, -0.762939453125, -0.72552490234375, -0.6881103515625, -0.65069580078125, -0.61328125, -0.57586669921875, -0.5384521484375, -0.50103759765625, -0.463623046875, -0.42620849609375, -0.3887939453125, -0.35137939453125, -0.31396484375, -0.27655029296875, -0.2391357421875, -0.20172119140625, -0.164306640625, -0.12689208984375, -0.0894775390625, -0.05206298828125, -0.0146484375, 0.02276611328125, 0.0601806640625, 0.09759521484375, 0.135009765625, 0.17242431640625, 0.2098388671875, 0.24725341796875, 0.28466796875, 0.32208251953125, 0.3594970703125, 0.39691162109375, 0.434326171875, 0.47174072265625, 0.5091552734375, 0.54656982421875, 0.583984375, 0.62139892578125, 0.6588134765625, 0.69622802734375, 0.733642578125, 0.77105712890625, 0.8084716796875, 0.84588623046875, 0.88330078125, 0.92071533203125, 0.9581298828125, 0.99554443359375, 1.032958984375, 1.07037353515625, 1.1077880859375, 1.14520263671875, 1.1826171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 22.0, 58.0, 114.0, 3468.0, 251.0, 76.0, 24.0, 21.0, 15.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2231426239013672, -0.21752548217773438, -0.21190834045410156, -0.20629119873046875, -0.20067405700683594, -0.19505691528320312, -0.1894397735595703, -0.1838226318359375, -0.1782054901123047, -0.17258834838867188, -0.16697120666503906, -0.16135406494140625, -0.15573692321777344, -0.15011978149414062, -0.1445026397705078, -0.138885498046875, -0.1332683563232422, -0.12765121459960938, -0.12203407287597656, -0.11641693115234375, -0.11079978942871094, -0.10518264770507812, -0.09956550598144531, -0.0939483642578125, -0.08833122253417969, -0.08271408081054688, -0.07709693908691406, -0.07147979736328125, -0.06586265563964844, -0.060245513916015625, -0.05462837219238281, -0.04901123046875, -0.04339408874511719, -0.037776947021484375, -0.03215980529785156, -0.02654266357421875, -0.020925521850585938, -0.015308380126953125, -0.009691238403320312, -0.0040740966796875, 0.0015430450439453125, 0.007160186767578125, 0.012777328491210938, 0.01839447021484375, 0.024011611938476562, 0.029628753662109375, 0.03524589538574219, 0.040863037109375, 0.04648017883300781, 0.052097320556640625, 0.05771446228027344, 0.06333160400390625, 0.06894874572753906, 0.07456588745117188, 0.08018302917480469, 0.0858001708984375, 0.09141731262207031, 0.09703445434570312, 0.10265159606933594, 0.10826873779296875, 0.11388587951660156, 0.11950302124023438, 0.1251201629638672, 0.1307373046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 5.0, 5.0, 10.0, 19.0, 28.0, 50.0, 70.0, 100.0, 137.0, 144.0, 124.0, 115.0, 64.0, 45.0, 38.0, 20.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3986055850982666, -0.38072556257247925, -0.3628455400466919, -0.34496551752090454, -0.3270854949951172, -0.30920547246932983, -0.2913254201412201, -0.27344539761543274, -0.2555653750896454, -0.23768535256385803, -0.21980533003807068, -0.20192529261112213, -0.18404527008533478, -0.16616524755954742, -0.14828521013259888, -0.13040518760681152, -0.11252516508102417, -0.09464514255523682, -0.07676511257886887, -0.058885086327791214, -0.04100506007671356, -0.02312503755092621, -0.005245007574558258, 0.012635022401809692, 0.030515044927597046, 0.0483950711786747, 0.06627509742975235, 0.0841551274061203, 0.10203514993190765, 0.11991517245769501, 0.13779520988464355, 0.1556752324104309, 0.17355531454086304, 0.1914353370666504, 0.20931535959243774, 0.2271953970193863, 0.24507541954517365, 0.2629554271697998, 0.28083547949790955, 0.2987155020236969, 0.31659552454948425, 0.3344755470752716, 0.35235556960105896, 0.3702355921268463, 0.38811564445495605, 0.4059956669807434, 0.42387568950653076, 0.4417557120323181, 0.45963573455810547, 0.4775157570838928, 0.4953957796096802, 0.5132758021354675, 0.5311558246612549, 0.5490358471870422, 0.5669158697128296, 0.5847959518432617, 0.6026759147644043, 0.6205559372901917, 0.638435959815979, 0.6563159823417664, 0.6741960048675537, 0.6920760273933411, 0.7099560499191284, 0.7278361320495605, 0.7457161545753479]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 8.0, 16.0, 16.0, 24.0, 25.0, 24.0, 27.0, 32.0, 38.0, 41.0, 33.0, 34.0, 47.0, 41.0, 48.0, 48.0, 45.0, 54.0, 49.0, 49.0, 36.0, 33.0, 25.0, 27.0, 26.0, 27.0, 14.0, 24.0, 18.0, 13.0, 9.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24449318647384644, -0.23632627725601196, -0.2281593531370163, -0.21999244391918182, -0.21182551980018616, -0.20365861058235168, -0.1954917013645172, -0.18732477724552155, -0.17915785312652588, -0.1709909439086914, -0.16282401978969574, -0.15465711057186127, -0.1464901864528656, -0.13832327723503113, -0.13015636801719666, -0.12198944389820099, -0.11382253468036652, -0.10565561801195145, -0.09748870134353638, -0.0893217921257019, -0.08115486800670624, -0.07298795878887177, -0.0648210421204567, -0.056654125452041626, -0.048487208783626556, -0.04032029211521149, -0.03215337544679642, -0.023986462503671646, -0.015819545835256577, -0.007652629166841507, 0.0005142837762832642, 0.008681200444698334, 0.016848117113113403, 0.025015033781528473, 0.03318195044994354, 0.041348863393068314, 0.04951578006148338, 0.05768269672989845, 0.06584960967302322, 0.0740165263414383, 0.08218344300985336, 0.09035035967826843, 0.0985172763466835, 0.10668419301509857, 0.11485110223293304, 0.12301802635192871, 0.13118493556976318, 0.13935184478759766, 0.14751876890659332, 0.1556856781244278, 0.16385260224342346, 0.17201951146125793, 0.1801864355802536, 0.18835334479808807, 0.19652026891708374, 0.2046871781349182, 0.21285408735275269, 0.22102099657058716, 0.22918792068958282, 0.2373548299074173, 0.24552175402641296, 0.25368866324424744, 0.2618555724620819, 0.27002251148223877, 0.27818942070007324]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 9.0, 10.0, 20.0, 18.0, 30.0, 45.0, 71.0, 116.0, 201.0, 284.0, 471.0, 897.0, 1483.0, 2951.0, 6036.0, 12721.0, 28624.0, 64834.0, 139165.0, 246519.0, 257969.0, 154013.0, 71669.0, 31886.0, 14397.0, 6790.0, 3235.0, 1777.0, 946.0, 512.0, 282.0, 210.0, 129.0, 90.0, 46.0, 40.0, 20.0, 15.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.18896484375, -0.1835765838623047, -0.17818832397460938, -0.17280006408691406, -0.16741180419921875, -0.16202354431152344, -0.15663528442382812, -0.1512470245361328, -0.1458587646484375, -0.1404705047607422, -0.13508224487304688, -0.12969398498535156, -0.12430572509765625, -0.11891746520996094, -0.11352920532226562, -0.10814094543457031, -0.102752685546875, -0.09736442565917969, -0.09197616577148438, -0.08658790588378906, -0.08119964599609375, -0.07581138610839844, -0.07042312622070312, -0.06503486633300781, -0.0596466064453125, -0.05425834655761719, -0.048870086669921875, -0.04348182678222656, -0.03809356689453125, -0.03270530700683594, -0.027317047119140625, -0.021928787231445312, -0.01654052734375, -0.011152267456054688, -0.005764007568359375, -0.0003757476806640625, 0.00501251220703125, 0.010400772094726562, 0.015789031982421875, 0.021177291870117188, 0.0265655517578125, 0.03195381164550781, 0.037342071533203125, 0.04273033142089844, 0.04811859130859375, 0.05350685119628906, 0.058895111083984375, 0.06428337097167969, 0.069671630859375, 0.07505989074707031, 0.08044815063476562, 0.08583641052246094, 0.09122467041015625, 0.09661293029785156, 0.10200119018554688, 0.10738945007324219, 0.1127777099609375, 0.11816596984863281, 0.12355422973632812, 0.12894248962402344, 0.13433074951171875, 0.13971900939941406, 0.14510726928710938, 0.1504955291748047, 0.1558837890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 8.0, 12.0, 14.0, 20.0, 19.0, 32.0, 34.0, 34.0, 31.0, 44.0, 35.0, 59.0, 53.0, 55.0, 63.0, 56.0, 56.0, 42.0, 45.0, 47.0, 43.0, 44.0, 27.0, 32.0, 17.0, 17.0, 12.0, 11.0, 2.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.0791482925415039, -0.07669258117675781, -0.07423686981201172, -0.07178115844726562, -0.06932544708251953, -0.06686973571777344, -0.06441402435302734, -0.06195831298828125, -0.059502601623535156, -0.05704689025878906, -0.05459117889404297, -0.052135467529296875, -0.04967975616455078, -0.04722404479980469, -0.044768333435058594, -0.0423126220703125, -0.039856910705566406, -0.03740119934082031, -0.03494548797607422, -0.032489776611328125, -0.03003406524658203, -0.027578353881835938, -0.025122642517089844, -0.02266693115234375, -0.020211219787597656, -0.017755508422851562, -0.015299797058105469, -0.012844085693359375, -0.010388374328613281, -0.007932662963867188, -0.005476951599121094, -0.003021240234375, -0.0005655288696289062, 0.0018901824951171875, 0.004345893859863281, 0.006801605224609375, 0.009257316589355469, 0.011713027954101562, 0.014168739318847656, 0.01662445068359375, 0.019080162048339844, 0.021535873413085938, 0.02399158477783203, 0.026447296142578125, 0.02890300750732422, 0.03135871887207031, 0.033814430236816406, 0.0362701416015625, 0.038725852966308594, 0.04118156433105469, 0.04363727569580078, 0.046092987060546875, 0.04854869842529297, 0.05100440979003906, 0.053460121154785156, 0.05591583251953125, 0.058371543884277344, 0.06082725524902344, 0.06328296661376953, 0.06573867797851562, 0.06819438934326172, 0.07065010070800781, 0.0731058120727539, 0.0755615234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 14.0, 17.0, 26.0, 42.0, 58.0, 76.0, 125.0, 156.0, 220.0, 356.0, 590.0, 1095.0, 2266.0, 6164.0, 24554.0, 139184.0, 574057.0, 243029.0, 41159.0, 9096.0, 2872.0, 1306.0, 724.0, 422.0, 288.0, 177.0, 130.0, 82.0, 66.0, 47.0, 33.0, 20.0, 20.0, 16.0, 8.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3851776123046875, -0.373382568359375, -0.3615875244140625, -0.34979248046875, -0.3379974365234375, -0.326202392578125, -0.3144073486328125, -0.3026123046875, -0.2908172607421875, -0.279022216796875, -0.2672271728515625, -0.25543212890625, -0.2436370849609375, -0.231842041015625, -0.2200469970703125, -0.208251953125, -0.1964569091796875, -0.184661865234375, -0.1728668212890625, -0.16107177734375, -0.1492767333984375, -0.137481689453125, -0.1256866455078125, -0.1138916015625, -0.1020965576171875, -0.090301513671875, -0.0785064697265625, -0.06671142578125, -0.0549163818359375, -0.043121337890625, -0.0313262939453125, -0.01953125, -0.0077362060546875, 0.004058837890625, 0.0158538818359375, 0.02764892578125, 0.0394439697265625, 0.051239013671875, 0.0630340576171875, 0.0748291015625, 0.0866241455078125, 0.098419189453125, 0.1102142333984375, 0.12200927734375, 0.1338043212890625, 0.145599365234375, 0.1573944091796875, 0.169189453125, 0.1809844970703125, 0.192779541015625, 0.2045745849609375, 0.21636962890625, 0.2281646728515625, 0.239959716796875, 0.2517547607421875, 0.2635498046875, 0.2753448486328125, 0.287139892578125, 0.2989349365234375, 0.31072998046875, 0.3225250244140625, 0.334320068359375, 0.3461151123046875, 0.35791015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 17.0, 13.0, 16.0, 14.0, 20.0, 22.0, 22.0, 31.0, 24.0, 35.0, 37.0, 46.0, 38.0, 45.0, 41.0, 43.0, 38.0, 43.0, 32.0, 43.0, 47.0, 37.0, 30.0, 24.0, 26.0, 31.0, 21.0, 23.0, 23.0, 22.0, 13.0, 11.0, 15.0, 9.0, 10.0, 7.0, 0.0, 1.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.427978515625, -0.416259765625, -0.404541015625, -0.392822265625, -0.381103515625, -0.369384765625, -0.357666015625, -0.345947265625, -0.334228515625, -0.322509765625, -0.310791015625, -0.299072265625, -0.287353515625, -0.275634765625, -0.263916015625, -0.252197265625, -0.240478515625, -0.228759765625, -0.217041015625, -0.205322265625, -0.193603515625, -0.181884765625, -0.170166015625, -0.158447265625, -0.146728515625, -0.135009765625, -0.123291015625, -0.111572265625, -0.099853515625, -0.088134765625, -0.076416015625, -0.064697265625, -0.052978515625, -0.041259765625, -0.029541015625, -0.017822265625, -0.006103515625, 0.005615234375, 0.017333984375, 0.029052734375, 0.040771484375, 0.052490234375, 0.064208984375, 0.075927734375, 0.087646484375, 0.099365234375, 0.111083984375, 0.122802734375, 0.134521484375, 0.146240234375, 0.157958984375, 0.169677734375, 0.181396484375, 0.193115234375, 0.204833984375, 0.216552734375, 0.228271484375, 0.239990234375, 0.251708984375, 0.263427734375, 0.275146484375, 0.286865234375, 0.298583984375, 0.310302734375, 0.322021484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 9.0, 15.0, 11.0, 32.0, 49.0, 75.0, 99.0, 170.0, 262.0, 430.0, 792.0, 1485.0, 3002.0, 7105.0, 19581.0, 69625.0, 310408.0, 473215.0, 114843.0, 29439.0, 9710.0, 4014.0, 1868.0, 970.0, 528.0, 288.0, 153.0, 124.0, 80.0, 54.0, 31.0, 22.0, 17.0, 2.0, 7.0, 9.0, 12.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.192138671875, -0.18696975708007812, -0.18180084228515625, -0.17663192749023438, -0.1714630126953125, -0.16629409790039062, -0.16112518310546875, -0.15595626831054688, -0.150787353515625, -0.14561843872070312, -0.14044952392578125, -0.13528060913085938, -0.1301116943359375, -0.12494277954101562, -0.11977386474609375, -0.11460494995117188, -0.10943603515625, -0.10426712036132812, -0.09909820556640625, -0.09392929077148438, -0.0887603759765625, -0.08359146118164062, -0.07842254638671875, -0.07325363159179688, -0.068084716796875, -0.06291580200195312, -0.05774688720703125, -0.052577972412109375, -0.0474090576171875, -0.042240142822265625, -0.03707122802734375, -0.031902313232421875, -0.0267333984375, -0.021564483642578125, -0.01639556884765625, -0.011226654052734375, -0.0060577392578125, -0.000888824462890625, 0.00428009033203125, 0.009449005126953125, 0.014617919921875, 0.019786834716796875, 0.02495574951171875, 0.030124664306640625, 0.0352935791015625, 0.040462493896484375, 0.04563140869140625, 0.050800323486328125, 0.05596923828125, 0.061138153076171875, 0.06630706787109375, 0.07147598266601562, 0.0766448974609375, 0.08181381225585938, 0.08698272705078125, 0.09215164184570312, 0.097320556640625, 0.10248947143554688, 0.10765838623046875, 0.11282730102539062, 0.1179962158203125, 0.12316513061523438, 0.12833404541015625, 0.13350296020507812, 0.138671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 9.0, 21.0, 15.0, 28.0, 43.0, 50.0, 48.0, 66.0, 79.0, 72.0, 72.0, 76.0, 77.0, 70.0, 50.0, 59.0, 41.0, 21.0, 26.0, 13.0, 13.0, 15.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.458427429199219e-05, -4.2698346078395844e-05, -4.08124178647995e-05, -3.8926489651203156e-05, -3.704056143760681e-05, -3.515463322401047e-05, -3.3268705010414124e-05, -3.138277679681778e-05, -2.9496848583221436e-05, -2.761092036962509e-05, -2.5724992156028748e-05, -2.3839063942432404e-05, -2.195313572883606e-05, -2.0067207515239716e-05, -1.818127930164337e-05, -1.6295351088047028e-05, -1.4409422874450684e-05, -1.252349466085434e-05, -1.0637566447257996e-05, -8.751638233661652e-06, -6.865710020065308e-06, -4.979781806468964e-06, -3.0938535928726196e-06, -1.2079253792762756e-06, 6.780028343200684e-07, 2.5639310479164124e-06, 4.449859261512756e-06, 6.3357874751091e-06, 8.221715688705444e-06, 1.0107643902301788e-05, 1.1993572115898132e-05, 1.3879500329494476e-05, 1.576542854309082e-05, 1.7651356756687164e-05, 1.9537284970283508e-05, 2.1423213183879852e-05, 2.3309141397476196e-05, 2.519506961107254e-05, 2.7080997824668884e-05, 2.8966926038265228e-05, 3.085285425186157e-05, 3.2738782465457916e-05, 3.462471067905426e-05, 3.6510638892650604e-05, 3.839656710624695e-05, 4.028249531984329e-05, 4.2168423533439636e-05, 4.405435174703598e-05, 4.5940279960632324e-05, 4.782620817422867e-05, 4.971213638782501e-05, 5.1598064601421356e-05, 5.34839928150177e-05, 5.5369921028614044e-05, 5.725584924221039e-05, 5.914177745580673e-05, 6.1027705669403076e-05, 6.291363388299942e-05, 6.479956209659576e-05, 6.668549031019211e-05, 6.857141852378845e-05, 7.04573467373848e-05, 7.234327495098114e-05, 7.422920316457748e-05, 7.611513137817383e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 14.0, 18.0, 32.0, 50.0, 78.0, 145.0, 227.0, 484.0, 1203.0, 3606.0, 16141.0, 146322.0, 730744.0, 128888.0, 15009.0, 3399.0, 1181.0, 451.0, 242.0, 128.0, 61.0, 49.0, 24.0, 26.0, 10.0, 5.0, 1.0, 0.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.34808921813964844, -0.3394889831542969, -0.3308887481689453, -0.32228851318359375, -0.3136882781982422, -0.3050880432128906, -0.29648780822753906, -0.2878875732421875, -0.27928733825683594, -0.2706871032714844, -0.2620868682861328, -0.25348663330078125, -0.2448863983154297, -0.23628616333007812, -0.22768592834472656, -0.219085693359375, -0.21048545837402344, -0.20188522338867188, -0.1932849884033203, -0.18468475341796875, -0.1760845184326172, -0.16748428344726562, -0.15888404846191406, -0.1502838134765625, -0.14168357849121094, -0.13308334350585938, -0.12448310852050781, -0.11588287353515625, -0.10728263854980469, -0.09868240356445312, -0.09008216857910156, -0.08148193359375, -0.07288169860839844, -0.06428146362304688, -0.05568122863769531, -0.04708099365234375, -0.03848075866699219, -0.029880523681640625, -0.021280288696289062, -0.0126800537109375, -0.0040798187255859375, 0.004520416259765625, 0.013120651245117188, 0.02172088623046875, 0.030321121215820312, 0.038921356201171875, 0.04752159118652344, 0.056121826171875, 0.06472206115722656, 0.07332229614257812, 0.08192253112792969, 0.09052276611328125, 0.09912300109863281, 0.10772323608398438, 0.11632347106933594, 0.1249237060546875, 0.13352394104003906, 0.14212417602539062, 0.1507244110107422, 0.15932464599609375, 0.1679248809814453, 0.17652511596679688, 0.18512535095214844, 0.1937255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 8.0, 2.0, 3.0, 6.0, 11.0, 16.0, 26.0, 46.0, 40.0, 57.0, 70.0, 113.0, 103.0, 105.0, 95.0, 77.0, 66.0, 52.0, 39.0, 28.0, 14.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3070049285888672, -0.2995567321777344, -0.29210853576660156, -0.28466033935546875, -0.27721214294433594, -0.2697639465332031, -0.2623157501220703, -0.2548675537109375, -0.2474193572998047, -0.23997116088867188, -0.23252296447753906, -0.22507476806640625, -0.21762657165527344, -0.21017837524414062, -0.2027301788330078, -0.195281982421875, -0.1878337860107422, -0.18038558959960938, -0.17293739318847656, -0.16548919677734375, -0.15804100036621094, -0.15059280395507812, -0.1431446075439453, -0.1356964111328125, -0.1282482147216797, -0.12080001831054688, -0.11335182189941406, -0.10590362548828125, -0.09845542907714844, -0.09100723266601562, -0.08355903625488281, -0.07611083984375, -0.06866264343261719, -0.061214447021484375, -0.05376625061035156, -0.04631805419921875, -0.03886985778808594, -0.031421661376953125, -0.023973464965820312, -0.0165252685546875, -0.009077072143554688, -0.001628875732421875, 0.0058193206787109375, 0.01326751708984375, 0.020715713500976562, 0.028163909912109375, 0.03561210632324219, 0.043060302734375, 0.05050849914550781, 0.057956695556640625, 0.06540489196777344, 0.07285308837890625, 0.08030128479003906, 0.08774948120117188, 0.09519767761230469, 0.1026458740234375, 0.11009407043457031, 0.11754226684570312, 0.12499046325683594, 0.13243865966796875, 0.13988685607910156, 0.14733505249023438, 0.1547832489013672, 0.1622314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 20.0, 28.0, 48.0, 101.0, 150.0, 168.0, 144.0, 132.0, 77.0, 63.0, 28.0, 15.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.422314167022705, -3.3121464252471924, -3.2019784450531006, -3.091810703277588, -2.981642961502075, -2.8714752197265625, -2.7613072395324707, -2.651139497756958, -2.5409717559814453, -2.4308040142059326, -2.320636034011841, -2.210468292236328, -2.1003005504608154, -1.9901326894760132, -1.879964828491211, -1.7697970867156982, -1.6596291065216064, -1.5494612455368042, -1.4392935037612915, -1.3291256427764893, -1.2189579010009766, -1.1087900400161743, -0.9986221790313721, -0.8884543776512146, -0.7782865762710571, -0.6681187748908997, -0.5579509735107422, -0.44778311252593994, -0.33761531114578247, -0.227447509765625, -0.11727964878082275, -0.007111847400665283, 0.10305595397949219, 0.21322377026081085, 0.3233915865421295, 0.4335594177246094, 0.5437272191047668, 0.6538950204849243, 0.7640628814697266, 0.874230682849884, 0.9843984842300415, 1.0945663452148438, 1.2047340869903564, 1.3149019479751587, 1.425069808959961, 1.5352375507354736, 1.6454054117202759, 1.7555732727050781, 1.8657410144805908, 1.975908875465393, 2.0860767364501953, 2.196244478225708, 2.3064122200012207, 2.4165802001953125, 2.526747941970825, 2.636915683746338, 2.7470836639404297, 2.8572514057159424, 2.967419385910034, 3.077587127685547, 3.1877548694610596, 3.2979226112365723, 3.408090591430664, 3.5182583332061768, 3.6284260749816895]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 4.0, 10.0, 7.0, 9.0, 11.0, 17.0, 17.0, 15.0, 17.0, 18.0, 26.0, 43.0, 36.0, 36.0, 41.0, 48.0, 37.0, 42.0, 57.0, 63.0, 68.0, 63.0, 40.0, 38.0, 28.0, 21.0, 26.0, 34.0, 25.0, 17.0, 21.0, 16.0, 11.0, 5.0, 8.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2215898036956787, -2.1516826152801514, -2.081775426864624, -2.0118682384490967, -1.9419611692428589, -1.8720539808273315, -1.8021469116210938, -1.7322397232055664, -1.662332534790039, -1.5924253463745117, -1.5225181579589844, -1.4526110887527466, -1.3827039003372192, -1.312796711921692, -1.242889642715454, -1.1729824542999268, -1.1030752658843994, -1.033168077468872, -0.9632609486579895, -0.8933538198471069, -0.8234466314315796, -0.7535394430160522, -0.6836323142051697, -0.6137251853942871, -0.5438179969787598, -0.4739108383655548, -0.40400367975234985, -0.3340965211391449, -0.26418936252593994, -0.19428220391273499, -0.12437504529953003, -0.05446788668632507, 0.015439033508300781, 0.08534619212150574, 0.1552533507347107, 0.22516050934791565, 0.2950676679611206, 0.36497482657432556, 0.4348819851875305, 0.5047891139984131, 0.5746963024139404, 0.6446034908294678, 0.7145106196403503, 0.7844177484512329, 0.8543249368667603, 0.9242321252822876, 0.9941392540931702, 1.0640463829040527, 1.13395357131958, 1.2038607597351074, 1.2737679481506348, 1.3436750173568726, 1.4135822057724, 1.4834893941879272, 1.553396463394165, 1.6233036518096924, 1.6932108402252197, 1.763118028640747, 1.8330252170562744, 1.9029322862625122, 1.9728394746780396, 2.0427465438842773, 2.1126537322998047, 2.182560920715332, 2.2524681091308594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 14.0, 17.0, 19.0, 34.0, 36.0, 54.0, 91.0, 115.0, 152.0, 171.0, 295.0, 441.0, 657.0, 1004.0, 1652.0, 2742.0, 5049.0, 10061.0, 23905.0, 93171.0, 3890199.0, 114323.0, 26172.0, 10616.0, 5372.0, 2937.0, 1732.0, 1036.0, 683.0, 410.0, 346.0, 200.0, 140.0, 105.0, 78.0, 61.0, 49.0, 23.0, 27.0, 16.0, 13.0, 6.0, 8.0, 8.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.275390625, -0.26692962646484375, -0.2584686279296875, -0.25000762939453125, -0.241546630859375, -0.23308563232421875, -0.2246246337890625, -0.21616363525390625, -0.20770263671875, -0.19924163818359375, -0.1907806396484375, -0.18231964111328125, -0.173858642578125, -0.16539764404296875, -0.1569366455078125, -0.14847564697265625, -0.1400146484375, -0.13155364990234375, -0.1230926513671875, -0.11463165283203125, -0.106170654296875, -0.09770965576171875, -0.0892486572265625, -0.08078765869140625, -0.07232666015625, -0.06386566162109375, -0.0554046630859375, -0.04694366455078125, -0.038482666015625, -0.03002166748046875, -0.0215606689453125, -0.01309967041015625, -0.004638671875, 0.00382232666015625, 0.0122833251953125, 0.02074432373046875, 0.029205322265625, 0.03766632080078125, 0.0461273193359375, 0.05458831787109375, 0.06304931640625, 0.07151031494140625, 0.0799713134765625, 0.08843231201171875, 0.096893310546875, 0.10535430908203125, 0.1138153076171875, 0.12227630615234375, 0.1307373046875, 0.13919830322265625, 0.1476593017578125, 0.15612030029296875, 0.164581298828125, 0.17304229736328125, 0.1815032958984375, 0.18996429443359375, 0.19842529296875, 0.20688629150390625, 0.2153472900390625, 0.22380828857421875, 0.232269287109375, 0.24073028564453125, 0.2491912841796875, 0.25765228271484375, 0.26611328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 11.0, 13.0, 16.0, 21.0, 20.0, 24.0, 28.0, 32.0, 45.0, 49.0, 47.0, 49.0, 65.0, 57.0, 74.0, 45.0, 50.0, 39.0, 34.0, 43.0, 44.0, 38.0, 29.0, 20.0, 19.0, 7.0, 14.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 0.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0899658203125, -0.08747100830078125, -0.0849761962890625, -0.08248138427734375, -0.079986572265625, -0.07749176025390625, -0.0749969482421875, -0.07250213623046875, -0.07000732421875, -0.06751251220703125, -0.0650177001953125, -0.06252288818359375, -0.060028076171875, -0.05753326416015625, -0.0550384521484375, -0.05254364013671875, -0.050048828125, -0.04755401611328125, -0.0450592041015625, -0.04256439208984375, -0.040069580078125, -0.03757476806640625, -0.0350799560546875, -0.03258514404296875, -0.03009033203125, -0.02759552001953125, -0.0251007080078125, -0.02260589599609375, -0.020111083984375, -0.01761627197265625, -0.0151214599609375, -0.01262664794921875, -0.0101318359375, -0.00763702392578125, -0.0051422119140625, -0.00264739990234375, -0.000152587890625, 0.00234222412109375, 0.0048370361328125, 0.00733184814453125, 0.00982666015625, 0.01232147216796875, 0.0148162841796875, 0.01731109619140625, 0.019805908203125, 0.02230072021484375, 0.0247955322265625, 0.02729034423828125, 0.02978515625, 0.03227996826171875, 0.0347747802734375, 0.03726959228515625, 0.039764404296875, 0.04225921630859375, 0.0447540283203125, 0.04724884033203125, 0.04974365234375, 0.05223846435546875, 0.0547332763671875, 0.05722808837890625, 0.059722900390625, 0.06221771240234375, 0.0647125244140625, 0.06720733642578125, 0.0697021484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 10.0, 13.0, 14.0, 10.0, 27.0, 34.0, 50.0, 66.0, 70.0, 95.0, 124.0, 184.0, 235.0, 340.0, 487.0, 688.0, 1090.0, 1788.0, 3130.0, 6214.0, 14423.0, 42087.0, 277286.0, 3728689.0, 76521.0, 21432.0, 8687.0, 4117.0, 2203.0, 1237.0, 851.0, 589.0, 371.0, 309.0, 222.0, 144.0, 98.0, 97.0, 52.0, 38.0, 36.0, 31.0, 27.0, 19.0, 7.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.393798828125, -0.38228607177734375, -0.3707733154296875, -0.35926055908203125, -0.347747802734375, -0.33623504638671875, -0.3247222900390625, -0.31320953369140625, -0.30169677734375, -0.29018402099609375, -0.2786712646484375, -0.26715850830078125, -0.255645751953125, -0.24413299560546875, -0.2326202392578125, -0.22110748291015625, -0.2095947265625, -0.19808197021484375, -0.1865692138671875, -0.17505645751953125, -0.163543701171875, -0.15203094482421875, -0.1405181884765625, -0.12900543212890625, -0.11749267578125, -0.10597991943359375, -0.0944671630859375, -0.08295440673828125, -0.071441650390625, -0.05992889404296875, -0.0484161376953125, -0.03690338134765625, -0.025390625, -0.01387786865234375, -0.0023651123046875, 0.00914764404296875, 0.020660400390625, 0.03217315673828125, 0.0436859130859375, 0.05519866943359375, 0.06671142578125, 0.07822418212890625, 0.0897369384765625, 0.10124969482421875, 0.112762451171875, 0.12427520751953125, 0.1357879638671875, 0.14730072021484375, 0.1588134765625, 0.17032623291015625, 0.1818389892578125, 0.19335174560546875, 0.204864501953125, 0.21637725830078125, 0.2278900146484375, 0.23940277099609375, 0.25091552734375, 0.26242828369140625, 0.2739410400390625, 0.28545379638671875, 0.296966552734375, 0.30847930908203125, 0.3199920654296875, 0.33150482177734375, 0.343017578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 8.0, 16.0, 47.0, 68.0, 148.0, 2850.0, 600.0, 130.0, 56.0, 38.0, 14.0, 19.0, 15.0, 8.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1231689453125, -0.1195383071899414, -0.11590766906738281, -0.11227703094482422, -0.10864639282226562, -0.10501575469970703, -0.10138511657714844, -0.09775447845458984, -0.09412384033203125, -0.09049320220947266, -0.08686256408691406, -0.08323192596435547, -0.07960128784179688, -0.07597064971923828, -0.07234001159667969, -0.0687093734741211, -0.0650787353515625, -0.061448097229003906, -0.05781745910644531, -0.05418682098388672, -0.050556182861328125, -0.04692554473876953, -0.04329490661621094, -0.039664268493652344, -0.03603363037109375, -0.032402992248535156, -0.028772354125976562, -0.02514171600341797, -0.021511077880859375, -0.01788043975830078, -0.014249801635742188, -0.010619163513183594, -0.006988525390625, -0.0033578872680664062, 0.0002727508544921875, 0.0039033889770507812, 0.007534027099609375, 0.011164665222167969, 0.014795303344726562, 0.018425941467285156, 0.02205657958984375, 0.025687217712402344, 0.029317855834960938, 0.03294849395751953, 0.036579132080078125, 0.04020977020263672, 0.04384040832519531, 0.047471046447753906, 0.0511016845703125, 0.054732322692871094, 0.05836296081542969, 0.06199359893798828, 0.06562423706054688, 0.06925487518310547, 0.07288551330566406, 0.07651615142822266, 0.08014678955078125, 0.08377742767333984, 0.08740806579589844, 0.09103870391845703, 0.09466934204101562, 0.09829998016357422, 0.10193061828613281, 0.1055612564086914, 0.10919189453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 11.0, 14.0, 22.0, 48.0, 87.0, 118.0, 132.0, 143.0, 151.0, 86.0, 74.0, 47.0, 24.0, 14.0, 13.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.664283275604248, -0.6442078351974487, -0.6241323947906494, -0.6040569543838501, -0.5839815139770508, -0.5639060735702515, -0.5438306331634521, -0.5237551927566528, -0.5036797523498535, -0.4836043119430542, -0.4635288715362549, -0.44345343112945557, -0.42337799072265625, -0.40330255031585693, -0.38322708010673523, -0.3631516396999359, -0.3430761694908142, -0.3230007290840149, -0.3029252886772156, -0.28284984827041626, -0.26277440786361694, -0.24269895255565643, -0.22262349724769592, -0.2025480568408966, -0.1824726164340973, -0.16239717602729797, -0.14232173562049866, -0.12224628031253815, -0.10217083990573883, -0.08209539949893951, -0.0620199516415596, -0.04194450378417969, -0.02186906337738037, -0.0017936192452907562, 0.01828182488679886, 0.038357269018888474, 0.05843271315097809, 0.0785081535577774, 0.09858360141515732, 0.11865904927253723, 0.13873448967933655, 0.15880993008613586, 0.17888537049293518, 0.1989608258008957, 0.219036266207695, 0.23911170661449432, 0.25918716192245483, 0.27926260232925415, 0.29933804273605347, 0.3194134831428528, 0.3394889235496521, 0.3595643639564514, 0.37963980436325073, 0.39971524477005005, 0.41979071497917175, 0.43986615538597107, 0.4599415957927704, 0.4800170361995697, 0.5000925064086914, 0.5201679468154907, 0.54024338722229, 0.5603188276290894, 0.5803942680358887, 0.600469708442688, 0.6205451488494873]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 18.0, 6.0, 17.0, 16.0, 17.0, 30.0, 30.0, 28.0, 30.0, 53.0, 46.0, 41.0, 45.0, 53.0, 40.0, 51.0, 54.0, 40.0, 34.0, 37.0, 36.0, 30.0, 36.0, 24.0, 21.0, 23.0, 19.0, 20.0, 15.0, 16.0, 8.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24712252616882324, -0.23897069692611694, -0.23081886768341064, -0.22266703844070435, -0.21451520919799805, -0.20636337995529175, -0.19821156561374664, -0.19005973637104034, -0.18190790712833405, -0.17375607788562775, -0.16560424864292145, -0.15745241940021515, -0.14930060505867004, -0.14114877581596375, -0.13299694657325745, -0.12484511733055115, -0.11669328808784485, -0.10854145884513855, -0.10038962960243225, -0.09223780781030655, -0.08408597856760025, -0.07593414932489395, -0.06778232753276825, -0.05963049829006195, -0.05147866904735565, -0.04332683980464935, -0.03517501428723335, -0.027023186907172203, -0.018871359527111053, -0.010719530284404755, -0.0025677047669887543, 0.005584120750427246, 0.013735949993133545, 0.021887777373194695, 0.030039604753255844, 0.038191430270671844, 0.04634325951337814, 0.05449508875608444, 0.06264691054821014, 0.07079873979091644, 0.07895056903362274, 0.08710239827632904, 0.09525422751903534, 0.10340604931116104, 0.11155787855386734, 0.11970970779657364, 0.12786152958869934, 0.13601335883140564, 0.14416518807411194, 0.15231701731681824, 0.16046884655952454, 0.16862067580223083, 0.17677250504493713, 0.18492433428764343, 0.19307614862918854, 0.20122797787189484, 0.20937980711460114, 0.21753163635730743, 0.22568346560001373, 0.23383529484272003, 0.24198710918426514, 0.25013893842697144, 0.25829076766967773, 0.26644259691238403, 0.27459442615509033]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 7.0, 23.0, 33.0, 45.0, 56.0, 109.0, 131.0, 215.0, 352.0, 594.0, 985.0, 1821.0, 3743.0, 7604.0, 16482.0, 38018.0, 87788.0, 197588.0, 308220.0, 211601.0, 96561.0, 41579.0, 17920.0, 8363.0, 3890.0, 2053.0, 1128.0, 612.0, 369.0, 240.0, 149.0, 85.0, 52.0, 37.0, 33.0, 21.0, 6.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13544654846191406, -0.13014602661132812, -0.12484550476074219, -0.11954498291015625, -0.11424446105957031, -0.10894393920898438, -0.10364341735839844, -0.0983428955078125, -0.09304237365722656, -0.08774185180664062, -0.08244132995605469, -0.07714080810546875, -0.07184028625488281, -0.06653976440429688, -0.06123924255371094, -0.055938720703125, -0.05063819885253906, -0.045337677001953125, -0.04003715515136719, -0.03473663330078125, -0.029436111450195312, -0.024135589599609375, -0.018835067749023438, -0.0135345458984375, -0.008234024047851562, -0.002933502197265625, 0.0023670196533203125, 0.00766754150390625, 0.012968063354492188, 0.018268585205078125, 0.023569107055664062, 0.02886962890625, 0.03417015075683594, 0.039470672607421875, 0.04477119445800781, 0.05007171630859375, 0.05537223815917969, 0.060672760009765625, 0.06597328186035156, 0.0712738037109375, 0.07657432556152344, 0.08187484741210938, 0.08717536926269531, 0.09247589111328125, 0.09777641296386719, 0.10307693481445312, 0.10837745666503906, 0.113677978515625, 0.11897850036621094, 0.12427902221679688, 0.1295795440673828, 0.13488006591796875, 0.1401805877685547, 0.14548110961914062, 0.15078163146972656, 0.1560821533203125, 0.16138267517089844, 0.16668319702148438, 0.1719837188720703, 0.17728424072265625, 0.1825847625732422, 0.18788528442382812, 0.19318580627441406, 0.198486328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 9.0, 11.0, 22.0, 14.0, 26.0, 24.0, 36.0, 33.0, 42.0, 37.0, 56.0, 52.0, 60.0, 48.0, 66.0, 54.0, 55.0, 58.0, 47.0, 49.0, 37.0, 35.0, 24.0, 28.0, 14.0, 15.0, 8.0, 5.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1072998046875, -0.10440826416015625, -0.1015167236328125, -0.09862518310546875, -0.095733642578125, -0.09284210205078125, -0.0899505615234375, -0.08705902099609375, -0.08416748046875, -0.08127593994140625, -0.0783843994140625, -0.07549285888671875, -0.072601318359375, -0.06970977783203125, -0.0668182373046875, -0.06392669677734375, -0.06103515625, -0.05814361572265625, -0.0552520751953125, -0.05236053466796875, -0.049468994140625, -0.04657745361328125, -0.0436859130859375, -0.04079437255859375, -0.03790283203125, -0.03501129150390625, -0.0321197509765625, -0.02922821044921875, -0.026336669921875, -0.02344512939453125, -0.0205535888671875, -0.01766204833984375, -0.0147705078125, -0.01187896728515625, -0.0089874267578125, -0.00609588623046875, -0.003204345703125, -0.00031280517578125, 0.0025787353515625, 0.00547027587890625, 0.00836181640625, 0.01125335693359375, 0.0141448974609375, 0.01703643798828125, 0.019927978515625, 0.02281951904296875, 0.0257110595703125, 0.02860260009765625, 0.031494140625, 0.03438568115234375, 0.0372772216796875, 0.04016876220703125, 0.043060302734375, 0.04595184326171875, 0.0488433837890625, 0.05173492431640625, 0.05462646484375, 0.05751800537109375, 0.0604095458984375, 0.06330108642578125, 0.066192626953125, 0.06908416748046875, 0.0719757080078125, 0.07486724853515625, 0.0777587890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 18.0, 19.0, 18.0, 30.0, 34.0, 81.0, 108.0, 154.0, 233.0, 378.0, 619.0, 1224.0, 2945.0, 10044.0, 59200.0, 529415.0, 388520.0, 42346.0, 7963.0, 2539.0, 1062.0, 561.0, 362.0, 215.0, 137.0, 109.0, 63.0, 47.0, 23.0, 19.0, 19.0, 11.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4365234375, -0.42436981201171875, -0.4122161865234375, -0.40006256103515625, -0.387908935546875, -0.37575531005859375, -0.3636016845703125, -0.35144805908203125, -0.33929443359375, -0.32714080810546875, -0.3149871826171875, -0.30283355712890625, -0.290679931640625, -0.27852630615234375, -0.2663726806640625, -0.25421905517578125, -0.2420654296875, -0.22991180419921875, -0.2177581787109375, -0.20560455322265625, -0.193450927734375, -0.18129730224609375, -0.1691436767578125, -0.15699005126953125, -0.14483642578125, -0.13268280029296875, -0.1205291748046875, -0.10837554931640625, -0.096221923828125, -0.08406829833984375, -0.0719146728515625, -0.05976104736328125, -0.047607421875, -0.03545379638671875, -0.0233001708984375, -0.01114654541015625, 0.001007080078125, 0.01316070556640625, 0.0253143310546875, 0.03746795654296875, 0.04962158203125, 0.06177520751953125, 0.0739288330078125, 0.08608245849609375, 0.098236083984375, 0.11038970947265625, 0.1225433349609375, 0.13469696044921875, 0.1468505859375, 0.15900421142578125, 0.1711578369140625, 0.18331146240234375, 0.195465087890625, 0.20761871337890625, 0.2197723388671875, 0.23192596435546875, 0.24407958984375, 0.25623321533203125, 0.2683868408203125, 0.28054046630859375, 0.292694091796875, 0.30484771728515625, 0.3170013427734375, 0.32915496826171875, 0.34130859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 6.0, 6.0, 5.0, 9.0, 8.0, 9.0, 16.0, 22.0, 25.0, 29.0, 24.0, 38.0, 37.0, 38.0, 48.0, 45.0, 45.0, 69.0, 58.0, 50.0, 57.0, 44.0, 43.0, 46.0, 44.0, 43.0, 30.0, 24.0, 15.0, 21.0, 6.0, 7.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373046875, -0.3598518371582031, -0.34665679931640625, -0.3334617614746094, -0.3202667236328125, -0.3070716857910156, -0.29387664794921875, -0.2806816101074219, -0.267486572265625, -0.2542915344238281, -0.24109649658203125, -0.22790145874023438, -0.2147064208984375, -0.20151138305664062, -0.18831634521484375, -0.17512130737304688, -0.16192626953125, -0.14873123168945312, -0.13553619384765625, -0.12234115600585938, -0.1091461181640625, -0.09595108032226562, -0.08275604248046875, -0.06956100463867188, -0.056365966796875, -0.043170928955078125, -0.02997589111328125, -0.016780853271484375, -0.0035858154296875, 0.009609222412109375, 0.02280426025390625, 0.035999298095703125, 0.0491943359375, 0.062389373779296875, 0.07558441162109375, 0.08877944946289062, 0.1019744873046875, 0.11516952514648438, 0.12836456298828125, 0.14155960083007812, 0.154754638671875, 0.16794967651367188, 0.18114471435546875, 0.19433975219726562, 0.2075347900390625, 0.22072982788085938, 0.23392486572265625, 0.24711990356445312, 0.26031494140625, 0.2735099792480469, 0.28670501708984375, 0.2999000549316406, 0.3130950927734375, 0.3262901306152344, 0.33948516845703125, 0.3526802062988281, 0.365875244140625, 0.3790702819824219, 0.39226531982421875, 0.4054603576660156, 0.4186553955078125, 0.4318504333496094, 0.44504547119140625, 0.4582405090332031, 0.471435546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 21.0, 47.0, 75.0, 198.0, 540.0, 2009.0, 14450.0, 642892.0, 376146.0, 9828.0, 1518.0, 471.0, 178.0, 85.0, 36.0, 15.0, 12.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.4274482727050781, -0.41446685791015625, -0.4014854431152344, -0.3885040283203125, -0.3755226135253906, -0.36254119873046875, -0.3495597839355469, -0.336578369140625, -0.3235969543457031, -0.31061553955078125, -0.2976341247558594, -0.2846527099609375, -0.2716712951660156, -0.25868988037109375, -0.24570846557617188, -0.23272705078125, -0.21974563598632812, -0.20676422119140625, -0.19378280639648438, -0.1808013916015625, -0.16781997680664062, -0.15483856201171875, -0.14185714721679688, -0.128875732421875, -0.11589431762695312, -0.10291290283203125, -0.08993148803710938, -0.0769500732421875, -0.06396865844726562, -0.05098724365234375, -0.038005828857421875, -0.0250244140625, -0.012042999267578125, 0.00093841552734375, 0.013919830322265625, 0.0269012451171875, 0.039882659912109375, 0.05286407470703125, 0.06584548950195312, 0.078826904296875, 0.09180831909179688, 0.10478973388671875, 0.11777114868164062, 0.1307525634765625, 0.14373397827148438, 0.15671539306640625, 0.16969680786132812, 0.18267822265625, 0.19565963745117188, 0.20864105224609375, 0.22162246704101562, 0.2346038818359375, 0.24758529663085938, 0.26056671142578125, 0.2735481262207031, 0.286529541015625, 0.2995109558105469, 0.31249237060546875, 0.3254737854003906, 0.3384552001953125, 0.3514366149902344, 0.36441802978515625, 0.3773994445800781, 0.390380859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 15.0, 11.0, 16.0, 16.0, 40.0, 39.0, 52.0, 68.0, 92.0, 83.0, 91.0, 86.0, 80.0, 70.0, 51.0, 55.0, 43.0, 25.0, 13.0, 15.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7147274017333984e-05, -4.5076943933963776e-05, -4.300661385059357e-05, -4.093628376722336e-05, -3.886595368385315e-05, -3.679562360048294e-05, -3.472529351711273e-05, -3.265496343374252e-05, -3.0584633350372314e-05, -2.8514303267002106e-05, -2.6443973183631897e-05, -2.4373643100261688e-05, -2.230331301689148e-05, -2.023298293352127e-05, -1.8162652850151062e-05, -1.6092322766780853e-05, -1.4021992683410645e-05, -1.1951662600040436e-05, -9.881332516670227e-06, -7.811002433300018e-06, -5.7406723499298096e-06, -3.670342266559601e-06, -1.600012183189392e-06, 4.7031790018081665e-07, 2.5406479835510254e-06, 4.610978066921234e-06, 6.681308150291443e-06, 8.751638233661652e-06, 1.082196831703186e-05, 1.2892298400402069e-05, 1.4962628483772278e-05, 1.7032958567142487e-05, 1.9103288650512695e-05, 2.1173618733882904e-05, 2.3243948817253113e-05, 2.531427890062332e-05, 2.738460898399353e-05, 2.945493906736374e-05, 3.152526915073395e-05, 3.3595599234104156e-05, 3.5665929317474365e-05, 3.7736259400844574e-05, 3.980658948421478e-05, 4.187691956758499e-05, 4.39472496509552e-05, 4.601757973432541e-05, 4.808790981769562e-05, 5.0158239901065826e-05, 5.2228569984436035e-05, 5.4298900067806244e-05, 5.636923015117645e-05, 5.843956023454666e-05, 6.050989031791687e-05, 6.258022040128708e-05, 6.465055048465729e-05, 6.67208805680275e-05, 6.87912106513977e-05, 7.086154073476791e-05, 7.293187081813812e-05, 7.500220090150833e-05, 7.707253098487854e-05, 7.914286106824875e-05, 8.121319115161896e-05, 8.328352123498917e-05, 8.535385131835938e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 12.0, 14.0, 36.0, 53.0, 101.0, 165.0, 338.0, 678.0, 1579.0, 4947.0, 23800.0, 269719.0, 667135.0, 66208.0, 9217.0, 2594.0, 984.0, 424.0, 236.0, 123.0, 66.0, 39.0, 17.0, 13.0, 8.0, 11.0, 9.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21076583862304688, -0.20302581787109375, -0.19528579711914062, -0.1875457763671875, -0.17980575561523438, -0.17206573486328125, -0.16432571411132812, -0.156585693359375, -0.14884567260742188, -0.14110565185546875, -0.13336563110351562, -0.1256256103515625, -0.11788558959960938, -0.11014556884765625, -0.10240554809570312, -0.09466552734375, -0.08692550659179688, -0.07918548583984375, -0.07144546508789062, -0.0637054443359375, -0.055965423583984375, -0.04822540283203125, -0.040485382080078125, -0.032745361328125, -0.025005340576171875, -0.01726531982421875, -0.009525299072265625, -0.0017852783203125, 0.005954742431640625, 0.01369476318359375, 0.021434783935546875, 0.0291748046875, 0.036914825439453125, 0.04465484619140625, 0.052394866943359375, 0.0601348876953125, 0.06787490844726562, 0.07561492919921875, 0.08335494995117188, 0.091094970703125, 0.09883499145507812, 0.10657501220703125, 0.11431503295898438, 0.1220550537109375, 0.12979507446289062, 0.13753509521484375, 0.14527511596679688, 0.15301513671875, 0.16075515747070312, 0.16849517822265625, 0.17623519897460938, 0.1839752197265625, 0.19171524047851562, 0.19945526123046875, 0.20719528198242188, 0.214935302734375, 0.22267532348632812, 0.23041534423828125, 0.23815536499023438, 0.2458953857421875, 0.2536354064941406, 0.26137542724609375, 0.2691154479980469, 0.27685546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 14.0, 19.0, 30.0, 38.0, 46.0, 58.0, 72.0, 85.0, 62.0, 85.0, 91.0, 72.0, 69.0, 51.0, 44.0, 32.0, 35.0, 26.0, 14.0, 8.0, 9.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.151947021484375, -0.14654541015625, -0.141143798828125, -0.1357421875, -0.130340576171875, -0.12493896484375, -0.119537353515625, -0.1141357421875, -0.108734130859375, -0.10333251953125, -0.097930908203125, -0.092529296875, -0.087127685546875, -0.08172607421875, -0.076324462890625, -0.0709228515625, -0.065521240234375, -0.06011962890625, -0.054718017578125, -0.04931640625, -0.043914794921875, -0.03851318359375, -0.033111572265625, -0.0277099609375, -0.022308349609375, -0.01690673828125, -0.011505126953125, -0.006103515625, -0.000701904296875, 0.00469970703125, 0.010101318359375, 0.0155029296875, 0.020904541015625, 0.02630615234375, 0.031707763671875, 0.037109375, 0.042510986328125, 0.04791259765625, 0.053314208984375, 0.0587158203125, 0.064117431640625, 0.06951904296875, 0.074920654296875, 0.080322265625, 0.085723876953125, 0.09112548828125, 0.096527099609375, 0.1019287109375, 0.107330322265625, 0.11273193359375, 0.118133544921875, 0.12353515625, 0.128936767578125, 0.13433837890625, 0.139739990234375, 0.1451416015625, 0.150543212890625, 0.15594482421875, 0.161346435546875, 0.166748046875, 0.172149658203125, 0.17755126953125, 0.182952880859375, 0.1883544921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 15.0, 39.0, 124.0, 237.0, 274.0, 190.0, 79.0, 29.0, 9.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.918266534805298, -2.739671468734741, -2.5610766410827637, -2.382481575012207, -2.2038865089416504, -2.025291681289673, -1.8466966152191162, -1.6681016683578491, -1.489506721496582, -1.310911774635315, -1.1323168277740479, -0.9537217617034912, -0.7751268148422241, -0.596531867980957, -0.4179368019104004, -0.2393418550491333, -0.06074690818786621, 0.11784806847572327, 0.29644304513931274, 0.4750380516052246, 0.6536329984664917, 0.8322279453277588, 1.0108230113983154, 1.1894179582595825, 1.3680129051208496, 1.5466078519821167, 1.7252027988433838, 1.9037978649139404, 2.082392692565918, 2.2609877586364746, 2.4395828247070312, 2.618177890777588, 2.7967729568481445, 2.975368022918701, 3.1539628505706787, 3.3325579166412354, 3.511152744293213, 3.6897478103637695, 3.868342876434326, 4.046937942504883, 4.225532531738281, 4.404127597808838, 4.5827226638793945, 4.761317253112793, 4.93991231918335, 5.118507385253906, 5.297102451324463, 5.4756975173950195, 5.654292583465576, 5.832887649536133, 6.0114827156066895, 6.190077781677246, 6.3686723709106445, 6.547267436981201, 6.725862503051758, 6.9044575691223145, 7.083052635192871, 7.261647701263428, 7.440242767333984, 7.618837356567383, 7.7974324226379395, 7.976027488708496, 8.154623031616211, 8.33321762084961, 8.511812210083008]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 1.0, 9.0, 3.0, 8.0, 1.0, 12.0, 17.0, 11.0, 13.0, 11.0, 16.0, 24.0, 39.0, 25.0, 39.0, 46.0, 60.0, 55.0, 68.0, 45.0, 47.0, 59.0, 57.0, 60.0, 44.0, 30.0, 25.0, 25.0, 24.0, 25.0, 25.0, 18.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0916075706481934, -2.0315911769866943, -1.9715749025344849, -1.9115585088729858, -1.8515422344207764, -1.7915258407592773, -1.7315094470977783, -1.6714931726455688, -1.6114768981933594, -1.5514605045318604, -1.4914442300796509, -1.4314278364181519, -1.3714115619659424, -1.3113951683044434, -1.2513787746429443, -1.1913625001907349, -1.1313461065292358, -1.0713297128677368, -1.0113134384155273, -0.9512970447540283, -0.8912807703018188, -0.8312643766403198, -0.7712480425834656, -0.7112317085266113, -0.6512153744697571, -0.5911990404129028, -0.5311827063560486, -0.47116634249687195, -0.4111500084400177, -0.35113367438316345, -0.2911173105239868, -0.23110097646713257, -0.17108476161956787, -0.11106842011213303, -0.05105207860469818, 0.00896427035331726, 0.06898060441017151, 0.12899693846702576, 0.1890133023262024, 0.24902963638305664, 0.3090459704399109, 0.36906230449676514, 0.4290786385536194, 0.489095002412796, 0.5491113662719727, 0.6091276407241821, 0.6691440343856812, 0.7291603684425354, 0.7891767024993896, 0.8491930365562439, 0.9092093706130981, 0.9692257642745972, 1.0292420387268066, 1.0892584323883057, 1.1492748260498047, 1.2092911005020142, 1.2693073749542236, 1.3293237686157227, 1.3893400430679321, 1.4493564367294312, 1.5093727111816406, 1.5693891048431396, 1.6294054985046387, 1.6894217729568481, 1.7494381666183472]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 7.0, 9.0, 10.0, 16.0, 29.0, 30.0, 49.0, 103.0, 143.0, 158.0, 274.0, 462.0, 736.0, 1091.0, 1945.0, 3624.0, 7609.0, 20463.0, 202115.0, 3909827.0, 26883.0, 8878.0, 4129.0, 2178.0, 1303.0, 826.0, 476.0, 278.0, 189.0, 135.0, 91.0, 50.0, 53.0, 37.0, 19.0, 20.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3446311950683594, -0.33354949951171875, -0.3224678039550781, -0.3113861083984375, -0.3003044128417969, -0.28922271728515625, -0.2781410217285156, -0.267059326171875, -0.2559776306152344, -0.24489593505859375, -0.23381423950195312, -0.2227325439453125, -0.21165084838867188, -0.20056915283203125, -0.18948745727539062, -0.17840576171875, -0.16732406616210938, -0.15624237060546875, -0.14516067504882812, -0.1340789794921875, -0.12299728393554688, -0.11191558837890625, -0.10083389282226562, -0.089752197265625, -0.07867050170898438, -0.06758880615234375, -0.056507110595703125, -0.0454254150390625, -0.034343719482421875, -0.02326202392578125, -0.012180328369140625, -0.0010986328125, 0.009983062744140625, 0.02106475830078125, 0.032146453857421875, 0.0432281494140625, 0.054309844970703125, 0.06539154052734375, 0.07647323608398438, 0.087554931640625, 0.09863662719726562, 0.10971832275390625, 0.12080001831054688, 0.1318817138671875, 0.14296340942382812, 0.15404510498046875, 0.16512680053710938, 0.17620849609375, 0.18729019165039062, 0.19837188720703125, 0.20945358276367188, 0.2205352783203125, 0.23161697387695312, 0.24269866943359375, 0.2537803649902344, 0.264862060546875, 0.2759437561035156, 0.28702545166015625, 0.2981071472167969, 0.3091888427734375, 0.3202705383300781, 0.33135223388671875, 0.3424339294433594, 0.353515625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 1.0, 9.0, 16.0, 9.0, 22.0, 22.0, 24.0, 40.0, 58.0, 51.0, 69.0, 56.0, 64.0, 83.0, 71.0, 70.0, 71.0, 63.0, 51.0, 41.0, 29.0, 22.0, 13.0, 13.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1357421875, -0.13199329376220703, -0.12824440002441406, -0.1244955062866211, -0.12074661254882812, -0.11699771881103516, -0.11324882507324219, -0.10949993133544922, -0.10575103759765625, -0.10200214385986328, -0.09825325012207031, -0.09450435638427734, -0.09075546264648438, -0.0870065689086914, -0.08325767517089844, -0.07950878143310547, -0.0757598876953125, -0.07201099395751953, -0.06826210021972656, -0.0645132064819336, -0.060764312744140625, -0.057015419006347656, -0.05326652526855469, -0.04951763153076172, -0.04576873779296875, -0.04201984405517578, -0.03827095031738281, -0.034522056579589844, -0.030773162841796875, -0.027024269104003906, -0.023275375366210938, -0.01952648162841797, -0.015777587890625, -0.012028694152832031, -0.008279800415039062, -0.004530906677246094, -0.000782012939453125, 0.0029668807983398438, 0.0067157745361328125, 0.010464668273925781, 0.01421356201171875, 0.01796245574951172, 0.021711349487304688, 0.025460243225097656, 0.029209136962890625, 0.032958030700683594, 0.03670692443847656, 0.04045581817626953, 0.0442047119140625, 0.04795360565185547, 0.05170249938964844, 0.055451393127441406, 0.059200286865234375, 0.06294918060302734, 0.06669807434082031, 0.07044696807861328, 0.07419586181640625, 0.07794475555419922, 0.08169364929199219, 0.08544254302978516, 0.08919143676757812, 0.0929403305053711, 0.09668922424316406, 0.10043811798095703, 0.10418701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 14.0, 16.0, 10.0, 14.0, 27.0, 34.0, 47.0, 63.0, 99.0, 203.0, 308.0, 623.0, 1210.0, 2920.0, 8810.0, 44650.0, 4049976.0, 67641.0, 11191.0, 3428.0, 1445.0, 644.0, 339.0, 182.0, 108.0, 69.0, 58.0, 30.0, 23.0, 15.0, 17.0, 14.0, 13.0, 8.0, 11.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50830078125, -0.48987579345703125, -0.4714508056640625, -0.45302581787109375, -0.434600830078125, -0.41617584228515625, -0.3977508544921875, -0.37932586669921875, -0.36090087890625, -0.34247589111328125, -0.3240509033203125, -0.30562591552734375, -0.287200927734375, -0.26877593994140625, -0.2503509521484375, -0.23192596435546875, -0.2135009765625, -0.19507598876953125, -0.1766510009765625, -0.15822601318359375, -0.139801025390625, -0.12137603759765625, -0.1029510498046875, -0.08452606201171875, -0.06610107421875, -0.04767608642578125, -0.0292510986328125, -0.01082611083984375, 0.007598876953125, 0.02602386474609375, 0.0444488525390625, 0.06287384033203125, 0.081298828125, 0.09972381591796875, 0.1181488037109375, 0.13657379150390625, 0.154998779296875, 0.17342376708984375, 0.1918487548828125, 0.21027374267578125, 0.22869873046875, 0.24712371826171875, 0.2655487060546875, 0.28397369384765625, 0.302398681640625, 0.32082366943359375, 0.3392486572265625, 0.35767364501953125, 0.3760986328125, 0.39452362060546875, 0.4129486083984375, 0.43137359619140625, 0.449798583984375, 0.46822357177734375, 0.4866485595703125, 0.5050735473632812, 0.52349853515625, 0.5419235229492188, 0.5603485107421875, 0.5787734985351562, 0.597198486328125, 0.6156234741210938, 0.6340484619140625, 0.6524734497070312, 0.6708984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 11.0, 14.0, 27.0, 54.0, 151.0, 3472.0, 193.0, 60.0, 20.0, 18.0, 10.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07776165008544922, -0.07379722595214844, -0.06983280181884766, -0.06586837768554688, -0.061903953552246094, -0.05793952941894531, -0.05397510528564453, -0.05001068115234375, -0.04604625701904297, -0.04208183288574219, -0.038117408752441406, -0.034152984619140625, -0.030188560485839844, -0.026224136352539062, -0.02225971221923828, -0.0182952880859375, -0.014330863952636719, -0.010366439819335938, -0.006402015686035156, -0.002437591552734375, 0.0015268325805664062, 0.0054912567138671875, 0.009455680847167969, 0.01342010498046875, 0.01738452911376953, 0.021348953247070312, 0.025313377380371094, 0.029277801513671875, 0.033242225646972656, 0.03720664978027344, 0.04117107391357422, 0.045135498046875, 0.04909992218017578, 0.05306434631347656, 0.057028770446777344, 0.060993194580078125, 0.0649576187133789, 0.06892204284667969, 0.07288646697998047, 0.07685089111328125, 0.08081531524658203, 0.08477973937988281, 0.0887441635131836, 0.09270858764648438, 0.09667301177978516, 0.10063743591308594, 0.10460186004638672, 0.1085662841796875, 0.11253070831298828, 0.11649513244628906, 0.12045955657958984, 0.12442398071289062, 0.1283884048461914, 0.1323528289794922, 0.13631725311279297, 0.14028167724609375, 0.14424610137939453, 0.1482105255126953, 0.1521749496459961, 0.15613937377929688, 0.16010379791259766, 0.16406822204589844, 0.16803264617919922, 0.1719970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 15.0, 27.0, 47.0, 73.0, 103.0, 128.0, 145.0, 133.0, 117.0, 74.0, 53.0, 33.0, 19.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5267080664634705, -0.5120776891708374, -0.49744731187820435, -0.4828169345855713, -0.4681865870952606, -0.45355620980262756, -0.4389258325099945, -0.42429545521736145, -0.4096651077270508, -0.3950347304344177, -0.38040435314178467, -0.3657739758491516, -0.35114362835884094, -0.3365132510662079, -0.32188287377357483, -0.3072524964809418, -0.2926221191883087, -0.27799174189567566, -0.2633613646030426, -0.24873100221157074, -0.23410063982009888, -0.21947026252746582, -0.20483988523483276, -0.1902095079421997, -0.17557914555072784, -0.1609487682580948, -0.14631840586662292, -0.13168802857398987, -0.11705765873193741, -0.10242728888988495, -0.08779691159725189, -0.07316654175519943, -0.05853617191314697, -0.04390580207109451, -0.029275428503751755, -0.014645054936408997, -1.4685094356536865e-05, 0.014615684747695923, 0.02924606204032898, 0.04387643188238144, 0.0585068017244339, 0.07313717156648636, 0.08776754140853882, 0.10239791870117188, 0.11702828854322433, 0.1316586583852768, 0.14628903567790985, 0.1609193980693817, 0.17554977536201477, 0.19018015265464783, 0.2048105150461197, 0.21944089233875275, 0.2340712547302246, 0.24870163202285767, 0.2633320093154907, 0.2779623866081238, 0.29259276390075684, 0.3072231411933899, 0.32185351848602295, 0.336483895778656, 0.3511142432689667, 0.36574462056159973, 0.3803749978542328, 0.39500537514686584, 0.4096357226371765]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 7.0, 7.0, 19.0, 9.0, 22.0, 20.0, 14.0, 30.0, 34.0, 31.0, 30.0, 41.0, 38.0, 35.0, 51.0, 48.0, 38.0, 40.0, 41.0, 29.0, 39.0, 41.0, 29.0, 37.0, 32.0, 30.0, 27.0, 22.0, 22.0, 20.0, 14.0, 15.0, 18.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.17311352491378784, -0.16769325733184814, -0.16227300465106964, -0.15685273706912994, -0.15143248438835144, -0.14601221680641174, -0.14059194922447205, -0.13517168164253235, -0.12975142896175385, -0.12433116883039474, -0.11891090869903564, -0.11349064111709595, -0.10807038098573685, -0.10265012085437775, -0.09722985327243805, -0.09180959314107895, -0.08638933300971985, -0.08096907287836075, -0.07554881274700165, -0.07012854516506195, -0.06470828503370285, -0.05928802490234375, -0.05386776104569435, -0.04844749718904495, -0.04302723705768585, -0.03760697692632675, -0.03218671306967735, -0.026766451075673103, -0.021346189081668854, -0.015925927087664604, -0.010505665093660355, -0.005085401237010956, 0.00033485889434814453, 0.005755120888352394, 0.011175382882356644, 0.016595644876360893, 0.022015906870365143, 0.027436168864369392, 0.03285643085837364, 0.03827669471502304, 0.04369695484638214, 0.04911721497774124, 0.05453747883439064, 0.05995774269104004, 0.06537800282239914, 0.07079826295375824, 0.07621853053569794, 0.08163879066705704, 0.08705905079841614, 0.09247931092977524, 0.09789957106113434, 0.10331983864307404, 0.10874009877443314, 0.11416035890579224, 0.11958062648773193, 0.12500089406967163, 0.13042114675045013, 0.13584141433238983, 0.14126166701316833, 0.14668193459510803, 0.15210220217704773, 0.15752245485782623, 0.16294272243976593, 0.16836297512054443, 0.17378324270248413]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 4.0, 16.0, 21.0, 38.0, 40.0, 47.0, 69.0, 100.0, 175.0, 267.0, 451.0, 734.0, 1372.0, 2626.0, 4945.0, 9900.0, 20527.0, 42985.0, 93802.0, 210456.0, 319126.0, 184503.0, 81910.0, 37977.0, 17813.0, 8854.0, 4378.0, 2205.0, 1268.0, 736.0, 437.0, 243.0, 176.0, 106.0, 77.0, 49.0, 32.0, 17.0, 17.0, 12.0, 8.0, 4.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14276695251464844, -0.13807296752929688, -0.1333789825439453, -0.12868499755859375, -0.12399101257324219, -0.11929702758789062, -0.11460304260253906, -0.1099090576171875, -0.10521507263183594, -0.10052108764648438, -0.09582710266113281, -0.09113311767578125, -0.08643913269042969, -0.08174514770507812, -0.07705116271972656, -0.072357177734375, -0.06766319274902344, -0.06296920776367188, -0.05827522277832031, -0.05358123779296875, -0.04888725280761719, -0.044193267822265625, -0.03949928283691406, -0.0348052978515625, -0.030111312866210938, -0.025417327880859375, -0.020723342895507812, -0.01602935791015625, -0.011335372924804688, -0.006641387939453125, -0.0019474029541015625, 0.00274658203125, 0.0074405670166015625, 0.012134552001953125, 0.016828536987304688, 0.02152252197265625, 0.026216506958007812, 0.030910491943359375, 0.03560447692871094, 0.0402984619140625, 0.04499244689941406, 0.049686431884765625, 0.05438041687011719, 0.05907440185546875, 0.06376838684082031, 0.06846237182617188, 0.07315635681152344, 0.077850341796875, 0.08254432678222656, 0.08723831176757812, 0.09193229675292969, 0.09662628173828125, 0.10132026672363281, 0.10601425170898438, 0.11070823669433594, 0.1154022216796875, 0.12009620666503906, 0.12479019165039062, 0.1294841766357422, 0.13417816162109375, 0.1388721466064453, 0.14356613159179688, 0.14826011657714844, 0.1529541015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 10.0, 14.0, 14.0, 20.0, 27.0, 24.0, 36.0, 52.0, 62.0, 59.0, 86.0, 83.0, 80.0, 91.0, 58.0, 55.0, 44.0, 45.0, 42.0, 30.0, 23.0, 10.0, 11.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14844894409179688, -0.14430999755859375, -0.14017105102539062, -0.1360321044921875, -0.13189315795898438, -0.12775421142578125, -0.12361526489257812, -0.119476318359375, -0.11533737182617188, -0.11119842529296875, -0.10705947875976562, -0.1029205322265625, -0.09878158569335938, -0.09464263916015625, -0.09050369262695312, -0.08636474609375, -0.08222579956054688, -0.07808685302734375, -0.07394790649414062, -0.0698089599609375, -0.06567001342773438, -0.06153106689453125, -0.057392120361328125, -0.053253173828125, -0.049114227294921875, -0.04497528076171875, -0.040836334228515625, -0.0366973876953125, -0.032558441162109375, -0.02841949462890625, -0.024280548095703125, -0.0201416015625, -0.016002655029296875, -0.01186370849609375, -0.007724761962890625, -0.0035858154296875, 0.000553131103515625, 0.00469207763671875, 0.008831024169921875, 0.012969970703125, 0.017108917236328125, 0.02124786376953125, 0.025386810302734375, 0.0295257568359375, 0.033664703369140625, 0.03780364990234375, 0.041942596435546875, 0.04608154296875, 0.050220489501953125, 0.05435943603515625, 0.058498382568359375, 0.0626373291015625, 0.06677627563476562, 0.07091522216796875, 0.07505416870117188, 0.079193115234375, 0.08333206176757812, 0.08747100830078125, 0.09160995483398438, 0.0957489013671875, 0.09988784790039062, 0.10402679443359375, 0.10816574096679688, 0.1123046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 9.0, 6.0, 5.0, 13.0, 22.0, 29.0, 40.0, 39.0, 55.0, 70.0, 107.0, 111.0, 181.0, 300.0, 422.0, 732.0, 1401.0, 3207.0, 10739.0, 52878.0, 454774.0, 453938.0, 52171.0, 10516.0, 3237.0, 1369.0, 723.0, 434.0, 294.0, 203.0, 123.0, 92.0, 86.0, 51.0, 40.0, 32.0, 33.0, 20.0, 14.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.32177734375, -0.3123130798339844, -0.30284881591796875, -0.2933845520019531, -0.2839202880859375, -0.2744560241699219, -0.26499176025390625, -0.2555274963378906, -0.246063232421875, -0.23659896850585938, -0.22713470458984375, -0.21767044067382812, -0.2082061767578125, -0.19874191284179688, -0.18927764892578125, -0.17981338500976562, -0.17034912109375, -0.16088485717773438, -0.15142059326171875, -0.14195632934570312, -0.1324920654296875, -0.12302780151367188, -0.11356353759765625, -0.10409927368164062, -0.094635009765625, -0.08517074584960938, -0.07570648193359375, -0.06624221801757812, -0.0567779541015625, -0.047313690185546875, -0.03784942626953125, -0.028385162353515625, -0.0189208984375, -0.009456634521484375, 7.62939453125e-06, 0.009471893310546875, 0.0189361572265625, 0.028400421142578125, 0.03786468505859375, 0.047328948974609375, 0.056793212890625, 0.06625747680664062, 0.07572174072265625, 0.08518600463867188, 0.0946502685546875, 0.10411453247070312, 0.11357879638671875, 0.12304306030273438, 0.13250732421875, 0.14197158813476562, 0.15143585205078125, 0.16090011596679688, 0.1703643798828125, 0.17982864379882812, 0.18929290771484375, 0.19875717163085938, 0.208221435546875, 0.21768569946289062, 0.22714996337890625, 0.23661422729492188, 0.2460784912109375, 0.2555427551269531, 0.26500701904296875, 0.2744712829589844, 0.283935546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 11.0, 10.0, 20.0, 27.0, 25.0, 34.0, 33.0, 44.0, 39.0, 50.0, 47.0, 54.0, 51.0, 49.0, 54.0, 50.0, 39.0, 41.0, 43.0, 45.0, 36.0, 32.0, 38.0, 25.0, 13.0, 9.0, 23.0, 10.0, 10.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4873046875, -0.4737281799316406, -0.46015167236328125, -0.4465751647949219, -0.4329986572265625, -0.4194221496582031, -0.40584564208984375, -0.3922691345214844, -0.378692626953125, -0.3651161193847656, -0.35153961181640625, -0.3379631042480469, -0.3243865966796875, -0.3108100891113281, -0.29723358154296875, -0.2836570739746094, -0.27008056640625, -0.2565040588378906, -0.24292755126953125, -0.22935104370117188, -0.2157745361328125, -0.20219802856445312, -0.18862152099609375, -0.17504501342773438, -0.161468505859375, -0.14789199829101562, -0.13431549072265625, -0.12073898315429688, -0.1071624755859375, -0.09358596801757812, -0.08000946044921875, -0.06643295288085938, -0.0528564453125, -0.039279937744140625, -0.02570343017578125, -0.012126922607421875, 0.0014495849609375, 0.015026092529296875, 0.02860260009765625, 0.042179107666015625, 0.055755615234375, 0.06933212280273438, 0.08290863037109375, 0.09648513793945312, 0.1100616455078125, 0.12363815307617188, 0.13721466064453125, 0.15079116821289062, 0.16436767578125, 0.17794418334960938, 0.19152069091796875, 0.20509719848632812, 0.2186737060546875, 0.23225021362304688, 0.24582672119140625, 0.2594032287597656, 0.272979736328125, 0.2865562438964844, 0.30013275146484375, 0.3137092590332031, 0.3272857666015625, 0.3408622741699219, 0.35443878173828125, 0.3680152893066406, 0.381591796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 10.0, 23.0, 71.0, 141.0, 385.0, 1476.0, 12118.0, 702824.0, 322432.0, 7437.0, 1098.0, 319.0, 101.0, 48.0, 20.0, 17.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489990234375, -0.4780120849609375, -0.466033935546875, -0.4540557861328125, -0.44207763671875, -0.4300994873046875, -0.418121337890625, -0.4061431884765625, -0.3941650390625, -0.3821868896484375, -0.370208740234375, -0.3582305908203125, -0.34625244140625, -0.3342742919921875, -0.322296142578125, -0.3103179931640625, -0.29833984375, -0.2863616943359375, -0.274383544921875, -0.2624053955078125, -0.25042724609375, -0.2384490966796875, -0.226470947265625, -0.2144927978515625, -0.2025146484375, -0.1905364990234375, -0.178558349609375, -0.1665802001953125, -0.15460205078125, -0.1426239013671875, -0.130645751953125, -0.1186676025390625, -0.106689453125, -0.0947113037109375, -0.082733154296875, -0.0707550048828125, -0.05877685546875, -0.0467987060546875, -0.034820556640625, -0.0228424072265625, -0.0108642578125, 0.0011138916015625, 0.013092041015625, 0.0250701904296875, 0.03704833984375, 0.0490264892578125, 0.061004638671875, 0.0729827880859375, 0.0849609375, 0.0969390869140625, 0.108917236328125, 0.1208953857421875, 0.13287353515625, 0.1448516845703125, 0.156829833984375, 0.1688079833984375, 0.1807861328125, 0.1927642822265625, 0.204742431640625, 0.2167205810546875, 0.22869873046875, 0.2406768798828125, 0.252655029296875, 0.2646331787109375, 0.276611328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 6.0, 4.0, 9.0, 5.0, 4.0, 6.0, 9.0, 11.0, 17.0, 13.0, 18.0, 33.0, 30.0, 60.0, 63.0, 58.0, 67.0, 97.0, 76.0, 77.0, 65.0, 57.0, 52.0, 35.0, 35.0, 20.0, 14.0, 17.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.115436553955078e-05, -5.970802158117294e-05, -5.8261677622795105e-05, -5.681533366441727e-05, -5.536898970603943e-05, -5.392264574766159e-05, -5.247630178928375e-05, -5.1029957830905914e-05, -4.9583613872528076e-05, -4.813726991415024e-05, -4.66909259557724e-05, -4.524458199739456e-05, -4.3798238039016724e-05, -4.2351894080638885e-05, -4.090555012226105e-05, -3.945920616388321e-05, -3.801286220550537e-05, -3.656651824712753e-05, -3.5120174288749695e-05, -3.367383033037186e-05, -3.222748637199402e-05, -3.078114241361618e-05, -2.9334798455238342e-05, -2.7888454496860504e-05, -2.6442110538482666e-05, -2.4995766580104828e-05, -2.354942262172699e-05, -2.210307866334915e-05, -2.0656734704971313e-05, -1.9210390746593475e-05, -1.7764046788215637e-05, -1.63177028298378e-05, -1.4871358871459961e-05, -1.3425014913082123e-05, -1.1978670954704285e-05, -1.0532326996326447e-05, -9.085983037948608e-06, -7.63963907957077e-06, -6.193295121192932e-06, -4.746951162815094e-06, -3.300607204437256e-06, -1.8542632460594177e-06, -4.079192876815796e-07, 1.0384246706962585e-06, 2.4847686290740967e-06, 3.931112587451935e-06, 5.377456545829773e-06, 6.823800504207611e-06, 8.27014446258545e-06, 9.716488420963287e-06, 1.1162832379341125e-05, 1.2609176337718964e-05, 1.4055520296096802e-05, 1.550186425447464e-05, 1.6948208212852478e-05, 1.8394552171230316e-05, 1.9840896129608154e-05, 2.1287240087985992e-05, 2.273358404636383e-05, 2.417992800474167e-05, 2.5626271963119507e-05, 2.7072615921497345e-05, 2.8518959879875183e-05, 2.996530383825302e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 12.0, 14.0, 38.0, 53.0, 78.0, 154.0, 261.0, 487.0, 1056.0, 2895.0, 10818.0, 78367.0, 701611.0, 222894.0, 22061.0, 4731.0, 1645.0, 646.0, 317.0, 176.0, 86.0, 45.0, 33.0, 18.0, 12.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2093505859375, -0.20294952392578125, -0.1965484619140625, -0.19014739990234375, -0.183746337890625, -0.17734527587890625, -0.1709442138671875, -0.16454315185546875, -0.15814208984375, -0.15174102783203125, -0.1453399658203125, -0.13893890380859375, -0.132537841796875, -0.12613677978515625, -0.1197357177734375, -0.11333465576171875, -0.10693359375, -0.10053253173828125, -0.0941314697265625, -0.08773040771484375, -0.081329345703125, -0.07492828369140625, -0.0685272216796875, -0.06212615966796875, -0.05572509765625, -0.04932403564453125, -0.0429229736328125, -0.03652191162109375, -0.030120849609375, -0.02371978759765625, -0.0173187255859375, -0.01091766357421875, -0.0045166015625, 0.00188446044921875, 0.0082855224609375, 0.01468658447265625, 0.021087646484375, 0.02748870849609375, 0.0338897705078125, 0.04029083251953125, 0.04669189453125, 0.05309295654296875, 0.0594940185546875, 0.06589508056640625, 0.072296142578125, 0.07869720458984375, 0.0850982666015625, 0.09149932861328125, 0.097900390625, 0.10430145263671875, 0.1107025146484375, 0.11710357666015625, 0.123504638671875, 0.12990570068359375, 0.1363067626953125, 0.14270782470703125, 0.14910888671875, 0.15550994873046875, 0.1619110107421875, 0.16831207275390625, 0.174713134765625, 0.18111419677734375, 0.1875152587890625, 0.19391632080078125, 0.2003173828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 15.0, 6.0, 18.0, 27.0, 26.0, 24.0, 56.0, 46.0, 57.0, 63.0, 76.0, 75.0, 77.0, 59.0, 58.0, 59.0, 39.0, 40.0, 23.0, 23.0, 20.0, 28.0, 14.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1240234375, -0.12037944793701172, -0.11673545837402344, -0.11309146881103516, -0.10944747924804688, -0.1058034896850586, -0.10215950012207031, -0.09851551055908203, -0.09487152099609375, -0.09122753143310547, -0.08758354187011719, -0.0839395523071289, -0.08029556274414062, -0.07665157318115234, -0.07300758361816406, -0.06936359405517578, -0.0657196044921875, -0.06207561492919922, -0.05843162536621094, -0.054787635803222656, -0.051143646240234375, -0.047499656677246094, -0.04385566711425781, -0.04021167755126953, -0.03656768798828125, -0.03292369842529297, -0.029279708862304688, -0.025635719299316406, -0.021991729736328125, -0.018347740173339844, -0.014703750610351562, -0.011059761047363281, -0.007415771484375, -0.0037717819213867188, -0.0001277923583984375, 0.0035161972045898438, 0.007160186767578125, 0.010804176330566406, 0.014448165893554688, 0.01809215545654297, 0.02173614501953125, 0.02538013458251953, 0.029024124145507812, 0.032668113708496094, 0.036312103271484375, 0.039956092834472656, 0.04360008239746094, 0.04724407196044922, 0.0508880615234375, 0.05453205108642578, 0.05817604064941406, 0.061820030212402344, 0.06546401977539062, 0.0691080093383789, 0.07275199890136719, 0.07639598846435547, 0.08003997802734375, 0.08368396759033203, 0.08732795715332031, 0.0909719467163086, 0.09461593627929688, 0.09825992584228516, 0.10190391540527344, 0.10554790496826172, 0.10919189453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 5.0, 1.0, 6.0, 1.0, 18.0, 27.0, 66.0, 164.0, 193.0, 235.0, 154.0, 83.0, 34.0, 15.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6376831531524658, -1.5120912790298462, -1.3864994049072266, -1.2609076499938965, -1.1353156566619873, -1.0097239017486572, -0.8841320276260376, -0.758540153503418, -0.6329482793807983, -0.5073564052581787, -0.38176456093788147, -0.25617271661758423, -0.1305808424949646, -0.004988968372344971, 0.12060284614562988, 0.2461947202682495, 0.37178659439086914, 0.49737846851348877, 0.6229703426361084, 0.7485621571540833, 0.8741540312767029, 0.9997459053993225, 1.1253377199172974, 1.250929594039917, 1.3765214681625366, 1.5021133422851562, 1.6277052164077759, 1.7532970905303955, 1.8788888454437256, 2.0044808387756348, 2.130072593688965, 2.255664348602295, 2.381256580352783, 2.5068483352661133, 2.6324403285980225, 2.7580320835113525, 2.8836240768432617, 3.009215831756592, 3.134807586669922, 3.260399580001831, 3.3859915733337402, 3.5115833282470703, 3.6371753215789795, 3.7627670764923096, 3.8883590698242188, 4.013950824737549, 4.139542579650879, 4.265134811401367, 4.390726089477539, 4.516317844390869, 4.641909599304199, 4.7675018310546875, 4.893093585968018, 5.018685340881348, 5.144277095794678, 5.269868850708008, 5.395461082458496, 5.521052837371826, 5.646644592285156, 5.7722368240356445, 5.897828578948975, 6.023420333862305, 6.149012088775635, 6.274603843688965, 6.400196075439453]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 3.0, 5.0, 13.0, 13.0, 11.0, 12.0, 24.0, 22.0, 32.0, 23.0, 27.0, 26.0, 39.0, 31.0, 43.0, 41.0, 61.0, 66.0, 57.0, 50.0, 59.0, 36.0, 51.0, 33.0, 33.0, 28.0, 25.0, 20.0, 25.0, 24.0, 13.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9483669996261597, -1.8918190002441406, -1.8352710008621216, -1.7787230014801025, -1.722175121307373, -1.665627121925354, -1.609079122543335, -1.552531123161316, -1.4959831237792969, -1.4394351243972778, -1.3828871250152588, -1.3263392448425293, -1.2697912454605103, -1.2132432460784912, -1.1566952466964722, -1.1001472473144531, -1.0435993671417236, -0.9870513677597046, -0.9305034279823303, -0.8739554286003113, -0.8174074292182922, -0.760859489440918, -0.7043114900588989, -0.6477634906768799, -0.5912154912948608, -0.5346674919128418, -0.47811952233314514, -0.4215715527534485, -0.36502355337142944, -0.3084755837917328, -0.25192761421203613, -0.1953796148300171, -0.13883161544799805, -0.0822836309671402, -0.025735653936862946, 0.030812323093414307, 0.08736030757427216, 0.14390829205513, 0.20045626163482666, 0.2570042610168457, 0.31355223059654236, 0.370100200176239, 0.42664819955825806, 0.4831961691379547, 0.5397441387176514, 0.5962921380996704, 0.6528401374816895, 0.7093881368637085, 0.7659360766410828, 0.8224840760231018, 0.8790320158004761, 0.9355800151824951, 0.9921280145645142, 1.0486760139465332, 1.1052238941192627, 1.1617720127105713, 1.2183198928833008, 1.2748678922653198, 1.3314158916473389, 1.3879637718200684, 1.4445117712020874, 1.5010597705841064, 1.5576077699661255, 1.6141557693481445, 1.6707037687301636]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 16.0, 19.0, 26.0, 38.0, 66.0, 111.0, 164.0, 253.0, 423.0, 756.0, 1319.0, 2513.0, 4931.0, 11363.0, 33761.0, 200696.0, 3822723.0, 78982.0, 20385.0, 7817.0, 3567.0, 1786.0, 957.0, 594.0, 345.0, 211.0, 165.0, 104.0, 67.0, 42.0, 21.0, 15.0, 10.0, 7.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.2677154541015625, -0.258575439453125, -0.2494354248046875, -0.24029541015625, -0.2311553955078125, -0.222015380859375, -0.2128753662109375, -0.2037353515625, -0.1945953369140625, -0.185455322265625, -0.1763153076171875, -0.16717529296875, -0.1580352783203125, -0.148895263671875, -0.1397552490234375, -0.130615234375, -0.1214752197265625, -0.112335205078125, -0.1031951904296875, -0.09405517578125, -0.0849151611328125, -0.075775146484375, -0.0666351318359375, -0.0574951171875, -0.0483551025390625, -0.039215087890625, -0.0300750732421875, -0.02093505859375, -0.0117950439453125, -0.002655029296875, 0.0064849853515625, 0.015625, 0.0247650146484375, 0.033905029296875, 0.0430450439453125, 0.05218505859375, 0.0613250732421875, 0.070465087890625, 0.0796051025390625, 0.0887451171875, 0.0978851318359375, 0.107025146484375, 0.1161651611328125, 0.12530517578125, 0.1344451904296875, 0.143585205078125, 0.1527252197265625, 0.161865234375, 0.1710052490234375, 0.180145263671875, 0.1892852783203125, 0.19842529296875, 0.2075653076171875, 0.216705322265625, 0.2258453369140625, 0.2349853515625, 0.2441253662109375, 0.253265380859375, 0.2624053955078125, 0.27154541015625, 0.2806854248046875, 0.289825439453125, 0.2989654541015625, 0.30810546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 14.0, 12.0, 15.0, 21.0, 19.0, 38.0, 56.0, 48.0, 48.0, 64.0, 62.0, 80.0, 66.0, 49.0, 45.0, 50.0, 44.0, 47.0, 40.0, 37.0, 34.0, 23.0, 14.0, 6.0, 11.0, 5.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10055828094482422, -0.09753990173339844, -0.09452152252197266, -0.09150314331054688, -0.0884847640991211, -0.08546638488769531, -0.08244800567626953, -0.07942962646484375, -0.07641124725341797, -0.07339286804199219, -0.0703744888305664, -0.06735610961914062, -0.06433773040771484, -0.06131935119628906, -0.05830097198486328, -0.0552825927734375, -0.05226421356201172, -0.04924583435058594, -0.046227455139160156, -0.043209075927734375, -0.040190696716308594, -0.03717231750488281, -0.03415393829345703, -0.03113555908203125, -0.02811717987060547, -0.025098800659179688, -0.022080421447753906, -0.019062042236328125, -0.016043663024902344, -0.013025283813476562, -0.010006904602050781, -0.006988525390625, -0.003970146179199219, -0.0009517669677734375, 0.0020666122436523438, 0.005084991455078125, 0.008103370666503906, 0.011121749877929688, 0.014140129089355469, 0.01715850830078125, 0.02017688751220703, 0.023195266723632812, 0.026213645935058594, 0.029232025146484375, 0.032250404357910156, 0.03526878356933594, 0.03828716278076172, 0.0413055419921875, 0.04432392120361328, 0.04734230041503906, 0.050360679626464844, 0.053379058837890625, 0.056397438049316406, 0.05941581726074219, 0.06243419647216797, 0.06545257568359375, 0.06847095489501953, 0.07148933410644531, 0.0745077133178711, 0.07752609252929688, 0.08054447174072266, 0.08356285095214844, 0.08658123016357422, 0.089599609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 14.0, 22.0, 28.0, 48.0, 81.0, 107.0, 150.0, 245.0, 442.0, 747.0, 1464.0, 3269.0, 8044.0, 26090.0, 154271.0, 3818326.0, 141843.0, 24830.0, 7796.0, 3115.0, 1463.0, 719.0, 406.0, 255.0, 154.0, 107.0, 78.0, 46.0, 33.0, 15.0, 19.0, 15.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3632965087890625, -0.353057861328125, -0.3428192138671875, -0.33258056640625, -0.3223419189453125, -0.312103271484375, -0.3018646240234375, -0.2916259765625, -0.2813873291015625, -0.271148681640625, -0.2609100341796875, -0.25067138671875, -0.2404327392578125, -0.230194091796875, -0.2199554443359375, -0.209716796875, -0.1994781494140625, -0.189239501953125, -0.1790008544921875, -0.16876220703125, -0.1585235595703125, -0.148284912109375, -0.1380462646484375, -0.1278076171875, -0.1175689697265625, -0.107330322265625, -0.0970916748046875, -0.08685302734375, -0.0766143798828125, -0.066375732421875, -0.0561370849609375, -0.0458984375, -0.0356597900390625, -0.025421142578125, -0.0151824951171875, -0.00494384765625, 0.0052947998046875, 0.015533447265625, 0.0257720947265625, 0.0360107421875, 0.0462493896484375, 0.056488037109375, 0.0667266845703125, 0.07696533203125, 0.0872039794921875, 0.097442626953125, 0.1076812744140625, 0.117919921875, 0.1281585693359375, 0.138397216796875, 0.1486358642578125, 0.15887451171875, 0.1691131591796875, 0.179351806640625, 0.1895904541015625, 0.1998291015625, 0.2100677490234375, 0.220306396484375, 0.2305450439453125, 0.24078369140625, 0.2510223388671875, 0.261260986328125, 0.2714996337890625, 0.28173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 11.0, 6.0, 10.0, 9.0, 25.0, 39.0, 47.0, 100.0, 219.0, 1693.0, 1439.0, 187.0, 105.0, 44.0, 42.0, 23.0, 15.0, 17.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.15771484375, -0.15345191955566406, -0.14918899536132812, -0.1449260711669922, -0.14066314697265625, -0.1364002227783203, -0.13213729858398438, -0.12787437438964844, -0.1236114501953125, -0.11934852600097656, -0.11508560180664062, -0.11082267761230469, -0.10655975341796875, -0.10229682922363281, -0.09803390502929688, -0.09377098083496094, -0.089508056640625, -0.08524513244628906, -0.08098220825195312, -0.07671928405761719, -0.07245635986328125, -0.06819343566894531, -0.06393051147460938, -0.05966758728027344, -0.0554046630859375, -0.05114173889160156, -0.046878814697265625, -0.04261589050292969, -0.03835296630859375, -0.03409004211425781, -0.029827117919921875, -0.025564193725585938, -0.02130126953125, -0.017038345336914062, -0.012775421142578125, -0.008512496948242188, -0.00424957275390625, 1.33514404296875e-05, 0.004276275634765625, 0.008539199829101562, 0.0128021240234375, 0.017065048217773438, 0.021327972412109375, 0.025590896606445312, 0.02985382080078125, 0.03411674499511719, 0.038379669189453125, 0.04264259338378906, 0.046905517578125, 0.05116844177246094, 0.055431365966796875, 0.05969429016113281, 0.06395721435546875, 0.06822013854980469, 0.07248306274414062, 0.07674598693847656, 0.0810089111328125, 0.08527183532714844, 0.08953475952148438, 0.09379768371582031, 0.09806060791015625, 0.10232353210449219, 0.10658645629882812, 0.11084938049316406, 0.1151123046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 22.0, 39.0, 81.0, 134.0, 171.0, 189.0, 135.0, 82.0, 53.0, 28.0, 21.0, 8.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8752933740615845, -0.8462796211242676, -0.8172658085823059, -0.788252055644989, -0.7592383027076721, -0.7302244901657104, -0.7012107372283936, -0.6721969842910767, -0.6431832313537598, -0.6141694784164429, -0.5851556658744812, -0.5561419129371643, -0.5271281599998474, -0.49811437726020813, -0.46910059452056885, -0.44008684158325195, -0.4110730290412903, -0.382059246301651, -0.3530454933643341, -0.3240317106246948, -0.29501795768737793, -0.26600417494773865, -0.23699039220809937, -0.20797662436962128, -0.1789628565311432, -0.1499490886926651, -0.12093531340360641, -0.09192153811454773, -0.06290777027606964, -0.03389400243759155, -0.0048802196979522705, 0.024133548140525818, 0.05314725637435913, 0.08216102421283722, 0.1111747995018959, 0.1401885747909546, 0.16920234262943268, 0.19821611046791077, 0.22722989320755005, 0.25624364614486694, 0.2852574288845062, 0.3142712116241455, 0.3432849645614624, 0.3722987473011017, 0.40131253004074097, 0.43032628297805786, 0.45934006571769714, 0.4883538484573364, 0.5173676013946533, 0.5463813543319702, 0.5753951668739319, 0.6044089198112488, 0.6334226727485657, 0.6624364852905273, 0.6914502382278442, 0.7204639911651611, 0.749477744102478, 0.7784914970397949, 0.8075053095817566, 0.8365190625190735, 0.8655328154563904, 0.894546627998352, 0.923560380935669, 0.9525741338729858, 0.9815879464149475]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 1.0, 6.0, 7.0, 10.0, 8.0, 15.0, 7.0, 16.0, 18.0, 22.0, 23.0, 25.0, 23.0, 31.0, 37.0, 50.0, 37.0, 38.0, 50.0, 48.0, 33.0, 56.0, 32.0, 38.0, 33.0, 42.0, 33.0, 34.0, 34.0, 31.0, 22.0, 16.0, 20.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2980915307998657, -0.2880476415157318, -0.2780037522315979, -0.267959862947464, -0.2579159736633301, -0.24787208437919617, -0.23782820999622345, -0.22778432071208954, -0.21774043142795563, -0.20769654214382172, -0.1976526528596878, -0.1876087635755539, -0.17756488919258118, -0.16752099990844727, -0.15747711062431335, -0.14743322134017944, -0.13738933205604553, -0.12734544277191162, -0.11730155348777771, -0.1072576716542244, -0.09721378237009048, -0.08716989308595657, -0.07712601125240326, -0.06708212196826935, -0.05703823268413544, -0.046994343400001526, -0.03695045784115791, -0.02690657041966915, -0.01686268299818039, -0.006818793714046478, 0.0032250918447971344, 0.013268977403640747, 0.023312866687774658, 0.03335675597190857, 0.04340064153075218, 0.053444527089595795, 0.0634884163737297, 0.07353230565786362, 0.08357618749141693, 0.09362007677555084, 0.10366396605968475, 0.11370785534381866, 0.12375174462795258, 0.1337956339120865, 0.1438395082950592, 0.15388339757919312, 0.16392728686332703, 0.17397117614746094, 0.18401506543159485, 0.19405895471572876, 0.20410284399986267, 0.21414673328399658, 0.2241906225681305, 0.2342345118522644, 0.24427838623523712, 0.2543222904205322, 0.26436614990234375, 0.27441003918647766, 0.2844539284706116, 0.2944978177547455, 0.3045417070388794, 0.3145855963230133, 0.3246294856071472, 0.33467334508895874, 0.34471726417541504]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 12.0, 15.0, 39.0, 45.0, 70.0, 122.0, 184.0, 309.0, 483.0, 878.0, 1368.0, 2508.0, 4486.0, 8517.0, 16076.0, 31159.0, 60061.0, 118426.0, 260561.0, 280306.0, 127671.0, 64308.0, 33176.0, 17360.0, 9053.0, 4754.0, 2757.0, 1527.0, 886.0, 503.0, 319.0, 196.0, 147.0, 99.0, 44.0, 30.0, 25.0, 13.0, 10.0, 9.0, 5.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1517333984375, -0.1466846466064453, -0.14163589477539062, -0.13658714294433594, -0.13153839111328125, -0.12648963928222656, -0.12144088745117188, -0.11639213562011719, -0.1113433837890625, -0.10629463195800781, -0.10124588012695312, -0.09619712829589844, -0.09114837646484375, -0.08609962463378906, -0.08105087280273438, -0.07600212097167969, -0.070953369140625, -0.06590461730957031, -0.060855865478515625, -0.05580711364746094, -0.05075836181640625, -0.04570960998535156, -0.040660858154296875, -0.03561210632324219, -0.0305633544921875, -0.025514602661132812, -0.020465850830078125, -0.015417098999023438, -0.01036834716796875, -0.0053195953369140625, -0.000270843505859375, 0.0047779083251953125, 0.00982666015625, 0.014875411987304688, 0.019924163818359375, 0.024972915649414062, 0.03002166748046875, 0.03507041931152344, 0.040119171142578125, 0.04516792297363281, 0.0502166748046875, 0.05526542663574219, 0.060314178466796875, 0.06536293029785156, 0.07041168212890625, 0.07546043395996094, 0.08050918579101562, 0.08555793762207031, 0.090606689453125, 0.09565544128417969, 0.10070419311523438, 0.10575294494628906, 0.11080169677734375, 0.11585044860839844, 0.12089920043945312, 0.1259479522705078, 0.1309967041015625, 0.1360454559326172, 0.14109420776367188, 0.14614295959472656, 0.15119171142578125, 0.15624046325683594, 0.16128921508789062, 0.1663379669189453, 0.17138671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 6.0, 9.0, 11.0, 18.0, 17.0, 23.0, 41.0, 44.0, 40.0, 42.0, 59.0, 55.0, 61.0, 53.0, 54.0, 54.0, 45.0, 57.0, 55.0, 41.0, 41.0, 37.0, 32.0, 23.0, 10.0, 6.0, 11.0, 8.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1025390625, -0.0994110107421875, -0.096282958984375, -0.0931549072265625, -0.09002685546875, -0.0868988037109375, -0.083770751953125, -0.0806427001953125, -0.0775146484375, -0.0743865966796875, -0.071258544921875, -0.0681304931640625, -0.06500244140625, -0.0618743896484375, -0.058746337890625, -0.0556182861328125, -0.052490234375, -0.0493621826171875, -0.046234130859375, -0.0431060791015625, -0.03997802734375, -0.0368499755859375, -0.033721923828125, -0.0305938720703125, -0.0274658203125, -0.0243377685546875, -0.021209716796875, -0.0180816650390625, -0.01495361328125, -0.0118255615234375, -0.008697509765625, -0.0055694580078125, -0.00244140625, 0.0006866455078125, 0.003814697265625, 0.0069427490234375, 0.01007080078125, 0.0131988525390625, 0.016326904296875, 0.0194549560546875, 0.0225830078125, 0.0257110595703125, 0.028839111328125, 0.0319671630859375, 0.03509521484375, 0.0382232666015625, 0.041351318359375, 0.0444793701171875, 0.047607421875, 0.0507354736328125, 0.053863525390625, 0.0569915771484375, 0.06011962890625, 0.0632476806640625, 0.066375732421875, 0.0695037841796875, 0.0726318359375, 0.0757598876953125, 0.078887939453125, 0.0820159912109375, 0.08514404296875, 0.0882720947265625, 0.091400146484375, 0.0945281982421875, 0.09765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 13.0, 17.0, 23.0, 39.0, 40.0, 59.0, 85.0, 119.0, 176.0, 245.0, 341.0, 578.0, 1024.0, 2045.0, 5511.0, 21816.0, 144577.0, 697602.0, 142365.0, 21538.0, 5594.0, 2016.0, 1026.0, 564.0, 343.0, 227.0, 169.0, 106.0, 86.0, 55.0, 52.0, 20.0, 22.0, 12.0, 10.0, 9.0, 10.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3662109375, -0.35527801513671875, -0.3443450927734375, -0.33341217041015625, -0.322479248046875, -0.31154632568359375, -0.3006134033203125, -0.28968048095703125, -0.27874755859375, -0.26781463623046875, -0.2568817138671875, -0.24594879150390625, -0.235015869140625, -0.22408294677734375, -0.2131500244140625, -0.20221710205078125, -0.1912841796875, -0.18035125732421875, -0.1694183349609375, -0.15848541259765625, -0.147552490234375, -0.13661956787109375, -0.1256866455078125, -0.11475372314453125, -0.10382080078125, -0.09288787841796875, -0.0819549560546875, -0.07102203369140625, -0.060089111328125, -0.04915618896484375, -0.0382232666015625, -0.02729034423828125, -0.016357421875, -0.00542449951171875, 0.0055084228515625, 0.01644134521484375, 0.027374267578125, 0.03830718994140625, 0.0492401123046875, 0.06017303466796875, 0.07110595703125, 0.08203887939453125, 0.0929718017578125, 0.10390472412109375, 0.114837646484375, 0.12577056884765625, 0.1367034912109375, 0.14763641357421875, 0.1585693359375, 0.16950225830078125, 0.1804351806640625, 0.19136810302734375, 0.202301025390625, 0.21323394775390625, 0.2241668701171875, 0.23509979248046875, 0.24603271484375, 0.25696563720703125, 0.2678985595703125, 0.27883148193359375, 0.289764404296875, 0.30069732666015625, 0.3116302490234375, 0.32256317138671875, 0.33349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 3.0, 8.0, 4.0, 10.0, 5.0, 14.0, 15.0, 17.0, 22.0, 18.0, 35.0, 23.0, 23.0, 27.0, 33.0, 46.0, 38.0, 48.0, 49.0, 50.0, 36.0, 51.0, 45.0, 38.0, 37.0, 33.0, 37.0, 30.0, 31.0, 16.0, 23.0, 19.0, 16.0, 20.0, 12.0, 11.0, 8.0, 6.0, 7.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.353759765625, -0.3442115783691406, -0.33466339111328125, -0.3251152038574219, -0.3155670166015625, -0.3060188293457031, -0.29647064208984375, -0.2869224548339844, -0.277374267578125, -0.2678260803222656, -0.25827789306640625, -0.24872970581054688, -0.2391815185546875, -0.22963333129882812, -0.22008514404296875, -0.21053695678710938, -0.20098876953125, -0.19144058227539062, -0.18189239501953125, -0.17234420776367188, -0.1627960205078125, -0.15324783325195312, -0.14369964599609375, -0.13415145874023438, -0.124603271484375, -0.11505508422851562, -0.10550689697265625, -0.09595870971679688, -0.0864105224609375, -0.07686233520507812, -0.06731414794921875, -0.057765960693359375, -0.0482177734375, -0.038669586181640625, -0.02912139892578125, -0.019573211669921875, -0.0100250244140625, -0.000476837158203125, 0.00907135009765625, 0.018619537353515625, 0.028167724609375, 0.037715911865234375, 0.04726409912109375, 0.056812286376953125, 0.0663604736328125, 0.07590866088867188, 0.08545684814453125, 0.09500503540039062, 0.10455322265625, 0.11410140991210938, 0.12364959716796875, 0.13319778442382812, 0.1427459716796875, 0.15229415893554688, 0.16184234619140625, 0.17139053344726562, 0.180938720703125, 0.19048690795898438, 0.20003509521484375, 0.20958328247070312, 0.2191314697265625, 0.22867965698242188, 0.23822784423828125, 0.24777603149414062, 0.25732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 7.0, 10.0, 5.0, 11.0, 16.0, 27.0, 54.0, 69.0, 99.0, 183.0, 353.0, 607.0, 1377.0, 3453.0, 10586.0, 44298.0, 245307.0, 583104.0, 123507.0, 24281.0, 6621.0, 2413.0, 1029.0, 491.0, 257.0, 134.0, 94.0, 55.0, 28.0, 24.0, 11.0, 10.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.09561920166015625, -0.0921173095703125, -0.08861541748046875, -0.085113525390625, -0.08161163330078125, -0.0781097412109375, -0.07460784912109375, -0.07110595703125, -0.06760406494140625, -0.0641021728515625, -0.06060028076171875, -0.057098388671875, -0.05359649658203125, -0.0500946044921875, -0.04659271240234375, -0.0430908203125, -0.03958892822265625, -0.0360870361328125, -0.03258514404296875, -0.029083251953125, -0.02558135986328125, -0.0220794677734375, -0.01857757568359375, -0.01507568359375, -0.01157379150390625, -0.0080718994140625, -0.00457000732421875, -0.001068115234375, 0.00243377685546875, 0.0059356689453125, 0.00943756103515625, 0.012939453125, 0.01644134521484375, 0.0199432373046875, 0.02344512939453125, 0.026947021484375, 0.03044891357421875, 0.0339508056640625, 0.03745269775390625, 0.04095458984375, 0.04445648193359375, 0.0479583740234375, 0.05146026611328125, 0.054962158203125, 0.05846405029296875, 0.0619659423828125, 0.06546783447265625, 0.0689697265625, 0.07247161865234375, 0.0759735107421875, 0.07947540283203125, 0.082977294921875, 0.08647918701171875, 0.0899810791015625, 0.09348297119140625, 0.09698486328125, 0.10048675537109375, 0.1039886474609375, 0.10749053955078125, 0.110992431640625, 0.11449432373046875, 0.1179962158203125, 0.12149810791015625, 0.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 12.0, 10.0, 14.0, 19.0, 21.0, 24.0, 30.0, 42.0, 32.0, 49.0, 54.0, 81.0, 92.0, 106.0, 88.0, 77.0, 38.0, 38.0, 29.0, 28.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 10.0, 11.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.011392593383789e-05, -3.8504600524902344e-05, -3.68952751159668e-05, -3.528594970703125e-05, -3.36766242980957e-05, -3.2067298889160156e-05, -3.045797348022461e-05, -2.8848648071289062e-05, -2.7239322662353516e-05, -2.562999725341797e-05, -2.4020671844482422e-05, -2.2411346435546875e-05, -2.0802021026611328e-05, -1.919269561767578e-05, -1.7583370208740234e-05, -1.5974044799804688e-05, -1.436471939086914e-05, -1.2755393981933594e-05, -1.1146068572998047e-05, -9.5367431640625e-06, -7.927417755126953e-06, -6.318092346191406e-06, -4.708766937255859e-06, -3.0994415283203125e-06, -1.4901161193847656e-06, 1.1920928955078125e-07, 1.7285346984863281e-06, 3.337860107421875e-06, 4.947185516357422e-06, 6.556510925292969e-06, 8.165836334228516e-06, 9.775161743164062e-06, 1.138448715209961e-05, 1.2993812561035156e-05, 1.4603137969970703e-05, 1.621246337890625e-05, 1.7821788787841797e-05, 1.9431114196777344e-05, 2.104043960571289e-05, 2.2649765014648438e-05, 2.4259090423583984e-05, 2.586841583251953e-05, 2.7477741241455078e-05, 2.9087066650390625e-05, 3.069639205932617e-05, 3.230571746826172e-05, 3.3915042877197266e-05, 3.552436828613281e-05, 3.713369369506836e-05, 3.8743019104003906e-05, 4.035234451293945e-05, 4.1961669921875e-05, 4.357099533081055e-05, 4.5180320739746094e-05, 4.678964614868164e-05, 4.839897155761719e-05, 5.0008296966552734e-05, 5.161762237548828e-05, 5.322694778442383e-05, 5.4836273193359375e-05, 5.644559860229492e-05, 5.805492401123047e-05, 5.9664249420166016e-05, 6.127357482910156e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 5.0, 12.0, 11.0, 21.0, 24.0, 27.0, 38.0, 60.0, 92.0, 129.0, 246.0, 351.0, 591.0, 1218.0, 2578.0, 6460.0, 22617.0, 114802.0, 552775.0, 279469.0, 47639.0, 11485.0, 3987.0, 1745.0, 871.0, 481.0, 287.0, 179.0, 100.0, 71.0, 55.0, 34.0, 25.0, 17.0, 10.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10421562194824219, -0.10082626342773438, -0.09743690490722656, -0.09404754638671875, -0.09065818786621094, -0.08726882934570312, -0.08387947082519531, -0.0804901123046875, -0.07710075378417969, -0.07371139526367188, -0.07032203674316406, -0.06693267822265625, -0.06354331970214844, -0.060153961181640625, -0.05676460266113281, -0.053375244140625, -0.04998588562011719, -0.046596527099609375, -0.04320716857910156, -0.03981781005859375, -0.03642845153808594, -0.033039093017578125, -0.029649734497070312, -0.0262603759765625, -0.022871017456054688, -0.019481658935546875, -0.016092300415039062, -0.01270294189453125, -0.009313583374023438, -0.005924224853515625, -0.0025348663330078125, 0.0008544921875, 0.0042438507080078125, 0.007633209228515625, 0.011022567749023438, 0.01441192626953125, 0.017801284790039062, 0.021190643310546875, 0.024580001831054688, 0.0279693603515625, 0.03135871887207031, 0.034748077392578125, 0.03813743591308594, 0.04152679443359375, 0.04491615295410156, 0.048305511474609375, 0.05169486999511719, 0.055084228515625, 0.05847358703613281, 0.061862945556640625, 0.06525230407714844, 0.06864166259765625, 0.07203102111816406, 0.07542037963867188, 0.07880973815917969, 0.0821990966796875, 0.08558845520019531, 0.08897781372070312, 0.09236717224121094, 0.09575653076171875, 0.09914588928222656, 0.10253524780273438, 0.10592460632324219, 0.10931396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 7.0, 7.0, 13.0, 14.0, 11.0, 15.0, 22.0, 25.0, 27.0, 29.0, 38.0, 47.0, 59.0, 46.0, 64.0, 72.0, 58.0, 55.0, 69.0, 46.0, 42.0, 43.0, 26.0, 28.0, 15.0, 18.0, 10.0, 14.0, 14.0, 7.0, 7.0, 13.0, 7.0, 1.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08392047882080078, -0.08135414123535156, -0.07878780364990234, -0.07622146606445312, -0.0736551284790039, -0.07108879089355469, -0.06852245330810547, -0.06595611572265625, -0.06338977813720703, -0.06082344055175781, -0.058257102966308594, -0.055690765380859375, -0.053124427795410156, -0.05055809020996094, -0.04799175262451172, -0.0454254150390625, -0.04285907745361328, -0.04029273986816406, -0.037726402282714844, -0.035160064697265625, -0.032593727111816406, -0.030027389526367188, -0.02746105194091797, -0.02489471435546875, -0.02232837677001953, -0.019762039184570312, -0.017195701599121094, -0.014629364013671875, -0.012063026428222656, -0.009496688842773438, -0.006930351257324219, -0.004364013671875, -0.0017976760864257812, 0.0007686614990234375, 0.0033349990844726562, 0.005901336669921875, 0.008467674255371094, 0.011034011840820312, 0.013600349426269531, 0.01616668701171875, 0.01873302459716797, 0.021299362182617188, 0.023865699768066406, 0.026432037353515625, 0.028998374938964844, 0.03156471252441406, 0.03413105010986328, 0.0366973876953125, 0.03926372528076172, 0.04183006286621094, 0.044396400451660156, 0.046962738037109375, 0.049529075622558594, 0.05209541320800781, 0.05466175079345703, 0.05722808837890625, 0.05979442596435547, 0.06236076354980469, 0.0649271011352539, 0.06749343872070312, 0.07005977630615234, 0.07262611389160156, 0.07519245147705078, 0.0777587890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 8.0, 23.0, 27.0, 46.0, 70.0, 89.0, 101.0, 112.0, 122.0, 113.0, 73.0, 66.0, 59.0, 36.0, 13.0, 15.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1587326526641846, -2.1010186672210693, -2.043304920196533, -1.985590934753418, -1.9278769493103027, -1.870163083076477, -1.8124492168426514, -1.7547352313995361, -1.6970213651657104, -1.6393074989318848, -1.5815935134887695, -1.5238796472549438, -1.4661657810211182, -1.408451795578003, -1.3507379293441772, -1.2930240631103516, -1.2353100776672363, -1.1775962114334106, -1.1198822259902954, -1.0621683597564697, -1.0044543743133545, -0.9467405080795288, -0.8890266418457031, -0.8313127160072327, -0.7735987901687622, -0.7158848643302917, -0.6581709384918213, -0.6004570722579956, -0.5427431464195251, -0.4850292205810547, -0.4273153245449066, -0.36960142850875854, -0.3118875026702881, -0.2541735768318176, -0.19645968079566956, -0.1387457698583603, -0.08103185892105103, -0.023317933082580566, 0.034395962953567505, 0.09210985898971558, 0.14982378482818604, 0.2075376957654953, 0.26525160670280457, 0.32296550273895264, 0.3806794285774231, 0.43839335441589355, 0.4961072504520416, 0.5538211464881897, 0.6115350723266602, 0.6692489981651306, 0.7269629240036011, 0.7846767902374268, 0.8423907160758972, 0.9001046419143677, 0.9578185081481934, 1.0155324935913086, 1.0732463598251343, 1.13096022605896, 1.1886742115020752, 1.2463880777359009, 1.3041019439697266, 1.3618159294128418, 1.4195297956466675, 1.4772436618804932, 1.5349576473236084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 15.0, 17.0, 7.0, 28.0, 17.0, 14.0, 22.0, 20.0, 33.0, 35.0, 39.0, 26.0, 39.0, 39.0, 38.0, 44.0, 50.0, 63.0, 52.0, 47.0, 52.0, 34.0, 31.0, 27.0, 34.0, 26.0, 18.0, 24.0, 13.0, 13.0, 13.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.6132254600524902, -1.5671130418777466, -1.521000623703003, -1.4748882055282593, -1.4287757873535156, -1.382663369178772, -1.3365509510040283, -1.2904385328292847, -1.244326114654541, -1.1982136964797974, -1.1521012783050537, -1.10598886013031, -1.0598764419555664, -1.0137640237808228, -0.9676516056060791, -0.9215391874313354, -0.875426709651947, -0.8293142914772034, -0.7832018733024597, -0.7370894551277161, -0.6909770369529724, -0.6448646187782288, -0.5987521409988403, -0.5526397228240967, -0.506527304649353, -0.4604148864746094, -0.4143024682998657, -0.36819005012512207, -0.3220776319503784, -0.27596521377563477, -0.22985276579856873, -0.18374034762382507, -0.1376279592514038, -0.09151554107666016, -0.04540311545133591, 0.0007093101739883423, 0.046821728348731995, 0.09293414652347565, 0.1390465795993805, 0.18515899777412415, 0.2312714159488678, 0.27738383412361145, 0.3234962522983551, 0.36960870027542114, 0.4157211184501648, 0.46183353662490845, 0.5079459547996521, 0.5540583729743958, 0.6001707911491394, 0.6462832093238831, 0.6923956274986267, 0.7385080456733704, 0.784620463848114, 0.8307328820228577, 0.8768453598022461, 0.9229577779769897, 0.9690701961517334, 1.015182614326477, 1.0612950325012207, 1.1074074506759644, 1.153519868850708, 1.1996322870254517, 1.2457447052001953, 1.291857123374939, 1.3379695415496826]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 19.0, 15.0, 31.0, 31.0, 51.0, 84.0, 134.0, 171.0, 278.0, 441.0, 699.0, 1093.0, 1910.0, 3375.0, 6021.0, 11704.0, 24240.0, 57194.0, 169165.0, 870389.0, 2393611.0, 457601.0, 112879.0, 42571.0, 19292.0, 9385.0, 4877.0, 2824.0, 1565.0, 947.0, 571.0, 415.0, 228.0, 153.0, 114.0, 60.0, 49.0, 20.0, 21.0, 17.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1444091796875, -0.14043426513671875, -0.1364593505859375, -0.13248443603515625, -0.128509521484375, -0.12453460693359375, -0.1205596923828125, -0.11658477783203125, -0.11260986328125, -0.10863494873046875, -0.1046600341796875, -0.10068511962890625, -0.096710205078125, -0.09273529052734375, -0.0887603759765625, -0.08478546142578125, -0.080810546875, -0.07683563232421875, -0.0728607177734375, -0.06888580322265625, -0.064910888671875, -0.06093597412109375, -0.0569610595703125, -0.05298614501953125, -0.04901123046875, -0.04503631591796875, -0.0410614013671875, -0.03708648681640625, -0.033111572265625, -0.02913665771484375, -0.0251617431640625, -0.02118682861328125, -0.0172119140625, -0.01323699951171875, -0.0092620849609375, -0.00528717041015625, -0.001312255859375, 0.00266265869140625, 0.0066375732421875, 0.01061248779296875, 0.01458740234375, 0.01856231689453125, 0.0225372314453125, 0.02651214599609375, 0.030487060546875, 0.03446197509765625, 0.0384368896484375, 0.04241180419921875, 0.04638671875, 0.05036163330078125, 0.0543365478515625, 0.05831146240234375, 0.062286376953125, 0.06626129150390625, 0.0702362060546875, 0.07421112060546875, 0.07818603515625, 0.08216094970703125, 0.0861358642578125, 0.09011077880859375, 0.094085693359375, 0.09806060791015625, 0.1020355224609375, 0.10601043701171875, 0.1099853515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 11.0, 11.0, 10.0, 11.0, 21.0, 23.0, 25.0, 27.0, 33.0, 33.0, 36.0, 52.0, 44.0, 53.0, 34.0, 55.0, 59.0, 48.0, 49.0, 45.0, 50.0, 34.0, 41.0, 42.0, 24.0, 27.0, 21.0, 20.0, 10.0, 8.0, 10.0, 8.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08941650390625, -0.08683586120605469, -0.08425521850585938, -0.08167457580566406, -0.07909393310546875, -0.07651329040527344, -0.07393264770507812, -0.07135200500488281, -0.0687713623046875, -0.06619071960449219, -0.06361007690429688, -0.06102943420410156, -0.05844879150390625, -0.05586814880371094, -0.053287506103515625, -0.05070686340332031, -0.048126220703125, -0.04554557800292969, -0.042964935302734375, -0.04038429260253906, -0.03780364990234375, -0.03522300720214844, -0.032642364501953125, -0.030061721801757812, -0.0274810791015625, -0.024900436401367188, -0.022319793701171875, -0.019739151000976562, -0.01715850830078125, -0.014577865600585938, -0.011997222900390625, -0.009416580200195312, -0.0068359375, -0.0042552947998046875, -0.001674652099609375, 0.0009059906005859375, 0.00348663330078125, 0.0060672760009765625, 0.008647918701171875, 0.011228561401367188, 0.0138092041015625, 0.016389846801757812, 0.018970489501953125, 0.021551132202148438, 0.02413177490234375, 0.026712417602539062, 0.029293060302734375, 0.03187370300292969, 0.034454345703125, 0.03703498840332031, 0.039615631103515625, 0.04219627380371094, 0.04477691650390625, 0.04735755920410156, 0.049938201904296875, 0.05251884460449219, 0.0550994873046875, 0.05768013000488281, 0.060260772705078125, 0.06284141540527344, 0.06542205810546875, 0.06800270080566406, 0.07058334350585938, 0.07316398620605469, 0.07574462890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 11.0, 18.0, 32.0, 68.0, 106.0, 235.0, 465.0, 1210.0, 3830.0, 14412.0, 82426.0, 1843647.0, 2137188.0, 89002.0, 15426.0, 3944.0, 1287.0, 491.0, 244.0, 100.0, 61.0, 21.0, 20.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24352264404296875, -0.2333831787109375, -0.22324371337890625, -0.213104248046875, -0.20296478271484375, -0.1928253173828125, -0.18268585205078125, -0.17254638671875, -0.16240692138671875, -0.1522674560546875, -0.14212799072265625, -0.131988525390625, -0.12184906005859375, -0.1117095947265625, -0.10157012939453125, -0.0914306640625, -0.08129119873046875, -0.0711517333984375, -0.06101226806640625, -0.050872802734375, -0.04073333740234375, -0.0305938720703125, -0.02045440673828125, -0.01031494140625, -0.00017547607421875, 0.0099639892578125, 0.02010345458984375, 0.030242919921875, 0.04038238525390625, 0.0505218505859375, 0.06066131591796875, 0.07080078125, 0.08094024658203125, 0.0910797119140625, 0.10121917724609375, 0.111358642578125, 0.12149810791015625, 0.1316375732421875, 0.14177703857421875, 0.15191650390625, 0.16205596923828125, 0.1721954345703125, 0.18233489990234375, 0.192474365234375, 0.20261383056640625, 0.2127532958984375, 0.22289276123046875, 0.2330322265625, 0.24317169189453125, 0.2533111572265625, 0.26345062255859375, 0.273590087890625, 0.28372955322265625, 0.2938690185546875, 0.30400848388671875, 0.31414794921875, 0.32428741455078125, 0.3344268798828125, 0.34456634521484375, 0.354705810546875, 0.36484527587890625, 0.3749847412109375, 0.38512420654296875, 0.395263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 8.0, 9.0, 13.0, 16.0, 18.0, 31.0, 51.0, 55.0, 84.0, 124.0, 237.0, 414.0, 753.0, 916.0, 525.0, 287.0, 160.0, 100.0, 65.0, 60.0, 40.0, 22.0, 17.0, 12.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31787109375, -0.3095550537109375, -0.301239013671875, -0.2929229736328125, -0.28460693359375, -0.2762908935546875, -0.267974853515625, -0.2596588134765625, -0.2513427734375, -0.2430267333984375, -0.234710693359375, -0.2263946533203125, -0.21807861328125, -0.2097625732421875, -0.201446533203125, -0.1931304931640625, -0.184814453125, -0.1764984130859375, -0.168182373046875, -0.1598663330078125, -0.15155029296875, -0.1432342529296875, -0.134918212890625, -0.1266021728515625, -0.1182861328125, -0.1099700927734375, -0.101654052734375, -0.0933380126953125, -0.08502197265625, -0.0767059326171875, -0.068389892578125, -0.0600738525390625, -0.0517578125, -0.0434417724609375, -0.035125732421875, -0.0268096923828125, -0.01849365234375, -0.0101776123046875, -0.001861572265625, 0.0064544677734375, 0.0147705078125, 0.0230865478515625, 0.031402587890625, 0.0397186279296875, 0.04803466796875, 0.0563507080078125, 0.064666748046875, 0.0729827880859375, 0.081298828125, 0.0896148681640625, 0.097930908203125, 0.1062469482421875, 0.11456298828125, 0.1228790283203125, 0.131195068359375, 0.1395111083984375, 0.1478271484375, 0.1561431884765625, 0.164459228515625, 0.1727752685546875, 0.18109130859375, 0.1894073486328125, 0.197723388671875, 0.2060394287109375, 0.21435546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 10.0, 22.0, 41.0, 91.0, 153.0, 227.0, 204.0, 123.0, 64.0, 30.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.057502746582031, -3.955089569091797, -3.8526766300201416, -3.7502634525299072, -3.647850513458252, -3.5454373359680176, -3.443024158477783, -3.340611219406128, -3.2381982803344727, -3.1357851028442383, -3.033372163772583, -2.9309589862823486, -2.8285460472106934, -2.726132869720459, -2.6237196922302246, -2.5213067531585693, -2.418893575668335, -2.3164803981781006, -2.2140674591064453, -2.111654281616211, -2.0092413425445557, -1.9068281650543213, -1.8044151067733765, -1.7020020484924316, -1.5995889902114868, -1.497175931930542, -1.3947628736495972, -1.2923498153686523, -1.189936637878418, -1.0875236988067627, -0.9851105213165283, -0.8826974630355835, -0.7802846431732178, -0.677871584892273, -0.5754585266113281, -0.4730454087257385, -0.3706323504447937, -0.2682192921638489, -0.16580617427825928, -0.06339311599731445, 0.03901994228363037, 0.1414330154657364, 0.2438460886478424, 0.3462591767311096, 0.44867223501205444, 0.5510852932929993, 0.6534984111785889, 0.7559114694595337, 0.8583245277404785, 0.9607375860214233, 1.0631506443023682, 1.1655638217926025, 1.2679767608642578, 1.3703899383544922, 1.472802996635437, 1.5752160549163818, 1.6776291131973267, 1.7800421714782715, 1.8824552297592163, 1.9848682880401611, 2.0872814655303955, 2.189694404602051, 2.292107582092285, 2.3945207595825195, 2.496933698654175]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 12.0, 19.0, 19.0, 24.0, 31.0, 30.0, 36.0, 40.0, 53.0, 43.0, 41.0, 62.0, 49.0, 47.0, 44.0, 44.0, 51.0, 49.0, 40.0, 42.0, 26.0, 21.0, 25.0, 15.0, 21.0, 16.0, 13.0, 12.0, 10.0, 5.0, 5.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0209617614746094, -0.9830405712127686, -0.9451194405555725, -0.9071983098983765, -0.8692771196365356, -0.8313559293746948, -0.7934347987174988, -0.7555136680603027, -0.7175924777984619, -0.6796712875366211, -0.641750156879425, -0.603829026222229, -0.5659078359603882, -0.5279866456985474, -0.4900655150413513, -0.4521443545818329, -0.41422319412231445, -0.376302033662796, -0.3383808732032776, -0.30045971274375916, -0.2625385522842407, -0.2246173918247223, -0.18669623136520386, -0.14877507090568542, -0.11085391044616699, -0.07293274998664856, -0.03501158952713013, 0.0029095709323883057, 0.04083073139190674, 0.07875189185142517, 0.1166730523109436, 0.15459421277046204, 0.19251549243927002, 0.23043665289878845, 0.2683578133583069, 0.3062789738178253, 0.34420013427734375, 0.3821212947368622, 0.4200424551963806, 0.45796361565589905, 0.4958847761154175, 0.5338059663772583, 0.5717270970344543, 0.6096482276916504, 0.6475694179534912, 0.685490608215332, 0.7234117388725281, 0.7613328695297241, 0.7992540597915649, 0.8371752500534058, 0.8750963807106018, 0.9130175113677979, 0.9509387016296387, 0.9888598918914795, 1.0267810821533203, 1.0647021532058716, 1.1026233434677124, 1.1405445337295532, 1.1784656047821045, 1.2163867950439453, 1.2543079853057861, 1.292229175567627, 1.3301503658294678, 1.368071436882019, 1.4059926271438599]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 15.0, 19.0, 43.0, 55.0, 63.0, 106.0, 166.0, 310.0, 464.0, 828.0, 1421.0, 2354.0, 4300.0, 8438.0, 16758.0, 36360.0, 89450.0, 340543.0, 372984.0, 97999.0, 38450.0, 17802.0, 8952.0, 4591.0, 2545.0, 1381.0, 824.0, 487.0, 301.0, 181.0, 130.0, 74.0, 49.0, 37.0, 27.0, 16.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185791015625, -0.17916488647460938, -0.17253875732421875, -0.16591262817382812, -0.1592864990234375, -0.15266036987304688, -0.14603424072265625, -0.13940811157226562, -0.132781982421875, -0.12615585327148438, -0.11952972412109375, -0.11290359497070312, -0.1062774658203125, -0.09965133666992188, -0.09302520751953125, -0.08639907836914062, -0.07977294921875, -0.07314682006835938, -0.06652069091796875, -0.059894561767578125, -0.0532684326171875, -0.046642303466796875, -0.04001617431640625, -0.033390045166015625, -0.026763916015625, -0.020137786865234375, -0.01351165771484375, -0.006885528564453125, -0.0002593994140625, 0.006366729736328125, 0.01299285888671875, 0.019618988037109375, 0.0262451171875, 0.032871246337890625, 0.03949737548828125, 0.046123504638671875, 0.0527496337890625, 0.059375762939453125, 0.06600189208984375, 0.07262802124023438, 0.079254150390625, 0.08588027954101562, 0.09250640869140625, 0.09913253784179688, 0.1057586669921875, 0.11238479614257812, 0.11901092529296875, 0.12563705444335938, 0.13226318359375, 0.13888931274414062, 0.14551544189453125, 0.15214157104492188, 0.1587677001953125, 0.16539382934570312, 0.17201995849609375, 0.17864608764648438, 0.185272216796875, 0.19189834594726562, 0.19852447509765625, 0.20515060424804688, 0.2117767333984375, 0.21840286254882812, 0.22502899169921875, 0.23165512084960938, 0.23828125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 10.0, 18.0, 16.0, 19.0, 31.0, 45.0, 43.0, 48.0, 48.0, 60.0, 63.0, 65.0, 55.0, 48.0, 54.0, 51.0, 52.0, 46.0, 41.0, 35.0, 31.0, 29.0, 23.0, 13.0, 8.0, 9.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07561111450195312, -0.07236480712890625, -0.06911849975585938, -0.0658721923828125, -0.06262588500976562, -0.05937957763671875, -0.056133270263671875, -0.052886962890625, -0.049640655517578125, -0.04639434814453125, -0.043148040771484375, -0.0399017333984375, -0.036655426025390625, -0.03340911865234375, -0.030162811279296875, -0.02691650390625, -0.023670196533203125, -0.02042388916015625, -0.017177581787109375, -0.0139312744140625, -0.010684967041015625, -0.00743865966796875, -0.004192352294921875, -0.000946044921875, 0.002300262451171875, 0.00554656982421875, 0.008792877197265625, 0.0120391845703125, 0.015285491943359375, 0.01853179931640625, 0.021778106689453125, 0.0250244140625, 0.028270721435546875, 0.03151702880859375, 0.034763336181640625, 0.0380096435546875, 0.041255950927734375, 0.04450225830078125, 0.047748565673828125, 0.050994873046875, 0.054241180419921875, 0.05748748779296875, 0.060733795166015625, 0.0639801025390625, 0.06722640991210938, 0.07047271728515625, 0.07371902465820312, 0.07696533203125, 0.08021163940429688, 0.08345794677734375, 0.08670425415039062, 0.0899505615234375, 0.09319686889648438, 0.09644317626953125, 0.09968948364257812, 0.102935791015625, 0.10618209838867188, 0.10942840576171875, 0.11267471313476562, 0.1159210205078125, 0.11916732788085938, 0.12241363525390625, 0.12565994262695312, 0.12890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 8.0, 20.0, 20.0, 42.0, 40.0, 72.0, 102.0, 135.0, 227.0, 390.0, 734.0, 1486.0, 4025.0, 15862.0, 128579.0, 822866.0, 58631.0, 9690.0, 2849.0, 1238.0, 608.0, 329.0, 215.0, 109.0, 77.0, 57.0, 38.0, 25.0, 13.0, 19.0, 12.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3471870422363281, -0.33231353759765625, -0.3174400329589844, -0.3025665283203125, -0.2876930236816406, -0.27281951904296875, -0.2579460144042969, -0.243072509765625, -0.22819900512695312, -0.21332550048828125, -0.19845199584960938, -0.1835784912109375, -0.16870498657226562, -0.15383148193359375, -0.13895797729492188, -0.12408447265625, -0.10921096801757812, -0.09433746337890625, -0.07946395874023438, -0.0645904541015625, -0.049716949462890625, -0.03484344482421875, -0.019969940185546875, -0.005096435546875, 0.009777069091796875, 0.02465057373046875, 0.039524078369140625, 0.0543975830078125, 0.06927108764648438, 0.08414459228515625, 0.09901809692382812, 0.1138916015625, 0.12876510620117188, 0.14363861083984375, 0.15851211547851562, 0.1733856201171875, 0.18825912475585938, 0.20313262939453125, 0.21800613403320312, 0.232879638671875, 0.24775314331054688, 0.26262664794921875, 0.2775001525878906, 0.2923736572265625, 0.3072471618652344, 0.32212066650390625, 0.3369941711425781, 0.35186767578125, 0.3667411804199219, 0.38161468505859375, 0.3964881896972656, 0.4113616943359375, 0.4262351989746094, 0.44110870361328125, 0.4559822082519531, 0.470855712890625, 0.4857292175292969, 0.5006027221679688, 0.5154762268066406, 0.5303497314453125, 0.5452232360839844, 0.5600967407226562, 0.5749702453613281, 0.58984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 4.0, 12.0, 12.0, 14.0, 21.0, 33.0, 28.0, 34.0, 36.0, 53.0, 52.0, 55.0, 63.0, 63.0, 71.0, 51.0, 59.0, 63.0, 64.0, 43.0, 31.0, 35.0, 20.0, 16.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3700599670410156, -0.35462188720703125, -0.3391838073730469, -0.3237457275390625, -0.3083076477050781, -0.29286956787109375, -0.2774314880371094, -0.261993408203125, -0.24655532836914062, -0.23111724853515625, -0.21567916870117188, -0.2002410888671875, -0.18480300903320312, -0.16936492919921875, -0.15392684936523438, -0.13848876953125, -0.12305068969726562, -0.10761260986328125, -0.09217453002929688, -0.0767364501953125, -0.061298370361328125, -0.04586029052734375, -0.030422210693359375, -0.014984130859375, 0.000453948974609375, 0.01589202880859375, 0.031330108642578125, 0.0467681884765625, 0.062206268310546875, 0.07764434814453125, 0.09308242797851562, 0.1085205078125, 0.12395858764648438, 0.13939666748046875, 0.15483474731445312, 0.1702728271484375, 0.18571090698242188, 0.20114898681640625, 0.21658706665039062, 0.232025146484375, 0.24746322631835938, 0.26290130615234375, 0.2783393859863281, 0.2937774658203125, 0.3092155456542969, 0.32465362548828125, 0.3400917053222656, 0.35552978515625, 0.3709678649902344, 0.38640594482421875, 0.4018440246582031, 0.4172821044921875, 0.4327201843261719, 0.44815826416015625, 0.4635963439941406, 0.479034423828125, 0.4944725036621094, 0.5099105834960938, 0.5253486633300781, 0.5407867431640625, 0.5562248229980469, 0.5716629028320312, 0.5871009826660156, 0.6025390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 11.0, 4.0, 15.0, 19.0, 44.0, 79.0, 113.0, 262.0, 680.0, 1761.0, 7357.0, 48873.0, 796162.0, 170779.0, 17231.0, 3375.0, 999.0, 353.0, 199.0, 87.0, 56.0, 32.0, 21.0, 15.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.2087993621826172, -0.20177841186523438, -0.19475746154785156, -0.18773651123046875, -0.18071556091308594, -0.17369461059570312, -0.1666736602783203, -0.1596527099609375, -0.1526317596435547, -0.14561080932617188, -0.13858985900878906, -0.13156890869140625, -0.12454795837402344, -0.11752700805664062, -0.11050605773925781, -0.103485107421875, -0.09646415710449219, -0.08944320678710938, -0.08242225646972656, -0.07540130615234375, -0.06838035583496094, -0.061359405517578125, -0.05433845520019531, -0.0473175048828125, -0.04029655456542969, -0.033275604248046875, -0.026254653930664062, -0.01923370361328125, -0.012212753295898438, -0.005191802978515625, 0.0018291473388671875, 0.00885009765625, 0.015871047973632812, 0.022891998291015625, 0.029912948608398438, 0.03693389892578125, 0.04395484924316406, 0.050975799560546875, 0.05799674987792969, 0.0650177001953125, 0.07203865051269531, 0.07905960083007812, 0.08608055114746094, 0.09310150146484375, 0.10012245178222656, 0.10714340209960938, 0.11416435241699219, 0.121185302734375, 0.1282062530517578, 0.13522720336914062, 0.14224815368652344, 0.14926910400390625, 0.15629005432128906, 0.16331100463867188, 0.1703319549560547, 0.1773529052734375, 0.1843738555908203, 0.19139480590820312, 0.19841575622558594, 0.20543670654296875, 0.21245765686035156, 0.21947860717773438, 0.2264995574951172, 0.2335205078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 11.0, 17.0, 29.0, 44.0, 37.0, 68.0, 103.0, 135.0, 115.0, 106.0, 76.0, 63.0, 38.0, 27.0, 20.0, 15.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.349252700805664e-05, -7.15227797627449e-05, -6.955303251743317e-05, -6.758328527212143e-05, -6.561353802680969e-05, -6.364379078149796e-05, -6.167404353618622e-05, -5.970429629087448e-05, -5.7734549045562744e-05, -5.576480180025101e-05, -5.379505455493927e-05, -5.182530730962753e-05, -4.9855560064315796e-05, -4.788581281900406e-05, -4.591606557369232e-05, -4.3946318328380585e-05, -4.197657108306885e-05, -4.000682383775711e-05, -3.8037076592445374e-05, -3.6067329347133636e-05, -3.40975821018219e-05, -3.212783485651016e-05, -3.0158087611198425e-05, -2.8188340365886688e-05, -2.621859312057495e-05, -2.4248845875263214e-05, -2.2279098629951477e-05, -2.030935138463974e-05, -1.8339604139328003e-05, -1.6369856894016266e-05, -1.4400109648704529e-05, -1.2430362403392792e-05, -1.0460615158081055e-05, -8.490867912769318e-06, -6.5211206674575806e-06, -4.5513734221458435e-06, -2.5816261768341064e-06, -6.118789315223694e-07, 1.3578683137893677e-06, 3.3276155591011047e-06, 5.297362804412842e-06, 7.267110049724579e-06, 9.236857295036316e-06, 1.1206604540348053e-05, 1.317635178565979e-05, 1.5146099030971527e-05, 1.7115846276283264e-05, 1.9085593521595e-05, 2.1055340766906738e-05, 2.3025088012218475e-05, 2.4994835257530212e-05, 2.696458250284195e-05, 2.8934329748153687e-05, 3.0904076993465424e-05, 3.287382423877716e-05, 3.48435714840889e-05, 3.6813318729400635e-05, 3.878306597471237e-05, 4.075281322002411e-05, 4.2722560465335846e-05, 4.469230771064758e-05, 4.666205495595932e-05, 4.863180220127106e-05, 5.0601549446582794e-05, 5.257129669189453e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 6.0, 12.0, 14.0, 18.0, 33.0, 34.0, 52.0, 86.0, 115.0, 176.0, 279.0, 542.0, 1003.0, 2214.0, 5789.0, 21296.0, 139227.0, 743651.0, 106656.0, 18010.0, 5080.0, 1985.0, 928.0, 480.0, 288.0, 192.0, 120.0, 79.0, 52.0, 38.0, 23.0, 14.0, 13.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.159393310546875, -0.15447998046875, -0.149566650390625, -0.1446533203125, -0.139739990234375, -0.13482666015625, -0.129913330078125, -0.125, -0.120086669921875, -0.11517333984375, -0.110260009765625, -0.1053466796875, -0.100433349609375, -0.09552001953125, -0.090606689453125, -0.085693359375, -0.080780029296875, -0.07586669921875, -0.070953369140625, -0.0660400390625, -0.061126708984375, -0.05621337890625, -0.051300048828125, -0.04638671875, -0.041473388671875, -0.03656005859375, -0.031646728515625, -0.0267333984375, -0.021820068359375, -0.01690673828125, -0.011993408203125, -0.007080078125, -0.002166748046875, 0.00274658203125, 0.007659912109375, 0.0125732421875, 0.017486572265625, 0.02239990234375, 0.027313232421875, 0.0322265625, 0.037139892578125, 0.04205322265625, 0.046966552734375, 0.0518798828125, 0.056793212890625, 0.06170654296875, 0.066619873046875, 0.071533203125, 0.076446533203125, 0.08135986328125, 0.086273193359375, 0.0911865234375, 0.096099853515625, 0.10101318359375, 0.105926513671875, 0.11083984375, 0.115753173828125, 0.12066650390625, 0.125579833984375, 0.1304931640625, 0.135406494140625, 0.14031982421875, 0.145233154296875, 0.150146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 10.0, 14.0, 12.0, 17.0, 24.0, 30.0, 47.0, 52.0, 63.0, 97.0, 105.0, 93.0, 78.0, 70.0, 53.0, 46.0, 47.0, 25.0, 20.0, 19.0, 12.0, 8.0, 6.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.1360340118408203, -0.13193130493164062, -0.12782859802246094, -0.12372589111328125, -0.11962318420410156, -0.11552047729492188, -0.11141777038574219, -0.1073150634765625, -0.10321235656738281, -0.09910964965820312, -0.09500694274902344, -0.09090423583984375, -0.08680152893066406, -0.08269882202148438, -0.07859611511230469, -0.074493408203125, -0.07039070129394531, -0.06628799438476562, -0.06218528747558594, -0.05808258056640625, -0.05397987365722656, -0.049877166748046875, -0.04577445983886719, -0.0416717529296875, -0.03756904602050781, -0.033466339111328125, -0.029363632202148438, -0.02526092529296875, -0.021158218383789062, -0.017055511474609375, -0.012952804565429688, -0.00885009765625, -0.0047473907470703125, -0.000644683837890625, 0.0034580230712890625, 0.00756072998046875, 0.011663436889648438, 0.015766143798828125, 0.019868850708007812, 0.0239715576171875, 0.028074264526367188, 0.032176971435546875, 0.03627967834472656, 0.04038238525390625, 0.04448509216308594, 0.048587799072265625, 0.05269050598144531, 0.056793212890625, 0.06089591979980469, 0.06499862670898438, 0.06910133361816406, 0.07320404052734375, 0.07730674743652344, 0.08140945434570312, 0.08551216125488281, 0.0896148681640625, 0.09371757507324219, 0.09782028198242188, 0.10192298889160156, 0.10602569580078125, 0.11012840270996094, 0.11423110961914062, 0.11833381652832031, 0.1224365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 41.0, 164.0, 335.0, 262.0, 123.0, 29.0, 17.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.136778831481934, -3.963371753692627, -3.7899646759033203, -3.6165573596954346, -3.443150281906128, -3.2697432041168213, -3.0963358879089355, -2.922928810119629, -2.7495217323303223, -2.5761146545410156, -2.402707576751709, -2.2293002605438232, -2.0558931827545166, -1.88248610496521, -1.7090789079666138, -1.5356717109680176, -1.362264633178711, -1.1888575553894043, -1.015450358390808, -0.8420432209968567, -0.6686360836029053, -0.49522894620895386, -0.32182180881500244, -0.14841461181640625, 0.02499246597290039, 0.1983996033668518, 0.3718067407608032, 0.5452138781547546, 0.718621015548706, 0.8920281529426575, 1.0654352903366089, 1.238842487335205, 1.4122495651245117, 1.5856566429138184, 1.7590638399124146, 1.9324710369110107, 2.1058781147003174, 2.279285192489624, 2.4526925086975098, 2.6260995864868164, 2.799506664276123, 2.9729137420654297, 3.1463208198547363, 3.319728136062622, 3.4931352138519287, 3.6665422916412354, 3.839949607849121, 4.013356685638428, 4.186763763427734, 4.360170841217041, 4.533577919006348, 4.706984996795654, 4.880392074584961, 5.053799629211426, 5.227206707000732, 5.400613784790039, 5.574020862579346, 5.747427940368652, 5.920835018157959, 6.094242095947266, 6.2676496505737305, 6.441056728363037, 6.614463806152344, 6.78787088394165, 6.961277961730957]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 17.0, 21.0, 21.0, 39.0, 48.0, 51.0, 65.0, 70.0, 81.0, 104.0, 113.0, 89.0, 61.0, 60.0, 44.0, 35.0, 44.0, 15.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6194236278533936, -3.528352737426758, -3.437281608581543, -3.3462107181549072, -3.2551395893096924, -3.1640686988830566, -3.072997570037842, -2.981926679611206, -2.8908557891845703, -2.7997848987579346, -2.7087137699127197, -2.617642879486084, -2.526571750640869, -2.4355008602142334, -2.3444299697875977, -2.253358840942383, -2.162287712097168, -2.0712168216705322, -1.9801456928253174, -1.8890748023986816, -1.7980036735534668, -1.706932783126831, -1.6158617734909058, -1.5247907638549805, -1.4337197542190552, -1.3426487445831299, -1.2515777349472046, -1.1605067253112793, -1.0694358348846436, -0.9783647656440735, -0.887293815612793, -0.7962228059768677, -0.7051515579223633, -0.614080548286438, -0.5230095386505127, -0.4319385886192322, -0.3408675789833069, -0.2497965693473816, -0.15872561931610107, -0.06765460968017578, 0.02341639995574951, 0.11448739469051361, 0.2055583894252777, 0.2966293692588806, 0.3877003788948059, 0.4787713885307312, 0.5698423385620117, 0.660913348197937, 0.7519843578338623, 0.8430553674697876, 0.9341263771057129, 1.0251972675323486, 1.1162683963775635, 1.2073392868041992, 1.2984102964401245, 1.3894813060760498, 1.480552315711975, 1.5716233253479004, 1.6626943349838257, 1.753765344619751, 1.8448362350463867, 1.9359073638916016, 2.0269782543182373, 2.118049144744873, 2.209120273590088]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 9.0, 6.0, 8.0, 9.0, 16.0, 25.0, 29.0, 31.0, 36.0, 62.0, 98.0, 138.0, 339.0, 1109.0, 9359.0, 325397.0, 3809270.0, 43986.0, 3117.0, 575.0, 220.0, 124.0, 77.0, 59.0, 27.0, 33.0, 24.0, 20.0, 16.0, 10.0, 16.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.611328125, -0.5953521728515625, -0.579376220703125, -0.5634002685546875, -0.54742431640625, -0.5314483642578125, -0.515472412109375, -0.4994964599609375, -0.4835205078125, -0.4675445556640625, -0.451568603515625, -0.4355926513671875, -0.41961669921875, -0.4036407470703125, -0.387664794921875, -0.3716888427734375, -0.355712890625, -0.3397369384765625, -0.323760986328125, -0.3077850341796875, -0.29180908203125, -0.2758331298828125, -0.259857177734375, -0.2438812255859375, -0.2279052734375, -0.2119293212890625, -0.195953369140625, -0.1799774169921875, -0.16400146484375, -0.1480255126953125, -0.132049560546875, -0.1160736083984375, -0.10009765625, -0.0841217041015625, -0.068145751953125, -0.0521697998046875, -0.03619384765625, -0.0202178955078125, -0.004241943359375, 0.0117340087890625, 0.0277099609375, 0.0436859130859375, 0.059661865234375, 0.0756378173828125, 0.09161376953125, 0.1075897216796875, 0.123565673828125, 0.1395416259765625, 0.155517578125, 0.1714935302734375, 0.187469482421875, 0.2034454345703125, 0.21942138671875, 0.2353973388671875, 0.251373291015625, 0.2673492431640625, 0.2833251953125, 0.2993011474609375, 0.315277099609375, 0.3312530517578125, 0.34722900390625, 0.3632049560546875, 0.379180908203125, 0.3951568603515625, 0.4111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 9.0, 21.0, 29.0, 36.0, 49.0, 57.0, 80.0, 79.0, 73.0, 89.0, 81.0, 67.0, 74.0, 74.0, 50.0, 35.0, 32.0, 27.0, 13.0, 4.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1337890625, -0.129425048828125, -0.12506103515625, -0.120697021484375, -0.1163330078125, -0.111968994140625, -0.10760498046875, -0.103240966796875, -0.098876953125, -0.094512939453125, -0.09014892578125, -0.085784912109375, -0.0814208984375, -0.077056884765625, -0.07269287109375, -0.068328857421875, -0.06396484375, -0.059600830078125, -0.05523681640625, -0.050872802734375, -0.0465087890625, -0.042144775390625, -0.03778076171875, -0.033416748046875, -0.029052734375, -0.024688720703125, -0.02032470703125, -0.015960693359375, -0.0115966796875, -0.007232666015625, -0.00286865234375, 0.001495361328125, 0.005859375, 0.010223388671875, 0.01458740234375, 0.018951416015625, 0.0233154296875, 0.027679443359375, 0.03204345703125, 0.036407470703125, 0.040771484375, 0.045135498046875, 0.04949951171875, 0.053863525390625, 0.0582275390625, 0.062591552734375, 0.06695556640625, 0.071319580078125, 0.07568359375, 0.080047607421875, 0.08441162109375, 0.088775634765625, 0.0931396484375, 0.097503662109375, 0.10186767578125, 0.106231689453125, 0.110595703125, 0.114959716796875, 0.11932373046875, 0.123687744140625, 0.1280517578125, 0.132415771484375, 0.13677978515625, 0.141143798828125, 0.1455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 13.0, 16.0, 37.0, 43.0, 66.0, 112.0, 167.0, 278.0, 505.0, 931.0, 1610.0, 3202.0, 6636.0, 15095.0, 36881.0, 108313.0, 494897.0, 2557393.0, 746880.0, 141752.0, 45020.0, 18327.0, 8134.0, 3726.0, 1904.0, 998.0, 557.0, 273.0, 186.0, 100.0, 82.0, 49.0, 30.0, 16.0, 9.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16317176818847656, -0.15800857543945312, -0.1528453826904297, -0.14768218994140625, -0.1425189971923828, -0.13735580444335938, -0.13219261169433594, -0.1270294189453125, -0.12186622619628906, -0.11670303344726562, -0.11153984069824219, -0.10637664794921875, -0.10121345520019531, -0.09605026245117188, -0.09088706970214844, -0.085723876953125, -0.08056068420410156, -0.07539749145507812, -0.07023429870605469, -0.06507110595703125, -0.05990791320800781, -0.054744720458984375, -0.04958152770996094, -0.0444183349609375, -0.03925514221191406, -0.034091949462890625, -0.028928756713867188, -0.02376556396484375, -0.018602371215820312, -0.013439178466796875, -0.008275985717773438, -0.00311279296875, 0.0020503997802734375, 0.007213592529296875, 0.012376785278320312, 0.01753997802734375, 0.022703170776367188, 0.027866363525390625, 0.03302955627441406, 0.0381927490234375, 0.04335594177246094, 0.048519134521484375, 0.05368232727050781, 0.05884552001953125, 0.06400871276855469, 0.06917190551757812, 0.07433509826660156, 0.079498291015625, 0.08466148376464844, 0.08982467651367188, 0.09498786926269531, 0.10015106201171875, 0.10531425476074219, 0.11047744750976562, 0.11564064025878906, 0.1208038330078125, 0.12596702575683594, 0.13113021850585938, 0.1362934112548828, 0.14145660400390625, 0.1466197967529297, 0.15178298950195312, 0.15694618225097656, 0.162109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 17.0, 30.0, 41.0, 44.0, 62.0, 90.0, 147.0, 281.0, 464.0, 830.0, 806.0, 434.0, 291.0, 167.0, 97.0, 86.0, 34.0, 22.0, 27.0, 18.0, 8.0, 13.0, 6.0, 12.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.3057117462158203, -0.2972145080566406, -0.28871726989746094, -0.28022003173828125, -0.27172279357910156, -0.2632255554199219, -0.2547283172607422, -0.2462310791015625, -0.2377338409423828, -0.22923660278320312, -0.22073936462402344, -0.21224212646484375, -0.20374488830566406, -0.19524765014648438, -0.1867504119873047, -0.178253173828125, -0.1697559356689453, -0.16125869750976562, -0.15276145935058594, -0.14426422119140625, -0.13576698303222656, -0.12726974487304688, -0.11877250671386719, -0.1102752685546875, -0.10177803039550781, -0.09328079223632812, -0.08478355407714844, -0.07628631591796875, -0.06778907775878906, -0.059291839599609375, -0.05079460144042969, -0.04229736328125, -0.03380012512207031, -0.025302886962890625, -0.016805648803710938, -0.00830841064453125, 0.0001888275146484375, 0.008686065673828125, 0.017183303833007812, 0.0256805419921875, 0.03417778015136719, 0.042675018310546875, 0.05117225646972656, 0.05966949462890625, 0.06816673278808594, 0.07666397094726562, 0.08516120910644531, 0.093658447265625, 0.10215568542480469, 0.11065292358398438, 0.11915016174316406, 0.12764739990234375, 0.13614463806152344, 0.14464187622070312, 0.1531391143798828, 0.1616363525390625, 0.1701335906982422, 0.17863082885742188, 0.18712806701660156, 0.19562530517578125, 0.20412254333496094, 0.21261978149414062, 0.2211170196533203, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 7.0, 17.0, 51.0, 117.0, 229.0, 268.0, 168.0, 66.0, 37.0, 12.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4222029447555542, -1.3133485317230225, -1.2044942378997803, -1.0956398248672485, -0.9867854118347168, -0.8779309988021851, -0.7690766453742981, -0.6602222919464111, -0.5513678789138794, -0.44251349568367004, -0.3336591124534607, -0.22480472922325134, -0.11595034599304199, -0.007095932960510254, 0.10175842046737671, 0.21061277389526367, 0.3194671869277954, 0.42832157015800476, 0.5371759533882141, 0.6460303068161011, 0.7548847198486328, 0.8637391328811646, 0.9725934863090515, 1.0814478397369385, 1.1903022527694702, 1.299156665802002, 1.4080109596252441, 1.5168653726577759, 1.6257197856903076, 1.7345741987228394, 1.843428611755371, 1.9522829055786133, 2.0611371994018555, 2.1699914932250977, 2.278846025466919, 2.387700319290161, 2.4965548515319824, 2.6054091453552246, 2.714263439178467, 2.823117733001709, 2.9319722652435303, 3.0408265590667725, 3.1496810913085938, 3.258535385131836, 3.367389678955078, 3.4762442111968994, 3.5850985050201416, 3.693953037261963, 3.802807331085205, 3.9116616249084473, 4.0205159187316895, 4.12937068939209, 4.238224983215332, 4.347079277038574, 4.455933570861816, 4.564787864685059, 4.673642158508301, 4.782496452331543, 4.891350746154785, 5.0002055168151855, 5.109059810638428, 5.21791410446167, 5.326768398284912, 5.435622692108154, 5.544477462768555]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 13.0, 28.0, 26.0, 23.0, 42.0, 42.0, 35.0, 37.0, 45.0, 62.0, 42.0, 53.0, 54.0, 59.0, 52.0, 45.0, 45.0, 34.0, 38.0, 31.0, 35.0, 21.0, 24.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9469990730285645, -0.9092732667922974, -0.8715474009513855, -0.8338215351104736, -0.7960957288742065, -0.7583699226379395, -0.7206440567970276, -0.6829181909561157, -0.6451923847198486, -0.6074665784835815, -0.5697407126426697, -0.5320148468017578, -0.4942890405654907, -0.45656320452690125, -0.41883736848831177, -0.3811115324497223, -0.3433856964111328, -0.30565986037254333, -0.26793402433395386, -0.23020818829536438, -0.1924823522567749, -0.15475651621818542, -0.11703068017959595, -0.07930484414100647, -0.04157900810241699, -0.0038531720638275146, 0.03387266397476196, 0.07159850001335144, 0.10932433605194092, 0.1470501720905304, 0.18477600812911987, 0.22250184416770935, 0.2602275609970093, 0.29795339703559875, 0.33567923307418823, 0.3734050691127777, 0.4111309051513672, 0.44885674118995667, 0.48658257722854614, 0.524308443069458, 0.5620342493057251, 0.5997600555419922, 0.637485921382904, 0.6752117872238159, 0.712937593460083, 0.7506633996963501, 0.788389265537262, 0.8261151313781738, 0.8638409376144409, 0.901566743850708, 0.9392926096916199, 0.9770184755325317, 1.0147442817687988, 1.052470088005066, 1.090195894241333, 1.1279218196868896, 1.1656476259231567, 1.2033734321594238, 1.2410993576049805, 1.2788251638412476, 1.3165509700775146, 1.3542767763137817, 1.3920025825500488, 1.4297285079956055, 1.4674543142318726]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 13.0, 20.0, 28.0, 26.0, 49.0, 72.0, 112.0, 144.0, 193.0, 253.0, 397.0, 576.0, 800.0, 1336.0, 2035.0, 3374.0, 5562.0, 9557.0, 17194.0, 33672.0, 77692.0, 219479.0, 377279.0, 170936.0, 62596.0, 28404.0, 14864.0, 8407.0, 4967.0, 2925.0, 1857.0, 1155.0, 805.0, 572.0, 325.0, 244.0, 176.0, 123.0, 99.0, 70.0, 42.0, 28.0, 23.0, 23.0, 12.0, 9.0, 7.0, 1.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.14599609375, -0.1413440704345703, -0.13669204711914062, -0.13204002380371094, -0.12738800048828125, -0.12273597717285156, -0.11808395385742188, -0.11343193054199219, -0.1087799072265625, -0.10412788391113281, -0.09947586059570312, -0.09482383728027344, -0.09017181396484375, -0.08551979064941406, -0.08086776733398438, -0.07621574401855469, -0.071563720703125, -0.06691169738769531, -0.062259674072265625, -0.05760765075683594, -0.05295562744140625, -0.04830360412597656, -0.043651580810546875, -0.03899955749511719, -0.0343475341796875, -0.029695510864257812, -0.025043487548828125, -0.020391464233398438, -0.01573944091796875, -0.011087417602539062, -0.006435394287109375, -0.0017833709716796875, 0.00286865234375, 0.0075206756591796875, 0.012172698974609375, 0.016824722290039062, 0.02147674560546875, 0.026128768920898438, 0.030780792236328125, 0.03543281555175781, 0.0400848388671875, 0.04473686218261719, 0.049388885498046875, 0.05404090881347656, 0.05869293212890625, 0.06334495544433594, 0.06799697875976562, 0.07264900207519531, 0.077301025390625, 0.08195304870605469, 0.08660507202148438, 0.09125709533691406, 0.09590911865234375, 0.10056114196777344, 0.10521316528320312, 0.10986518859863281, 0.1145172119140625, 0.11916923522949219, 0.12382125854492188, 0.12847328186035156, 0.13312530517578125, 0.13777732849121094, 0.14242935180664062, 0.1470813751220703, 0.1517333984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 10.0, 9.0, 14.0, 5.0, 6.0, 23.0, 22.0, 21.0, 31.0, 20.0, 27.0, 34.0, 42.0, 28.0, 38.0, 33.0, 43.0, 48.0, 33.0, 44.0, 39.0, 39.0, 33.0, 42.0, 42.0, 41.0, 22.0, 31.0, 32.0, 19.0, 18.0, 16.0, 24.0, 13.0, 9.0, 9.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07855224609375, -0.07616043090820312, -0.07376861572265625, -0.07137680053710938, -0.0689849853515625, -0.06659317016601562, -0.06420135498046875, -0.061809539794921875, -0.059417724609375, -0.057025909423828125, -0.05463409423828125, -0.052242279052734375, -0.0498504638671875, -0.047458648681640625, -0.04506683349609375, -0.042675018310546875, -0.040283203125, -0.037891387939453125, -0.03549957275390625, -0.033107757568359375, -0.0307159423828125, -0.028324127197265625, -0.02593231201171875, -0.023540496826171875, -0.021148681640625, -0.018756866455078125, -0.01636505126953125, -0.013973236083984375, -0.0115814208984375, -0.009189605712890625, -0.00679779052734375, -0.004405975341796875, -0.00201416015625, 0.000377655029296875, 0.00276947021484375, 0.005161285400390625, 0.0075531005859375, 0.009944915771484375, 0.01233673095703125, 0.014728546142578125, 0.017120361328125, 0.019512176513671875, 0.02190399169921875, 0.024295806884765625, 0.0266876220703125, 0.029079437255859375, 0.03147125244140625, 0.033863067626953125, 0.0362548828125, 0.038646697998046875, 0.04103851318359375, 0.043430328369140625, 0.0458221435546875, 0.048213958740234375, 0.05060577392578125, 0.052997589111328125, 0.055389404296875, 0.057781219482421875, 0.06017303466796875, 0.06256484985351562, 0.0649566650390625, 0.06734848022460938, 0.06974029541015625, 0.07213211059570312, 0.07452392578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 12.0, 17.0, 24.0, 39.0, 75.0, 84.0, 183.0, 268.0, 582.0, 1233.0, 3071.0, 10459.0, 54765.0, 738060.0, 206203.0, 23930.0, 5775.0, 1953.0, 790.0, 425.0, 197.0, 127.0, 84.0, 55.0, 40.0, 20.0, 16.0, 18.0, 8.0, 12.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2634391784667969, -0.25075531005859375, -0.23807144165039062, -0.2253875732421875, -0.21270370483398438, -0.20001983642578125, -0.18733596801757812, -0.174652099609375, -0.16196823120117188, -0.14928436279296875, -0.13660049438476562, -0.1239166259765625, -0.11123275756835938, -0.09854888916015625, -0.08586502075195312, -0.07318115234375, -0.060497283935546875, -0.04781341552734375, -0.035129547119140625, -0.0224456787109375, -0.009761810302734375, 0.00292205810546875, 0.015605926513671875, 0.028289794921875, 0.040973663330078125, 0.05365753173828125, 0.06634140014648438, 0.0790252685546875, 0.09170913696289062, 0.10439300537109375, 0.11707687377929688, 0.1297607421875, 0.14244461059570312, 0.15512847900390625, 0.16781234741210938, 0.1804962158203125, 0.19318008422851562, 0.20586395263671875, 0.21854782104492188, 0.231231689453125, 0.24391555786132812, 0.25659942626953125, 0.2692832946777344, 0.2819671630859375, 0.2946510314941406, 0.30733489990234375, 0.3200187683105469, 0.33270263671875, 0.3453865051269531, 0.35807037353515625, 0.3707542419433594, 0.3834381103515625, 0.3961219787597656, 0.40880584716796875, 0.4214897155761719, 0.434173583984375, 0.4468574523925781, 0.45954132080078125, 0.4722251892089844, 0.4849090576171875, 0.4975929260253906, 0.5102767944335938, 0.5229606628417969, 0.53564453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 6.0, 9.0, 15.0, 18.0, 36.0, 54.0, 66.0, 82.0, 99.0, 88.0, 90.0, 98.0, 97.0, 59.0, 53.0, 37.0, 33.0, 19.0, 12.0, 6.0, 9.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67626953125, -0.6538238525390625, -0.631378173828125, -0.6089324951171875, -0.58648681640625, -0.5640411376953125, -0.541595458984375, -0.5191497802734375, -0.4967041015625, -0.4742584228515625, -0.451812744140625, -0.4293670654296875, -0.40692138671875, -0.3844757080078125, -0.362030029296875, -0.3395843505859375, -0.317138671875, -0.2946929931640625, -0.272247314453125, -0.2498016357421875, -0.22735595703125, -0.2049102783203125, -0.182464599609375, -0.1600189208984375, -0.1375732421875, -0.1151275634765625, -0.092681884765625, -0.0702362060546875, -0.04779052734375, -0.0253448486328125, -0.002899169921875, 0.0195465087890625, 0.0419921875, 0.0644378662109375, 0.086883544921875, 0.1093292236328125, 0.13177490234375, 0.1542205810546875, 0.176666259765625, 0.1991119384765625, 0.2215576171875, 0.2440032958984375, 0.266448974609375, 0.2888946533203125, 0.31134033203125, 0.3337860107421875, 0.356231689453125, 0.3786773681640625, 0.401123046875, 0.4235687255859375, 0.446014404296875, 0.4684600830078125, 0.49090576171875, 0.5133514404296875, 0.535797119140625, 0.5582427978515625, 0.5806884765625, 0.6031341552734375, 0.625579833984375, 0.6480255126953125, 0.67047119140625, 0.6929168701171875, 0.715362548828125, 0.7378082275390625, 0.76025390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 33.0, 59.0, 185.0, 851.0, 7793.0, 598194.0, 433227.0, 7016.0, 828.0, 205.0, 66.0, 33.0, 16.0, 9.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59765625, -0.5843696594238281, -0.5710830688476562, -0.5577964782714844, -0.5445098876953125, -0.5312232971191406, -0.5179367065429688, -0.5046501159667969, -0.491363525390625, -0.4780769348144531, -0.46479034423828125, -0.4515037536621094, -0.4382171630859375, -0.4249305725097656, -0.41164398193359375, -0.3983573913574219, -0.38507080078125, -0.3717842102050781, -0.35849761962890625, -0.3452110290527344, -0.3319244384765625, -0.3186378479003906, -0.30535125732421875, -0.2920646667480469, -0.278778076171875, -0.2654914855957031, -0.25220489501953125, -0.23891830444335938, -0.2256317138671875, -0.21234512329101562, -0.19905853271484375, -0.18577194213867188, -0.1724853515625, -0.15919876098632812, -0.14591217041015625, -0.13262557983398438, -0.1193389892578125, -0.10605239868164062, -0.09276580810546875, -0.07947921752929688, -0.066192626953125, -0.052906036376953125, -0.03961944580078125, -0.026332855224609375, -0.0130462646484375, 0.000240325927734375, 0.01352691650390625, 0.026813507080078125, 0.04010009765625, 0.053386688232421875, 0.06667327880859375, 0.07995986938476562, 0.0932464599609375, 0.10653305053710938, 0.11981964111328125, 0.13310623168945312, 0.146392822265625, 0.15967941284179688, 0.17296600341796875, 0.18625259399414062, 0.1995391845703125, 0.21282577514648438, 0.22611236572265625, 0.23939895629882812, 0.252685546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 5.0, 12.0, 12.0, 14.0, 26.0, 26.0, 53.0, 56.0, 68.0, 86.0, 80.0, 111.0, 83.0, 78.0, 57.0, 53.0, 46.0, 26.0, 20.0, 16.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3752603232860565e-05, -4.2265281081199646e-05, -4.077795892953873e-05, -3.929063677787781e-05, -3.780331462621689e-05, -3.631599247455597e-05, -3.482867032289505e-05, -3.334134817123413e-05, -3.185402601957321e-05, -3.0366703867912292e-05, -2.8879381716251373e-05, -2.7392059564590454e-05, -2.5904737412929535e-05, -2.4417415261268616e-05, -2.2930093109607697e-05, -2.1442770957946777e-05, -1.9955448806285858e-05, -1.846812665462494e-05, -1.698080450296402e-05, -1.54934823513031e-05, -1.4006160199642181e-05, -1.2518838047981262e-05, -1.1031515896320343e-05, -9.544193744659424e-06, -8.056871592998505e-06, -6.5695494413375854e-06, -5.082227289676666e-06, -3.594905138015747e-06, -2.107582986354828e-06, -6.202608346939087e-07, 8.670613169670105e-07, 2.3543834686279297e-06, 3.841705620288849e-06, 5.329027771949768e-06, 6.816349923610687e-06, 8.303672075271606e-06, 9.790994226932526e-06, 1.1278316378593445e-05, 1.2765638530254364e-05, 1.4252960681915283e-05, 1.5740282833576202e-05, 1.722760498523712e-05, 1.871492713689804e-05, 2.020224928855896e-05, 2.168957144021988e-05, 2.31768935918808e-05, 2.4664215743541718e-05, 2.6151537895202637e-05, 2.7638860046863556e-05, 2.9126182198524475e-05, 3.0613504350185394e-05, 3.2100826501846313e-05, 3.358814865350723e-05, 3.507547080516815e-05, 3.656279295682907e-05, 3.805011510848999e-05, 3.953743726015091e-05, 4.102475941181183e-05, 4.251208156347275e-05, 4.399940371513367e-05, 4.5486725866794586e-05, 4.6974048018455505e-05, 4.8461370170116425e-05, 4.9948692321777344e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 15.0, 24.0, 38.0, 74.0, 151.0, 397.0, 1116.0, 4217.0, 32495.0, 750465.0, 242114.0, 13730.0, 2386.0, 768.0, 269.0, 115.0, 77.0, 39.0, 20.0, 7.0, 6.0, 6.0, 0.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.320068359375, -0.3122272491455078, -0.3043861389160156, -0.29654502868652344, -0.28870391845703125, -0.28086280822753906, -0.2730216979980469, -0.2651805877685547, -0.2573394775390625, -0.2494983673095703, -0.24165725708007812, -0.23381614685058594, -0.22597503662109375, -0.21813392639160156, -0.21029281616210938, -0.2024517059326172, -0.194610595703125, -0.1867694854736328, -0.17892837524414062, -0.17108726501464844, -0.16324615478515625, -0.15540504455566406, -0.14756393432617188, -0.1397228240966797, -0.1318817138671875, -0.12404060363769531, -0.11619949340820312, -0.10835838317871094, -0.10051727294921875, -0.09267616271972656, -0.08483505249023438, -0.07699394226074219, -0.06915283203125, -0.06131172180175781, -0.053470611572265625, -0.04562950134277344, -0.03778839111328125, -0.029947280883789062, -0.022106170654296875, -0.014265060424804688, -0.0064239501953125, 0.0014171600341796875, 0.009258270263671875, 0.017099380493164062, 0.02494049072265625, 0.03278160095214844, 0.040622711181640625, 0.04846382141113281, 0.056304931640625, 0.06414604187011719, 0.07198715209960938, 0.07982826232910156, 0.08766937255859375, 0.09551048278808594, 0.10335159301757812, 0.11119270324707031, 0.1190338134765625, 0.1268749237060547, 0.13471603393554688, 0.14255714416503906, 0.15039825439453125, 0.15823936462402344, 0.16608047485351562, 0.1739215850830078, 0.1817626953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 11.0, 19.0, 32.0, 44.0, 49.0, 98.0, 158.0, 165.0, 144.0, 104.0, 69.0, 51.0, 20.0, 15.0, 11.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.364990234375, -0.35746288299560547, -0.34993553161621094, -0.3424081802368164, -0.3348808288574219, -0.32735347747802734, -0.3198261260986328, -0.3122987747192383, -0.30477142333984375, -0.2972440719604492, -0.2897167205810547, -0.28218936920166016, -0.2746620178222656, -0.2671346664428711, -0.25960731506347656, -0.25207996368408203, -0.2445526123046875, -0.23702526092529297, -0.22949790954589844, -0.2219705581665039, -0.21444320678710938, -0.20691585540771484, -0.1993885040283203, -0.19186115264892578, -0.18433380126953125, -0.17680644989013672, -0.1692790985107422, -0.16175174713134766, -0.15422439575195312, -0.1466970443725586, -0.13916969299316406, -0.13164234161376953, -0.124114990234375, -0.11658763885498047, -0.10906028747558594, -0.1015329360961914, -0.09400558471679688, -0.08647823333740234, -0.07895088195800781, -0.07142353057861328, -0.06389617919921875, -0.05636882781982422, -0.04884147644042969, -0.041314125061035156, -0.033786773681640625, -0.026259422302246094, -0.018732070922851562, -0.011204719543457031, -0.0036773681640625, 0.0038499832153320312, 0.011377334594726562, 0.018904685974121094, 0.026432037353515625, 0.033959388732910156, 0.04148674011230469, 0.04901409149169922, 0.05654144287109375, 0.06406879425048828, 0.07159614562988281, 0.07912349700927734, 0.08665084838867188, 0.0941781997680664, 0.10170555114746094, 0.10923290252685547, 0.11676025390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 13.0, 35.0, 93.0, 210.0, 304.0, 192.0, 92.0, 27.0, 8.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023674011230469, -3.8949646949768066, -3.7662553787231445, -3.6375458240509033, -3.508836507797241, -3.380127191543579, -3.251417636871338, -3.122708320617676, -2.9939990043640137, -2.8652896881103516, -2.7365803718566895, -2.6078708171844482, -2.479161500930786, -2.350452184677124, -2.221742630004883, -2.0930333137512207, -1.9643239974975586, -1.8356146812438965, -1.7069052457809448, -1.5781958103179932, -1.449486494064331, -1.320777177810669, -1.1920677423477173, -1.0633583068847656, -0.9346489906311035, -0.8059396147727966, -0.6772302389144897, -0.5485208630561829, -0.419811487197876, -0.2911021113395691, -0.1623927354812622, -0.03368335962295532, 0.09502649307250977, 0.22373586893081665, 0.35244524478912354, 0.4811546206474304, 0.6098639965057373, 0.7385733723640442, 0.8672827482223511, 0.995992124080658, 1.1247014999389648, 1.253410816192627, 1.3821202516555786, 1.5108296871185303, 1.6395390033721924, 1.7682483196258545, 1.8969577550888062, 2.025667190551758, 2.15437650680542, 2.283085823059082, 2.411795139312744, 2.5405046939849854, 2.6692140102386475, 2.7979233264923096, 2.926632881164551, 3.055342197418213, 3.184051513671875, 3.312760829925537, 3.441470146179199, 3.5701797008514404, 3.6988890171051025, 3.8275983333587646, 3.956307888031006, 4.085017204284668, 4.21372652053833]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 15.0, 11.0, 17.0, 41.0, 50.0, 63.0, 72.0, 99.0, 130.0, 131.0, 83.0, 73.0, 61.0, 55.0, 47.0, 23.0, 16.0, 10.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6359992027282715, -4.5257887840271, -4.415578365325928, -4.305367946624756, -4.195158004760742, -4.08494758605957, -3.9747371673583984, -3.8645267486572266, -3.7543163299560547, -3.644105911254883, -3.53389573097229, -3.423685312271118, -3.3134748935699463, -3.2032647132873535, -3.0930542945861816, -2.9828438758850098, -2.872633457183838, -2.762423038482666, -2.6522128582000732, -2.5420024394989014, -2.4317920207977295, -2.3215818405151367, -2.211371421813965, -2.101161003112793, -1.9909508228302002, -1.8807405233383179, -1.770530104637146, -1.6603198051452637, -1.5501093864440918, -1.4398990869522095, -1.3296887874603271, -1.2194783687591553, -1.1092679500579834, -0.9990575909614563, -0.8888472318649292, -0.7786369323730469, -0.668426513671875, -0.5582162141799927, -0.4480058550834656, -0.3377954959869385, -0.22758513689041138, -0.11737478524446487, -0.007164433598518372, 0.10304591059684753, 0.21325626969337463, 0.32346659898757935, 0.43367695808410645, 0.5438873171806335, 0.6540976762771606, 0.7643080353736877, 0.8745183944702148, 0.9847286939620972, 1.094939112663269, 1.2051494121551514, 1.3153598308563232, 1.4255701303482056, 1.535780429840088, 1.6459907293319702, 1.756201148033142, 1.8664114475250244, 1.9766218662261963, 2.086832046508789, 2.197042465209961, 2.307252883911133, 2.4174633026123047]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 2.0, 11.0, 8.0, 6.0, 6.0, 11.0, 11.0, 24.0, 33.0, 24.0, 58.0, 113.0, 190.0, 431.0, 1113.0, 3272.0, 11563.0, 51879.0, 378248.0, 2759825.0, 863088.0, 96486.0, 19437.0, 5417.0, 1812.0, 672.0, 307.0, 123.0, 57.0, 19.0, 12.0, 6.0, 3.0, 2.0], "bins": [-0.32177734375, -0.31529903411865234, -0.3088207244873047, -0.30234241485595703, -0.2958641052246094, -0.2893857955932617, -0.28290748596191406, -0.2764291763305664, -0.26995086669921875, -0.2634725570678711, -0.25699424743652344, -0.2505159378051758, -0.24403762817382812, -0.23755931854248047, -0.2310810089111328, -0.22460269927978516, -0.2181243896484375, -0.21164608001708984, -0.2051677703857422, -0.19868946075439453, -0.19221115112304688, -0.18573284149169922, -0.17925453186035156, -0.1727762222290039, -0.16629791259765625, -0.1598196029663086, -0.15334129333496094, -0.14686298370361328, -0.14038467407226562, -0.13390636444091797, -0.1274280548095703, -0.12094974517822266, -0.114471435546875, -0.10799312591552734, -0.10151481628417969, -0.09503650665283203, -0.08855819702148438, -0.08207988739013672, -0.07560157775878906, -0.0691232681274414, -0.06264495849609375, -0.056166648864746094, -0.04968833923339844, -0.04321002960205078, -0.036731719970703125, -0.03025341033935547, -0.023775100708007812, -0.017296791076660156, -0.0108184814453125, -0.004340171813964844, 0.0021381378173828125, 0.008616447448730469, 0.015094757080078125, 0.02157306671142578, 0.028051376342773438, 0.034529685974121094, 0.04100799560546875, 0.047486305236816406, 0.05396461486816406, 0.06044292449951172, 0.06692123413085938, 0.07339954376220703, 0.07987785339355469, 0.08635616302490234, 0.09283447265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 11.0, 18.0, 40.0, 69.0, 108.0, 153.0, 153.0, 142.0, 118.0, 101.0, 47.0, 38.0, 9.0, 5.0, 3.0], "bins": [-0.47119140625, -0.46272754669189453, -0.45426368713378906, -0.4457998275756836, -0.4373359680175781, -0.42887210845947266, -0.4204082489013672, -0.4119443893432617, -0.40348052978515625, -0.3950166702270508, -0.3865528106689453, -0.37808895111083984, -0.3696250915527344, -0.3611612319946289, -0.35269737243652344, -0.34423351287841797, -0.3357696533203125, -0.32730579376220703, -0.31884193420410156, -0.3103780746459961, -0.3019142150878906, -0.29345035552978516, -0.2849864959716797, -0.2765226364135742, -0.26805877685546875, -0.2595949172973633, -0.2511310577392578, -0.24266719818115234, -0.23420333862304688, -0.2257394790649414, -0.21727561950683594, -0.20881175994873047, -0.200347900390625, -0.19188404083251953, -0.18342018127441406, -0.1749563217163086, -0.16649246215820312, -0.15802860260009766, -0.1495647430419922, -0.14110088348388672, -0.13263702392578125, -0.12417316436767578, -0.11570930480957031, -0.10724544525146484, -0.09878158569335938, -0.0903177261352539, -0.08185386657714844, -0.07339000701904297, -0.0649261474609375, -0.05646228790283203, -0.04799842834472656, -0.039534568786621094, -0.031070709228515625, -0.022606849670410156, -0.014142990112304688, -0.005679130554199219, 0.00278472900390625, 0.011248588562011719, 0.019712448120117188, 0.028176307678222656, 0.036640167236328125, 0.045104026794433594, 0.05356788635253906, 0.06203174591064453, 0.07049560546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 17.0, 13.0, 24.0, 29.0, 43.0, 55.0, 96.0, 161.0, 235.0, 414.0, 766.0, 1653.0, 3659.0, 9039.0, 24612.0, 77224.0, 302937.0, 1847317.0, 1559236.0, 260281.0, 68791.0, 22217.0, 8402.0, 3320.0, 1601.0, 830.0, 469.0, 252.0, 173.0, 129.0, 80.0, 46.0, 45.0, 26.0, 26.0, 12.0, 6.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.19482421875, -0.18924903869628906, -0.18367385864257812, -0.1780986785888672, -0.17252349853515625, -0.1669483184814453, -0.16137313842773438, -0.15579795837402344, -0.1502227783203125, -0.14464759826660156, -0.13907241821289062, -0.1334972381591797, -0.12792205810546875, -0.12234687805175781, -0.11677169799804688, -0.11119651794433594, -0.105621337890625, -0.10004615783691406, -0.09447097778320312, -0.08889579772949219, -0.08332061767578125, -0.07774543762207031, -0.07217025756835938, -0.06659507751464844, -0.0610198974609375, -0.05544471740722656, -0.049869537353515625, -0.04429435729980469, -0.03871917724609375, -0.03314399719238281, -0.027568817138671875, -0.021993637084960938, -0.01641845703125, -0.010843276977539062, -0.005268096923828125, 0.0003070831298828125, 0.00588226318359375, 0.011457443237304688, 0.017032623291015625, 0.022607803344726562, 0.0281829833984375, 0.03375816345214844, 0.039333343505859375, 0.04490852355957031, 0.05048370361328125, 0.05605888366699219, 0.061634063720703125, 0.06720924377441406, 0.072784423828125, 0.07835960388183594, 0.08393478393554688, 0.08950996398925781, 0.09508514404296875, 0.10066032409667969, 0.10623550415039062, 0.11181068420410156, 0.1173858642578125, 0.12296104431152344, 0.12853622436523438, 0.1341114044189453, 0.13968658447265625, 0.1452617645263672, 0.15083694458007812, 0.15641212463378906, 0.1619873046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 19.0, 16.0, 26.0, 29.0, 43.0, 49.0, 70.0, 102.0, 135.0, 185.0, 298.0, 434.0, 505.0, 563.0, 476.0, 322.0, 198.0, 172.0, 98.0, 89.0, 55.0, 39.0, 35.0, 30.0, 18.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.22426414489746094, -0.21598434448242188, -0.2077045440673828, -0.19942474365234375, -0.1911449432373047, -0.18286514282226562, -0.17458534240722656, -0.1663055419921875, -0.15802574157714844, -0.14974594116210938, -0.1414661407470703, -0.13318634033203125, -0.12490653991699219, -0.11662673950195312, -0.10834693908691406, -0.100067138671875, -0.09178733825683594, -0.08350753784179688, -0.07522773742675781, -0.06694793701171875, -0.05866813659667969, -0.050388336181640625, -0.04210853576660156, -0.0338287353515625, -0.025548934936523438, -0.017269134521484375, -0.008989334106445312, -0.00070953369140625, 0.0075702667236328125, 0.015850067138671875, 0.024129867553710938, 0.03240966796875, 0.04068946838378906, 0.048969268798828125, 0.05724906921386719, 0.06552886962890625, 0.07380867004394531, 0.08208847045898438, 0.09036827087402344, 0.0986480712890625, 0.10692787170410156, 0.11520767211914062, 0.12348747253417969, 0.13176727294921875, 0.1400470733642578, 0.14832687377929688, 0.15660667419433594, 0.164886474609375, 0.17316627502441406, 0.18144607543945312, 0.1897258758544922, 0.19800567626953125, 0.2062854766845703, 0.21456527709960938, 0.22284507751464844, 0.2311248779296875, 0.23940467834472656, 0.24768447875976562, 0.2559642791748047, 0.26424407958984375, 0.2725238800048828, 0.2808036804199219, 0.28908348083496094, 0.29736328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 20.0, 40.0, 181.0, 302.0, 241.0, 120.0, 40.0, 21.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.394401788711548, -2.241150379180908, -2.0878992080688477, -1.934647798538208, -1.781396508216858, -1.6281452178955078, -1.4748938083648682, -1.321642518043518, -1.168391227722168, -1.0151399374008179, -0.861888587474823, -0.7086372375488281, -0.555385947227478, -0.40213465690612793, -0.24888330698013306, -0.09563195705413818, 0.057619333267211914, 0.2108706533908844, 0.3641219735145569, 0.5173733234405518, 0.6706246137619019, 0.823875904083252, 0.9771272540092468, 1.1303786039352417, 1.2836298942565918, 1.436881184577942, 1.590132474899292, 1.7433838844299316, 1.8966351747512817, 2.049886465072632, 2.2031378746032715, 2.356389045715332, 2.509640693664551, 2.6628921031951904, 2.816143274307251, 2.9693946838378906, 3.122645854949951, 3.275897264480591, 3.4291486740112305, 3.582399845123291, 3.7356512546539307, 3.8889026641845703, 4.042153835296631, 4.195405006408691, 4.34865665435791, 4.501907825469971, 4.655158996582031, 4.80841064453125, 4.9616618156433105, 5.114912986755371, 5.26816463470459, 5.42141580581665, 5.574666976928711, 5.72791862487793, 5.88116979598999, 6.034420967102051, 6.1876726150512695, 6.34092378616333, 6.494175434112549, 6.647426605224609, 6.80067777633667, 6.9539289474487305, 7.107180595397949, 7.26043176651001, 7.41368293762207]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 13.0, 10.0, 16.0, 27.0, 42.0, 53.0, 65.0, 73.0, 76.0, 98.0, 94.0, 97.0, 70.0, 64.0, 54.0, 48.0, 39.0, 20.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4143567085266113, -1.3306742906570435, -1.2469918727874756, -1.1633094549179077, -1.0796270370483398, -0.995944619178772, -0.9122622013092041, -0.8285797834396362, -0.7448973655700684, -0.6612149477005005, -0.5775325298309326, -0.49385011196136475, -0.4101676940917969, -0.326485276222229, -0.24280285835266113, -0.15912044048309326, -0.07543802261352539, 0.00824439525604248, 0.09192681312561035, 0.17560923099517822, 0.2592916488647461, 0.34297406673431396, 0.42665648460388184, 0.5103389024734497, 0.5940213203430176, 0.6777037382125854, 0.7613861560821533, 0.8450685739517212, 0.9287509918212891, 1.012433409690857, 1.0961158275604248, 1.1797982454299927, 1.2634809017181396, 1.3471633195877075, 1.4308457374572754, 1.5145281553268433, 1.5982105731964111, 1.681892991065979, 1.7655754089355469, 1.8492578268051147, 1.9329402446746826, 2.016622543334961, 2.1003050804138184, 2.183987617492676, 2.267669916152954, 2.3513522148132324, 2.43503475189209, 2.5187172889709473, 2.6023995876312256, 2.686081886291504, 2.7697644233703613, 2.8534469604492188, 2.937129259109497, 3.0208115577697754, 3.104494094848633, 3.1881766319274902, 3.2718589305877686, 3.355541229248047, 3.4392237663269043, 3.5229063034057617, 3.60658860206604, 3.6902709007263184, 3.773953437805176, 3.857635974884033, 3.9413182735443115]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 12.0, 10.0, 22.0, 30.0, 39.0, 57.0, 106.0, 181.0, 243.0, 389.0, 549.0, 837.0, 1346.0, 2054.0, 3260.0, 5057.0, 8182.0, 13241.0, 21684.0, 36856.0, 64947.0, 128402.0, 264975.0, 239516.0, 111804.0, 58508.0, 33747.0, 19904.0, 11959.0, 7610.0, 4655.0, 2942.0, 1968.0, 1201.0, 792.0, 483.0, 369.0, 210.0, 128.0, 109.0, 52.0, 42.0, 29.0, 15.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1435546875, -0.1391925811767578, -0.13483047485351562, -0.13046836853027344, -0.12610626220703125, -0.12174415588378906, -0.11738204956054688, -0.11301994323730469, -0.1086578369140625, -0.10429573059082031, -0.09993362426757812, -0.09557151794433594, -0.09120941162109375, -0.08684730529785156, -0.08248519897460938, -0.07812309265136719, -0.073760986328125, -0.06939888000488281, -0.06503677368164062, -0.06067466735839844, -0.05631256103515625, -0.05195045471191406, -0.047588348388671875, -0.04322624206542969, -0.0388641357421875, -0.03450202941894531, -0.030139923095703125, -0.025777816772460938, -0.02141571044921875, -0.017053604125976562, -0.012691497802734375, -0.008329391479492188, -0.00396728515625, 0.0003948211669921875, 0.004756927490234375, 0.009119033813476562, 0.01348114013671875, 0.017843246459960938, 0.022205352783203125, 0.026567459106445312, 0.0309295654296875, 0.03529167175292969, 0.039653778076171875, 0.04401588439941406, 0.04837799072265625, 0.05274009704589844, 0.057102203369140625, 0.06146430969238281, 0.065826416015625, 0.07018852233886719, 0.07455062866210938, 0.07891273498535156, 0.08327484130859375, 0.08763694763183594, 0.09199905395507812, 0.09636116027832031, 0.1007232666015625, 0.10508537292480469, 0.10944747924804688, 0.11380958557128906, 0.11817169189453125, 0.12253379821777344, 0.12689590454101562, 0.1312580108642578, 0.1356201171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 11.0, 12.0, 16.0, 23.0, 33.0, 45.0, 45.0, 57.0, 62.0, 59.0, 68.0, 71.0, 68.0, 61.0, 60.0, 45.0, 55.0, 47.0, 41.0, 27.0, 26.0, 22.0, 16.0, 12.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15185260772705078, -0.14794349670410156, -0.14403438568115234, -0.14012527465820312, -0.1362161636352539, -0.1323070526123047, -0.12839794158935547, -0.12448883056640625, -0.12057971954345703, -0.11667060852050781, -0.1127614974975586, -0.10885238647460938, -0.10494327545166016, -0.10103416442871094, -0.09712505340576172, -0.0932159423828125, -0.08930683135986328, -0.08539772033691406, -0.08148860931396484, -0.07757949829101562, -0.0736703872680664, -0.06976127624511719, -0.06585216522216797, -0.06194305419921875, -0.05803394317626953, -0.05412483215332031, -0.050215721130371094, -0.046306610107421875, -0.042397499084472656, -0.03848838806152344, -0.03457927703857422, -0.030670166015625, -0.02676105499267578, -0.022851943969726562, -0.018942832946777344, -0.015033721923828125, -0.011124610900878906, -0.0072154998779296875, -0.0033063888549804688, 0.00060272216796875, 0.004511833190917969, 0.008420944213867188, 0.012330055236816406, 0.016239166259765625, 0.020148277282714844, 0.024057388305664062, 0.02796649932861328, 0.0318756103515625, 0.03578472137451172, 0.03969383239746094, 0.043602943420410156, 0.047512054443359375, 0.051421165466308594, 0.05533027648925781, 0.05923938751220703, 0.06314849853515625, 0.06705760955810547, 0.07096672058105469, 0.0748758316040039, 0.07878494262695312, 0.08269405364990234, 0.08660316467285156, 0.09051227569580078, 0.09442138671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 8.0, 10.0, 14.0, 17.0, 16.0, 18.0, 29.0, 48.0, 59.0, 83.0, 96.0, 140.0, 228.0, 374.0, 558.0, 950.0, 1706.0, 3625.0, 9569.0, 34355.0, 210116.0, 687107.0, 71763.0, 16416.0, 5414.0, 2414.0, 1234.0, 765.0, 448.0, 251.0, 189.0, 161.0, 95.0, 77.0, 56.0, 49.0, 24.0, 26.0, 12.0, 12.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.45166015625, -0.4380683898925781, -0.42447662353515625, -0.4108848571777344, -0.3972930908203125, -0.3837013244628906, -0.37010955810546875, -0.3565177917480469, -0.342926025390625, -0.3293342590332031, -0.31574249267578125, -0.3021507263183594, -0.2885589599609375, -0.2749671936035156, -0.26137542724609375, -0.24778366088867188, -0.23419189453125, -0.22060012817382812, -0.20700836181640625, -0.19341659545898438, -0.1798248291015625, -0.16623306274414062, -0.15264129638671875, -0.13904953002929688, -0.125457763671875, -0.11186599731445312, -0.09827423095703125, -0.08468246459960938, -0.0710906982421875, -0.057498931884765625, -0.04390716552734375, -0.030315399169921875, -0.0167236328125, -0.003131866455078125, 0.01045989990234375, 0.024051666259765625, 0.0376434326171875, 0.051235198974609375, 0.06482696533203125, 0.07841873168945312, 0.092010498046875, 0.10560226440429688, 0.11919403076171875, 0.13278579711914062, 0.1463775634765625, 0.15996932983398438, 0.17356109619140625, 0.18715286254882812, 0.20074462890625, 0.21433639526367188, 0.22792816162109375, 0.24151992797851562, 0.2551116943359375, 0.2687034606933594, 0.28229522705078125, 0.2958869934082031, 0.309478759765625, 0.3230705261230469, 0.33666229248046875, 0.3502540588378906, 0.3638458251953125, 0.3774375915527344, 0.39102935791015625, 0.4046211242675781, 0.418212890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 10.0, 16.0, 19.0, 21.0, 28.0, 37.0, 39.0, 35.0, 39.0, 38.0, 44.0, 57.0, 45.0, 51.0, 66.0, 54.0, 51.0, 50.0, 38.0, 33.0, 32.0, 29.0, 22.0, 23.0, 13.0, 26.0, 18.0, 10.0, 5.0, 8.0, 9.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.53515625, -0.5210113525390625, -0.506866455078125, -0.4927215576171875, -0.47857666015625, -0.4644317626953125, -0.450286865234375, -0.4361419677734375, -0.4219970703125, -0.4078521728515625, -0.393707275390625, -0.3795623779296875, -0.36541748046875, -0.3512725830078125, -0.337127685546875, -0.3229827880859375, -0.308837890625, -0.2946929931640625, -0.280548095703125, -0.2664031982421875, -0.25225830078125, -0.2381134033203125, -0.223968505859375, -0.2098236083984375, -0.1956787109375, -0.1815338134765625, -0.167388916015625, -0.1532440185546875, -0.13909912109375, -0.1249542236328125, -0.110809326171875, -0.0966644287109375, -0.08251953125, -0.0683746337890625, -0.054229736328125, -0.0400848388671875, -0.02593994140625, -0.0117950439453125, 0.002349853515625, 0.0164947509765625, 0.0306396484375, 0.0447845458984375, 0.058929443359375, 0.0730743408203125, 0.08721923828125, 0.1013641357421875, 0.115509033203125, 0.1296539306640625, 0.143798828125, 0.1579437255859375, 0.172088623046875, 0.1862335205078125, 0.20037841796875, 0.2145233154296875, 0.228668212890625, 0.2428131103515625, 0.2569580078125, 0.2711029052734375, 0.285247802734375, 0.2993927001953125, 0.31353759765625, 0.3276824951171875, 0.341827392578125, 0.3559722900390625, 0.3701171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 10.0, 20.0, 33.0, 48.0, 62.0, 137.0, 283.0, 570.0, 1442.0, 4207.0, 16318.0, 96492.0, 742118.0, 154433.0, 23484.0, 5589.0, 1825.0, 764.0, 336.0, 163.0, 86.0, 46.0, 30.0, 20.0, 7.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24821090698242188, -0.24178314208984375, -0.23535537719726562, -0.2289276123046875, -0.22249984741210938, -0.21607208251953125, -0.20964431762695312, -0.203216552734375, -0.19678878784179688, -0.19036102294921875, -0.18393325805664062, -0.1775054931640625, -0.17107772827148438, -0.16464996337890625, -0.15822219848632812, -0.15179443359375, -0.14536666870117188, -0.13893890380859375, -0.13251113891601562, -0.1260833740234375, -0.11965560913085938, -0.11322784423828125, -0.10680007934570312, -0.100372314453125, -0.09394454956054688, -0.08751678466796875, -0.08108901977539062, -0.0746612548828125, -0.06823348999023438, -0.06180572509765625, -0.055377960205078125, -0.0489501953125, -0.042522430419921875, -0.03609466552734375, -0.029666900634765625, -0.0232391357421875, -0.016811370849609375, -0.01038360595703125, -0.003955841064453125, 0.002471923828125, 0.008899688720703125, 0.01532745361328125, 0.021755218505859375, 0.0281829833984375, 0.034610748291015625, 0.04103851318359375, 0.047466278076171875, 0.05389404296875, 0.060321807861328125, 0.06674957275390625, 0.07317733764648438, 0.0796051025390625, 0.08603286743164062, 0.09246063232421875, 0.09888839721679688, 0.105316162109375, 0.11174392700195312, 0.11817169189453125, 0.12459945678710938, 0.1310272216796875, 0.13745498657226562, 0.14388275146484375, 0.15031051635742188, 0.15673828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 15.0, 16.0, 14.0, 17.0, 22.0, 30.0, 37.0, 33.0, 59.0, 70.0, 75.0, 86.0, 75.0, 84.0, 53.0, 54.0, 43.0, 26.0, 30.0, 20.0, 19.0, 13.0, 8.0, 9.0, 8.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8683414459228516e-05, -3.7243589758872986e-05, -3.5803765058517456e-05, -3.4363940358161926e-05, -3.2924115657806396e-05, -3.148429095745087e-05, -3.0044466257095337e-05, -2.8604641556739807e-05, -2.7164816856384277e-05, -2.5724992156028748e-05, -2.4285167455673218e-05, -2.2845342755317688e-05, -2.1405518054962158e-05, -1.996569335460663e-05, -1.85258686542511e-05, -1.708604395389557e-05, -1.564621925354004e-05, -1.420639455318451e-05, -1.276656985282898e-05, -1.132674515247345e-05, -9.88692045211792e-06, -8.44709575176239e-06, -7.00727105140686e-06, -5.5674463510513306e-06, -4.127621650695801e-06, -2.687796950340271e-06, -1.2479722499847412e-06, 1.9185245037078857e-07, 1.6316771507263184e-06, 3.071501851081848e-06, 4.511326551437378e-06, 5.951151251792908e-06, 7.3909759521484375e-06, 8.830800652503967e-06, 1.0270625352859497e-05, 1.1710450053215027e-05, 1.3150274753570557e-05, 1.4590099453926086e-05, 1.6029924154281616e-05, 1.7469748854637146e-05, 1.8909573554992676e-05, 2.0349398255348206e-05, 2.1789222955703735e-05, 2.3229047656059265e-05, 2.4668872356414795e-05, 2.6108697056770325e-05, 2.7548521757125854e-05, 2.8988346457481384e-05, 3.0428171157836914e-05, 3.1867995858192444e-05, 3.3307820558547974e-05, 3.4747645258903503e-05, 3.618746995925903e-05, 3.762729465961456e-05, 3.906711935997009e-05, 4.050694406032562e-05, 4.194676876068115e-05, 4.338659346103668e-05, 4.482641816139221e-05, 4.626624286174774e-05, 4.770606756210327e-05, 4.91458922624588e-05, 5.058571696281433e-05, 5.202554166316986e-05, 5.346536636352539e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 13.0, 14.0, 13.0, 27.0, 29.0, 40.0, 59.0, 87.0, 129.0, 198.0, 310.0, 499.0, 864.0, 1625.0, 3577.0, 9314.0, 35639.0, 205126.0, 663780.0, 95898.0, 19752.0, 5879.0, 2490.0, 1211.0, 749.0, 425.0, 253.0, 172.0, 101.0, 78.0, 57.0, 38.0, 20.0, 19.0, 12.0, 12.0, 9.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.14892578125, -0.1441669464111328, -0.13940811157226562, -0.13464927673339844, -0.12989044189453125, -0.12513160705566406, -0.12037277221679688, -0.11561393737792969, -0.1108551025390625, -0.10609626770019531, -0.10133743286132812, -0.09657859802246094, -0.09181976318359375, -0.08706092834472656, -0.08230209350585938, -0.07754325866699219, -0.072784423828125, -0.06802558898925781, -0.06326675415039062, -0.05850791931152344, -0.05374908447265625, -0.04899024963378906, -0.044231414794921875, -0.03947257995605469, -0.0347137451171875, -0.029954910278320312, -0.025196075439453125, -0.020437240600585938, -0.01567840576171875, -0.010919570922851562, -0.006160736083984375, -0.0014019012451171875, 0.00335693359375, 0.008115768432617188, 0.012874603271484375, 0.017633438110351562, 0.02239227294921875, 0.027151107788085938, 0.031909942626953125, 0.03666877746582031, 0.0414276123046875, 0.04618644714355469, 0.050945281982421875, 0.05570411682128906, 0.06046295166015625, 0.06522178649902344, 0.06998062133789062, 0.07473945617675781, 0.079498291015625, 0.08425712585449219, 0.08901596069335938, 0.09377479553222656, 0.09853363037109375, 0.10329246520996094, 0.10805130004882812, 0.11281013488769531, 0.1175689697265625, 0.12232780456542969, 0.12708663940429688, 0.13184547424316406, 0.13660430908203125, 0.14136314392089844, 0.14612197875976562, 0.1508808135986328, 0.1556396484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 15.0, 16.0, 20.0, 16.0, 15.0, 38.0, 31.0, 37.0, 59.0, 45.0, 64.0, 75.0, 71.0, 66.0, 69.0, 57.0, 57.0, 38.0, 42.0, 31.0, 17.0, 20.0, 15.0, 17.0, 8.0, 6.0, 8.0, 3.0, 3.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12138748168945312, -0.11728668212890625, -0.11318588256835938, -0.1090850830078125, -0.10498428344726562, -0.10088348388671875, -0.09678268432617188, -0.092681884765625, -0.08858108520507812, -0.08448028564453125, -0.08037948608398438, -0.0762786865234375, -0.07217788696289062, -0.06807708740234375, -0.06397628784179688, -0.05987548828125, -0.055774688720703125, -0.05167388916015625, -0.047573089599609375, -0.0434722900390625, -0.039371490478515625, -0.03527069091796875, -0.031169891357421875, -0.027069091796875, -0.022968292236328125, -0.01886749267578125, -0.014766693115234375, -0.0106658935546875, -0.006565093994140625, -0.00246429443359375, 0.001636505126953125, 0.0057373046875, 0.009838104248046875, 0.01393890380859375, 0.018039703369140625, 0.0221405029296875, 0.026241302490234375, 0.03034210205078125, 0.034442901611328125, 0.038543701171875, 0.042644500732421875, 0.04674530029296875, 0.050846099853515625, 0.0549468994140625, 0.059047698974609375, 0.06314849853515625, 0.06724929809570312, 0.07135009765625, 0.07545089721679688, 0.07955169677734375, 0.08365249633789062, 0.0877532958984375, 0.09185409545898438, 0.09595489501953125, 0.10005569458007812, 0.104156494140625, 0.10825729370117188, 0.11235809326171875, 0.11645889282226562, 0.1205596923828125, 0.12466049194335938, 0.12876129150390625, 0.13286209106445312, 0.136962890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 17.0, 40.0, 78.0, 124.0, 279.0, 205.0, 109.0, 64.0, 27.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.352621555328369, -3.210792303085327, -3.068963050842285, -2.927133798599243, -2.785304546356201, -2.643475294113159, -2.501646041870117, -2.359816789627075, -2.217987537384033, -2.076158285140991, -1.9343290328979492, -1.7924997806549072, -1.6506705284118652, -1.5088412761688232, -1.3670120239257812, -1.2251827716827393, -1.0833535194396973, -0.9415242671966553, -0.7996950149536133, -0.6578657627105713, -0.5160365104675293, -0.3742072582244873, -0.2323780059814453, -0.09054875373840332, 0.05128049850463867, 0.19310975074768066, 0.33493900299072266, 0.47676825523376465, 0.6185975074768066, 0.7604267597198486, 0.9022560119628906, 1.0440852642059326, 1.1859140396118164, 1.3277432918548584, 1.4695725440979004, 1.6114017963409424, 1.7532310485839844, 1.8950603008270264, 2.0368895530700684, 2.1787188053131104, 2.3205480575561523, 2.4623773097991943, 2.6042065620422363, 2.7460358142852783, 2.8878650665283203, 3.0296943187713623, 3.1715235710144043, 3.3133528232574463, 3.4551820755004883, 3.5970113277435303, 3.7388405799865723, 3.8806698322296143, 4.022499084472656, 4.164328575134277, 4.30615758895874, 4.447986602783203, 4.589816093444824, 4.731645584106445, 4.873474597930908, 5.015303611755371, 5.157133102416992, 5.298962593078613, 5.440791606903076, 5.582620620727539, 5.72445011138916]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 8.0, 1.0, 18.0, 12.0, 12.0, 21.0, 19.0, 24.0, 26.0, 22.0, 23.0, 30.0, 39.0, 38.0, 52.0, 53.0, 63.0, 50.0, 62.0, 46.0, 45.0, 32.0, 37.0, 38.0, 28.0, 23.0, 27.0, 24.0, 14.0, 22.0, 13.0, 22.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6170198917388916, -1.5671344995498657, -1.5172491073608398, -1.4673638343811035, -1.4174784421920776, -1.3675930500030518, -1.3177076578140259, -1.267822265625, -1.2179369926452637, -1.1680516004562378, -1.118166208267212, -1.0682809352874756, -1.0183955430984497, -0.9685101509094238, -0.918624758720398, -0.8687393665313721, -0.8188539743423462, -0.7689685821533203, -0.7190832495689392, -0.6691978573799133, -0.6193125247955322, -0.5694271326065063, -0.5195417404174805, -0.469656378030777, -0.4197710156440735, -0.36988565325737, -0.3200002908706665, -0.2701148986816406, -0.22022953629493713, -0.17034417390823364, -0.12045878171920776, -0.07057341933250427, -0.02068793773651123, 0.029197432100772858, 0.07908280193805695, 0.12896817922592163, 0.17885354161262512, 0.2287389039993286, 0.2786242961883545, 0.328509658575058, 0.3783950209617615, 0.42828038334846497, 0.47816574573516846, 0.5280511379241943, 0.5779365301132202, 0.6278218626976013, 0.6777072548866272, 0.7275925874710083, 0.7774779796600342, 0.8273633718490601, 0.8772487044334412, 0.927134096622467, 0.9770194292068481, 1.026904821395874, 1.0767902135849, 1.1266756057739258, 1.176560878753662, 1.226446270942688, 1.2763316631317139, 1.3262169361114502, 1.376102328300476, 1.425987720489502, 1.4758731126785278, 1.5257585048675537, 1.5756438970565796]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 7.0, 16.0, 18.0, 13.0, 43.0, 54.0, 78.0, 110.0, 178.0, 274.0, 448.0, 767.0, 1300.0, 2189.0, 3901.0, 7173.0, 13792.0, 28199.0, 61542.0, 157710.0, 478225.0, 1372458.0, 1336529.0, 457310.0, 153234.0, 60513.0, 27780.0, 13703.0, 7208.0, 3969.0, 2220.0, 1279.0, 723.0, 471.0, 285.0, 204.0, 116.0, 83.0, 47.0, 31.0, 26.0, 16.0, 19.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.08682632446289062, -0.08393096923828125, -0.08103561401367188, -0.0781402587890625, -0.07524490356445312, -0.07234954833984375, -0.06945419311523438, -0.066558837890625, -0.06366348266601562, -0.06076812744140625, -0.057872772216796875, -0.0549774169921875, -0.052082061767578125, -0.04918670654296875, -0.046291351318359375, -0.04339599609375, -0.040500640869140625, -0.03760528564453125, -0.034709930419921875, -0.0318145751953125, -0.028919219970703125, -0.02602386474609375, -0.023128509521484375, -0.020233154296875, -0.017337799072265625, -0.01444244384765625, -0.011547088623046875, -0.0086517333984375, -0.005756378173828125, -0.00286102294921875, 3.4332275390625e-05, 0.0029296875, 0.005825042724609375, 0.00872039794921875, 0.011615753173828125, 0.0145111083984375, 0.017406463623046875, 0.02030181884765625, 0.023197174072265625, 0.026092529296875, 0.028987884521484375, 0.03188323974609375, 0.034778594970703125, 0.0376739501953125, 0.040569305419921875, 0.04346466064453125, 0.046360015869140625, 0.04925537109375, 0.052150726318359375, 0.05504608154296875, 0.057941436767578125, 0.0608367919921875, 0.06373214721679688, 0.06662750244140625, 0.06952285766601562, 0.072418212890625, 0.07531356811523438, 0.07820892333984375, 0.08110427856445312, 0.0839996337890625, 0.08689498901367188, 0.08979034423828125, 0.09268569946289062, 0.0955810546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 10.0, 9.0, 14.0, 17.0, 19.0, 26.0, 30.0, 37.0, 37.0, 37.0, 41.0, 52.0, 40.0, 51.0, 40.0, 45.0, 38.0, 49.0, 48.0, 50.0, 34.0, 35.0, 35.0, 24.0, 18.0, 21.0, 16.0, 16.0, 16.0, 11.0, 5.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0731201171875, -0.07046890258789062, -0.06781768798828125, -0.06516647338867188, -0.0625152587890625, -0.059864044189453125, -0.05721282958984375, -0.054561614990234375, -0.051910400390625, -0.049259185791015625, -0.04660797119140625, -0.043956756591796875, -0.0413055419921875, -0.038654327392578125, -0.03600311279296875, -0.033351898193359375, -0.03070068359375, -0.028049468994140625, -0.02539825439453125, -0.022747039794921875, -0.0200958251953125, -0.017444610595703125, -0.01479339599609375, -0.012142181396484375, -0.009490966796875, -0.006839752197265625, -0.00418853759765625, -0.001537322998046875, 0.0011138916015625, 0.003765106201171875, 0.00641632080078125, 0.009067535400390625, 0.01171875, 0.014369964599609375, 0.01702117919921875, 0.019672393798828125, 0.0223236083984375, 0.024974822998046875, 0.02762603759765625, 0.030277252197265625, 0.032928466796875, 0.035579681396484375, 0.03823089599609375, 0.040882110595703125, 0.0435333251953125, 0.046184539794921875, 0.04883575439453125, 0.051486968994140625, 0.05413818359375, 0.056789398193359375, 0.05944061279296875, 0.062091827392578125, 0.0647430419921875, 0.06739425659179688, 0.07004547119140625, 0.07269668579101562, 0.075347900390625, 0.07799911499023438, 0.08065032958984375, 0.08330154418945312, 0.0859527587890625, 0.08860397338867188, 0.09125518798828125, 0.09390640258789062, 0.0965576171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 10.0, 21.0, 27.0, 46.0, 71.0, 109.0, 207.0, 457.0, 1202.0, 3765.0, 15801.0, 99486.0, 1393468.0, 2477906.0, 167879.0, 24936.0, 5796.0, 1823.0, 621.0, 265.0, 156.0, 90.0, 54.0, 32.0, 12.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.26617431640625, -0.2559814453125, -0.24578857421875, -0.235595703125, -0.22540283203125, -0.2152099609375, -0.20501708984375, -0.19482421875, -0.18463134765625, -0.1744384765625, -0.16424560546875, -0.154052734375, -0.14385986328125, -0.1336669921875, -0.12347412109375, -0.11328125, -0.10308837890625, -0.0928955078125, -0.08270263671875, -0.072509765625, -0.06231689453125, -0.0521240234375, -0.04193115234375, -0.03173828125, -0.02154541015625, -0.0113525390625, -0.00115966796875, 0.009033203125, 0.01922607421875, 0.0294189453125, 0.03961181640625, 0.0498046875, 0.05999755859375, 0.0701904296875, 0.08038330078125, 0.090576171875, 0.10076904296875, 0.1109619140625, 0.12115478515625, 0.13134765625, 0.14154052734375, 0.1517333984375, 0.16192626953125, 0.172119140625, 0.18231201171875, 0.1925048828125, 0.20269775390625, 0.212890625, 0.22308349609375, 0.2332763671875, 0.24346923828125, 0.253662109375, 0.26385498046875, 0.2740478515625, 0.28424072265625, 0.29443359375, 0.30462646484375, 0.3148193359375, 0.32501220703125, 0.335205078125, 0.34539794921875, 0.3555908203125, 0.36578369140625, 0.3759765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 10.0, 13.0, 3.0, 11.0, 20.0, 20.0, 23.0, 37.0, 60.0, 60.0, 109.0, 148.0, 251.0, 325.0, 421.0, 504.0, 588.0, 409.0, 294.0, 213.0, 142.0, 98.0, 79.0, 58.0, 45.0, 40.0, 22.0, 15.0, 23.0, 9.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.27581024169921875, -0.2671966552734375, -0.25858306884765625, -0.249969482421875, -0.24135589599609375, -0.2327423095703125, -0.22412872314453125, -0.21551513671875, -0.20690155029296875, -0.1982879638671875, -0.18967437744140625, -0.181060791015625, -0.17244720458984375, -0.1638336181640625, -0.15522003173828125, -0.1466064453125, -0.13799285888671875, -0.1293792724609375, -0.12076568603515625, -0.112152099609375, -0.10353851318359375, -0.0949249267578125, -0.08631134033203125, -0.07769775390625, -0.06908416748046875, -0.0604705810546875, -0.05185699462890625, -0.043243408203125, -0.03462982177734375, -0.0260162353515625, -0.01740264892578125, -0.0087890625, -0.00017547607421875, 0.0084381103515625, 0.01705169677734375, 0.025665283203125, 0.03427886962890625, 0.0428924560546875, 0.05150604248046875, 0.06011962890625, 0.06873321533203125, 0.0773468017578125, 0.08596038818359375, 0.094573974609375, 0.10318756103515625, 0.1118011474609375, 0.12041473388671875, 0.1290283203125, 0.13764190673828125, 0.1462554931640625, 0.15486907958984375, 0.163482666015625, 0.17209625244140625, 0.1807098388671875, 0.18932342529296875, 0.19793701171875, 0.20655059814453125, 0.2151641845703125, 0.22377777099609375, 0.232391357421875, 0.24100494384765625, 0.2496185302734375, 0.25823211669921875, 0.266845703125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 33.0, 119.0, 305.0, 334.0, 141.0, 37.0, 8.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.593810081481934, -4.385926246643066, -4.178042411804199, -3.970158576965332, -3.762274742126465, -3.5543909072875977, -3.3465073108673096, -3.1386234760284424, -2.930739641189575, -2.722855806350708, -2.514971971511841, -2.3070883750915527, -2.0992045402526855, -1.8913205862045288, -1.6834368705749512, -1.475553035736084, -1.2676692008972168, -1.0597853660583496, -0.8519015908241272, -0.6440178155899048, -0.4361339807510376, -0.2282501459121704, -0.020366430282592773, 0.18751740455627441, 0.3954012393951416, 0.6032850742340088, 0.8111688494682312, 1.0190526247024536, 1.2269364595413208, 1.434820294380188, 1.6427040100097656, 1.8505878448486328, 2.0584716796875, 2.266355514526367, 2.4742393493652344, 2.6821231842041016, 2.8900070190429688, 3.097890853881836, 3.305774450302124, 3.513658285140991, 3.7215421199798584, 3.9294259548187256, 4.137309551239014, 4.345193386077881, 4.553077220916748, 4.760961055755615, 4.968844890594482, 5.17672872543335, 5.384612560272217, 5.592496395111084, 5.800380229949951, 6.008264064788818, 6.2161478996276855, 6.424031734466553, 6.631915092468262, 6.839798927307129, 7.047682762145996, 7.255566596984863, 7.4634504318237305, 7.671334266662598, 7.879218101501465, 8.087101936340332, 8.2949857711792, 8.502869606018066, 8.710753440856934]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 5.0, 18.0, 11.0, 9.0, 18.0, 21.0, 27.0, 37.0, 26.0, 30.0, 50.0, 47.0, 50.0, 54.0, 58.0, 52.0, 65.0, 50.0, 44.0, 37.0, 42.0, 32.0, 37.0, 34.0, 28.0, 27.0, 18.0, 15.0, 14.0, 4.0, 9.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7327477931976318, -1.6812776327133179, -1.6298075914382935, -1.5783374309539795, -1.526867389678955, -1.4753972291946411, -1.4239270687103271, -1.3724570274353027, -1.3209868669509888, -1.2695167064666748, -1.2180466651916504, -1.1665765047073364, -1.1151063442230225, -1.063636302947998, -1.012166142463684, -0.9606960415840149, -0.9092259407043457, -0.8577558398246765, -0.8062857389450073, -0.7548155784606934, -0.7033454775810242, -0.651875376701355, -0.600405216217041, -0.5489351153373718, -0.49746501445770264, -0.44599491357803345, -0.39452478289604187, -0.3430546522140503, -0.2915845513343811, -0.24011445045471191, -0.18864431977272034, -0.13717418909072876, -0.08570408821105957, -0.03423397243022919, 0.017236143350601196, 0.06870625913143158, 0.12017637491226196, 0.17164647579193115, 0.22311660647392273, 0.2745867371559143, 0.3260568380355835, 0.3775269389152527, 0.42899706959724426, 0.48046720027923584, 0.531937301158905, 0.5834074020385742, 0.6348775625228882, 0.6863476634025574, 0.7378177642822266, 0.7892878651618958, 0.8407579660415649, 0.8922281265258789, 0.9436982274055481, 0.9951683282852173, 1.0466384887695312, 1.0981085300445557, 1.1495786905288696, 1.2010488510131836, 1.252518892288208, 1.303989052772522, 1.355459213256836, 1.4069292545318604, 1.4583994150161743, 1.5098695755004883, 1.5613396167755127]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 6.0, 15.0, 19.0, 24.0, 37.0, 58.0, 72.0, 132.0, 197.0, 304.0, 417.0, 660.0, 1026.0, 1609.0, 2544.0, 4038.0, 6968.0, 12157.0, 22698.0, 47008.0, 116031.0, 306390.0, 308740.0, 116705.0, 47094.0, 23078.0, 12225.0, 7058.0, 4092.0, 2550.0, 1583.0, 1022.0, 680.0, 428.0, 295.0, 199.0, 123.0, 97.0, 59.0, 37.0, 31.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.16788673400878906, -0.16279983520507812, -0.1577129364013672, -0.15262603759765625, -0.1475391387939453, -0.14245223999023438, -0.13736534118652344, -0.1322784423828125, -0.12719154357910156, -0.12210464477539062, -0.11701774597167969, -0.11193084716796875, -0.10684394836425781, -0.10175704956054688, -0.09667015075683594, -0.091583251953125, -0.08649635314941406, -0.08140945434570312, -0.07632255554199219, -0.07123565673828125, -0.06614875793457031, -0.061061859130859375, -0.05597496032714844, -0.0508880615234375, -0.04580116271972656, -0.040714263916015625, -0.03562736511230469, -0.03054046630859375, -0.025453567504882812, -0.020366668701171875, -0.015279769897460938, -0.01019287109375, -0.0051059722900390625, -1.9073486328125e-05, 0.0050678253173828125, 0.01015472412109375, 0.015241622924804688, 0.020328521728515625, 0.025415420532226562, 0.0305023193359375, 0.03558921813964844, 0.040676116943359375, 0.04576301574707031, 0.05084991455078125, 0.05593681335449219, 0.061023712158203125, 0.06611061096191406, 0.071197509765625, 0.07628440856933594, 0.08137130737304688, 0.08645820617675781, 0.09154510498046875, 0.09663200378417969, 0.10171890258789062, 0.10680580139160156, 0.1118927001953125, 0.11697959899902344, 0.12206649780273438, 0.1271533966064453, 0.13224029541015625, 0.1373271942138672, 0.14241409301757812, 0.14750099182128906, 0.152587890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 11.0, 9.0, 12.0, 11.0, 30.0, 16.0, 22.0, 21.0, 31.0, 36.0, 35.0, 37.0, 35.0, 49.0, 46.0, 56.0, 39.0, 37.0, 50.0, 45.0, 41.0, 39.0, 40.0, 28.0, 39.0, 18.0, 19.0, 18.0, 20.0, 14.0, 16.0, 19.0, 8.0, 9.0, 14.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.09566974639892578, -0.09282875061035156, -0.08998775482177734, -0.08714675903320312, -0.0843057632446289, -0.08146476745605469, -0.07862377166748047, -0.07578277587890625, -0.07294178009033203, -0.07010078430175781, -0.0672597885131836, -0.06441879272460938, -0.061577796936035156, -0.05873680114746094, -0.05589580535888672, -0.0530548095703125, -0.05021381378173828, -0.04737281799316406, -0.044531822204589844, -0.041690826416015625, -0.038849830627441406, -0.03600883483886719, -0.03316783905029297, -0.03032684326171875, -0.02748584747314453, -0.024644851684570312, -0.021803855895996094, -0.018962860107421875, -0.016121864318847656, -0.013280868530273438, -0.010439872741699219, -0.007598876953125, -0.004757881164550781, -0.0019168853759765625, 0.0009241104125976562, 0.003765106201171875, 0.006606101989746094, 0.009447097778320312, 0.012288093566894531, 0.01512908935546875, 0.01797008514404297, 0.020811080932617188, 0.023652076721191406, 0.026493072509765625, 0.029334068298339844, 0.03217506408691406, 0.03501605987548828, 0.0378570556640625, 0.04069805145263672, 0.04353904724121094, 0.046380043029785156, 0.049221038818359375, 0.052062034606933594, 0.05490303039550781, 0.05774402618408203, 0.06058502197265625, 0.06342601776123047, 0.06626701354980469, 0.0691080093383789, 0.07194900512695312, 0.07479000091552734, 0.07763099670410156, 0.08047199249267578, 0.08331298828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 15.0, 25.0, 29.0, 30.0, 50.0, 66.0, 99.0, 138.0, 200.0, 375.0, 582.0, 1079.0, 2474.0, 7259.0, 28125.0, 225900.0, 707806.0, 55352.0, 11777.0, 3585.0, 1484.0, 746.0, 428.0, 258.0, 188.0, 112.0, 76.0, 69.0, 56.0, 34.0, 38.0, 22.0, 4.0, 17.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4618377685546875, -0.448333740234375, -0.4348297119140625, -0.42132568359375, -0.4078216552734375, -0.394317626953125, -0.3808135986328125, -0.3673095703125, -0.3538055419921875, -0.340301513671875, -0.3267974853515625, -0.31329345703125, -0.2997894287109375, -0.286285400390625, -0.2727813720703125, -0.25927734375, -0.2457733154296875, -0.232269287109375, -0.2187652587890625, -0.20526123046875, -0.1917572021484375, -0.178253173828125, -0.1647491455078125, -0.1512451171875, -0.1377410888671875, -0.124237060546875, -0.1107330322265625, -0.09722900390625, -0.0837249755859375, -0.070220947265625, -0.0567169189453125, -0.043212890625, -0.0297088623046875, -0.016204833984375, -0.0027008056640625, 0.01080322265625, 0.0243072509765625, 0.037811279296875, 0.0513153076171875, 0.0648193359375, 0.0783233642578125, 0.091827392578125, 0.1053314208984375, 0.11883544921875, 0.1323394775390625, 0.145843505859375, 0.1593475341796875, 0.1728515625, 0.1863555908203125, 0.199859619140625, 0.2133636474609375, 0.22686767578125, 0.2403717041015625, 0.253875732421875, 0.2673797607421875, 0.2808837890625, 0.2943878173828125, 0.307891845703125, 0.3213958740234375, 0.33489990234375, 0.3484039306640625, 0.361907958984375, 0.3754119873046875, 0.388916015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 3.0, 9.0, 7.0, 8.0, 22.0, 18.0, 30.0, 22.0, 33.0, 29.0, 38.0, 54.0, 40.0, 52.0, 44.0, 59.0, 55.0, 45.0, 59.0, 44.0, 45.0, 40.0, 39.0, 33.0, 21.0, 24.0, 22.0, 18.0, 17.0, 18.0, 7.0, 4.0, 5.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5087890625, -0.49488067626953125, -0.4809722900390625, -0.46706390380859375, -0.453155517578125, -0.43924713134765625, -0.4253387451171875, -0.41143035888671875, -0.39752197265625, -0.38361358642578125, -0.3697052001953125, -0.35579681396484375, -0.341888427734375, -0.32798004150390625, -0.3140716552734375, -0.30016326904296875, -0.2862548828125, -0.27234649658203125, -0.2584381103515625, -0.24452972412109375, -0.230621337890625, -0.21671295166015625, -0.2028045654296875, -0.18889617919921875, -0.17498779296875, -0.16107940673828125, -0.1471710205078125, -0.13326263427734375, -0.119354248046875, -0.10544586181640625, -0.0915374755859375, -0.07762908935546875, -0.063720703125, -0.04981231689453125, -0.0359039306640625, -0.02199554443359375, -0.008087158203125, 0.00582122802734375, 0.0197296142578125, 0.03363800048828125, 0.04754638671875, 0.06145477294921875, 0.0753631591796875, 0.08927154541015625, 0.103179931640625, 0.11708831787109375, 0.1309967041015625, 0.14490509033203125, 0.1588134765625, 0.17272186279296875, 0.1866302490234375, 0.20053863525390625, 0.214447021484375, 0.22835540771484375, 0.2422637939453125, 0.25617218017578125, 0.27008056640625, 0.28398895263671875, 0.2978973388671875, 0.31180572509765625, 0.325714111328125, 0.33962249755859375, 0.3535308837890625, 0.36743927001953125, 0.38134765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 12.0, 13.0, 19.0, 20.0, 45.0, 72.0, 145.0, 261.0, 502.0, 1068.0, 2956.0, 9259.0, 39906.0, 248455.0, 646810.0, 76062.0, 15581.0, 4404.0, 1571.0, 691.0, 304.0, 162.0, 96.0, 47.0, 39.0, 14.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17308998107910156, -0.16771316528320312, -0.1623363494873047, -0.15695953369140625, -0.1515827178955078, -0.14620590209960938, -0.14082908630371094, -0.1354522705078125, -0.13007545471191406, -0.12469863891601562, -0.11932182312011719, -0.11394500732421875, -0.10856819152832031, -0.10319137573242188, -0.09781455993652344, -0.092437744140625, -0.08706092834472656, -0.08168411254882812, -0.07630729675292969, -0.07093048095703125, -0.06555366516113281, -0.060176849365234375, -0.05480003356933594, -0.0494232177734375, -0.04404640197753906, -0.038669586181640625, -0.03329277038574219, -0.02791595458984375, -0.022539138793945312, -0.017162322998046875, -0.011785507202148438, -0.00640869140625, -0.0010318756103515625, 0.004344940185546875, 0.009721755981445312, 0.01509857177734375, 0.020475387573242188, 0.025852203369140625, 0.031229019165039062, 0.0366058349609375, 0.04198265075683594, 0.047359466552734375, 0.05273628234863281, 0.05811309814453125, 0.06348991394042969, 0.06886672973632812, 0.07424354553222656, 0.079620361328125, 0.08499717712402344, 0.09037399291992188, 0.09575080871582031, 0.10112762451171875, 0.10650444030761719, 0.11188125610351562, 0.11725807189941406, 0.1226348876953125, 0.12801170349121094, 0.13338851928710938, 0.1387653350830078, 0.14414215087890625, 0.1495189666748047, 0.15489578247070312, 0.16027259826660156, 0.1656494140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 7.0, 13.0, 22.0, 24.0, 30.0, 45.0, 88.0, 125.0, 157.0, 141.0, 111.0, 74.0, 58.0, 26.0, 26.0, 15.0, 12.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.934573709964752e-05, -5.66430389881134e-05, -5.3940340876579285e-05, -5.1237642765045166e-05, -4.853494465351105e-05, -4.583224654197693e-05, -4.312954843044281e-05, -4.042685031890869e-05, -3.772415220737457e-05, -3.5021454095840454e-05, -3.2318755984306335e-05, -2.9616057872772217e-05, -2.6913359761238098e-05, -2.421066164970398e-05, -2.150796353816986e-05, -1.8805265426635742e-05, -1.6102567315101624e-05, -1.3399869203567505e-05, -1.0697171092033386e-05, -7.994472980499268e-06, -5.291774868965149e-06, -2.5890767574310303e-06, 1.1362135410308838e-07, 2.816319465637207e-06, 5.519017577171326e-06, 8.221715688705444e-06, 1.0924413800239563e-05, 1.3627111911773682e-05, 1.63298100233078e-05, 1.903250813484192e-05, 2.1735206246376038e-05, 2.4437904357910156e-05, 2.7140602469444275e-05, 2.9843300580978394e-05, 3.254599869251251e-05, 3.524869680404663e-05, 3.795139491558075e-05, 4.065409302711487e-05, 4.335679113864899e-05, 4.6059489250183105e-05, 4.8762187361717224e-05, 5.146488547325134e-05, 5.416758358478546e-05, 5.687028169631958e-05, 5.95729798078537e-05, 6.227567791938782e-05, 6.497837603092194e-05, 6.768107414245605e-05, 7.038377225399017e-05, 7.308647036552429e-05, 7.578916847705841e-05, 7.849186658859253e-05, 8.119456470012665e-05, 8.389726281166077e-05, 8.659996092319489e-05, 8.9302659034729e-05, 9.200535714626312e-05, 9.470805525779724e-05, 9.741075336933136e-05, 0.00010011345148086548, 0.0001028161495923996, 0.00010551884770393372, 0.00010822154581546783, 0.00011092424392700195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 9.0, 11.0, 29.0, 37.0, 47.0, 93.0, 168.0, 369.0, 817.0, 1988.0, 7156.0, 50365.0, 723657.0, 235686.0, 21466.0, 4035.0, 1367.0, 615.0, 268.0, 164.0, 77.0, 44.0, 36.0, 13.0, 12.0, 2.0, 10.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15541648864746094, -0.14860153198242188, -0.1417865753173828, -0.13497161865234375, -0.1281566619873047, -0.12134170532226562, -0.11452674865722656, -0.1077117919921875, -0.10089683532714844, -0.09408187866210938, -0.08726692199707031, -0.08045196533203125, -0.07363700866699219, -0.06682205200195312, -0.06000709533691406, -0.053192138671875, -0.04637718200683594, -0.039562225341796875, -0.03274726867675781, -0.02593231201171875, -0.019117355346679688, -0.012302398681640625, -0.0054874420166015625, 0.0013275146484375, 0.008142471313476562, 0.014957427978515625, 0.021772384643554688, 0.02858734130859375, 0.03540229797363281, 0.042217254638671875, 0.04903221130371094, 0.05584716796875, 0.06266212463378906, 0.06947708129882812, 0.07629203796386719, 0.08310699462890625, 0.08992195129394531, 0.09673690795898438, 0.10355186462402344, 0.1103668212890625, 0.11718177795410156, 0.12399673461914062, 0.1308116912841797, 0.13762664794921875, 0.1444416046142578, 0.15125656127929688, 0.15807151794433594, 0.164886474609375, 0.17170143127441406, 0.17851638793945312, 0.1853313446044922, 0.19214630126953125, 0.1989612579345703, 0.20577621459960938, 0.21259117126464844, 0.2194061279296875, 0.22622108459472656, 0.23303604125976562, 0.2398509979248047, 0.24666595458984375, 0.2534809112548828, 0.2602958679199219, 0.26711082458496094, 0.27392578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 16.0, 8.0, 16.0, 18.0, 36.0, 43.0, 44.0, 47.0, 77.0, 85.0, 101.0, 101.0, 76.0, 70.0, 48.0, 41.0, 38.0, 28.0, 20.0, 21.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15641403198242188, -0.15181732177734375, -0.14722061157226562, -0.1426239013671875, -0.13802719116210938, -0.13343048095703125, -0.12883377075195312, -0.124237060546875, -0.11964035034179688, -0.11504364013671875, -0.11044692993164062, -0.1058502197265625, -0.10125350952148438, -0.09665679931640625, -0.09206008911132812, -0.08746337890625, -0.08286666870117188, -0.07826995849609375, -0.07367324829101562, -0.0690765380859375, -0.06447982788085938, -0.05988311767578125, -0.055286407470703125, -0.050689697265625, -0.046092987060546875, -0.04149627685546875, -0.036899566650390625, -0.0323028564453125, -0.027706146240234375, -0.02310943603515625, -0.018512725830078125, -0.013916015625, -0.009319305419921875, -0.00472259521484375, -0.000125885009765625, 0.0044708251953125, 0.009067535400390625, 0.01366424560546875, 0.018260955810546875, 0.022857666015625, 0.027454376220703125, 0.03205108642578125, 0.036647796630859375, 0.0412445068359375, 0.045841217041015625, 0.05043792724609375, 0.055034637451171875, 0.05963134765625, 0.06422805786132812, 0.06882476806640625, 0.07342147827148438, 0.0780181884765625, 0.08261489868164062, 0.08721160888671875, 0.09180831909179688, 0.096405029296875, 0.10100173950195312, 0.10559844970703125, 0.11019515991210938, 0.1147918701171875, 0.11938858032226562, 0.12398529052734375, 0.12858200073242188, 0.1331787109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 15.0, 38.0, 45.0, 63.0, 96.0, 157.0, 211.0, 123.0, 81.0, 58.0, 34.0, 17.0, 8.0, 11.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716684103012085, -2.6395390033721924, -2.5623936653137207, -2.485248565673828, -2.4081032276153564, -2.330958127975464, -2.253812789916992, -2.1766676902770996, -2.099522590637207, -2.0223774909973145, -1.9452321529388428, -1.8680869340896606, -1.7909417152404785, -1.713796615600586, -1.6366513967514038, -1.5595061779022217, -1.48236083984375, -1.4052156209945679, -1.3280704021453857, -1.2509251832962036, -1.1737799644470215, -1.096634864807129, -1.0194896459579468, -0.9423444271087646, -0.8651992082595825, -0.7880539894104004, -0.7109087705612183, -0.6337636113166809, -0.5566183924674988, -0.47947317361831665, -0.4023279845714569, -0.32518279552459717, -0.24803781509399414, -0.1708926111459732, -0.09374740719795227, -0.016602203249931335, 0.0605430006980896, 0.13768821954727173, 0.21483340859413147, 0.2919785976409912, 0.36912381649017334, 0.44626903533935547, 0.5234142541885376, 0.600559413433075, 0.6777046322822571, 0.7548498511314392, 0.8319950103759766, 0.9091402292251587, 0.9862854480743408, 1.063430666923523, 1.140575885772705, 1.2177211046218872, 1.2948663234710693, 1.372011423110962, 1.449156641960144, 1.5263018608093262, 1.6034470796585083, 1.6805922985076904, 1.7577375173568726, 1.8348827362060547, 1.9120278358459473, 1.989173173904419, 2.0663182735443115, 2.143463611602783, 2.220608711242676]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 8.0, 11.0, 17.0, 13.0, 2.0, 15.0, 13.0, 26.0, 17.0, 26.0, 32.0, 29.0, 32.0, 35.0, 36.0, 42.0, 54.0, 72.0, 53.0, 51.0, 44.0, 40.0, 37.0, 32.0, 21.0, 21.0, 28.0, 23.0, 18.0, 20.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2956559658050537, -1.248177170753479, -1.2006983757019043, -1.1532195806503296, -1.1057407855987549, -1.0582619905471802, -1.0107831954956055, -0.963304340839386, -0.9158255457878113, -0.8683467507362366, -0.8208679556846619, -0.7733891010284424, -0.7259103059768677, -0.678431510925293, -0.6309527158737183, -0.5834739208221436, -0.5359951257705688, -0.48851633071899414, -0.44103753566741943, -0.39355871081352234, -0.34607991576194763, -0.2986011207103729, -0.25112229585647583, -0.20364350080490112, -0.15616470575332642, -0.10868590325117111, -0.06120710074901581, -0.013728290796279907, 0.0337505042552948, 0.0812292993068695, 0.1287081241607666, 0.1761869192123413, 0.22366571426391602, 0.2711445093154907, 0.31862330436706543, 0.3661021292209625, 0.41358092427253723, 0.46105971932411194, 0.508538544178009, 0.5560173392295837, 0.6034961342811584, 0.6509749293327332, 0.6984537243843079, 0.7459325790405273, 0.793411374092102, 0.8408901691436768, 0.8883689641952515, 0.9358477592468262, 0.9833265542984009, 1.0308053493499756, 1.0782841444015503, 1.125762939453125, 1.1732417345046997, 1.2207205295562744, 1.2681994438171387, 1.3156781196594238, 1.363157033920288, 1.4106358289718628, 1.4581146240234375, 1.5055934190750122, 1.553072214126587, 1.6005510091781616, 1.6480298042297363, 1.6955087184906006, 1.7429873943328857]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 26.0, 33.0, 51.0, 81.0, 167.0, 298.0, 516.0, 1131.0, 2391.0, 5129.0, 11971.0, 32381.0, 113191.0, 602930.0, 2389046.0, 826910.0, 142349.0, 39660.0, 14466.0, 6090.0, 2794.0, 1267.0, 645.0, 324.0, 194.0, 93.0, 59.0, 29.0, 20.0, 14.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115478515625, -0.11113548278808594, -0.10679244995117188, -0.10244941711425781, -0.09810638427734375, -0.09376335144042969, -0.08942031860351562, -0.08507728576660156, -0.0807342529296875, -0.07639122009277344, -0.07204818725585938, -0.06770515441894531, -0.06336212158203125, -0.05901908874511719, -0.054676055908203125, -0.05033302307128906, -0.045989990234375, -0.04164695739746094, -0.037303924560546875, -0.03296089172363281, -0.02861785888671875, -0.024274826049804688, -0.019931793212890625, -0.015588760375976562, -0.0112457275390625, -0.0069026947021484375, -0.002559661865234375, 0.0017833709716796875, 0.00612640380859375, 0.010469436645507812, 0.014812469482421875, 0.019155502319335938, 0.02349853515625, 0.027841567993164062, 0.032184600830078125, 0.03652763366699219, 0.04087066650390625, 0.04521369934082031, 0.049556732177734375, 0.05389976501464844, 0.0582427978515625, 0.06258583068847656, 0.06692886352539062, 0.07127189636230469, 0.07561492919921875, 0.07995796203613281, 0.08430099487304688, 0.08864402770996094, 0.092987060546875, 0.09733009338378906, 0.10167312622070312, 0.10601615905761719, 0.11035919189453125, 0.11470222473144531, 0.11904525756835938, 0.12338829040527344, 0.1277313232421875, 0.13207435607910156, 0.13641738891601562, 0.1407604217529297, 0.14510345458984375, 0.1494464874267578, 0.15378952026367188, 0.15813255310058594, 0.1624755859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 8.0, 12.0, 10.0, 12.0, 25.0, 25.0, 22.0, 18.0, 36.0, 18.0, 23.0, 43.0, 37.0, 41.0, 51.0, 44.0, 33.0, 47.0, 32.0, 49.0, 43.0, 37.0, 43.0, 30.0, 37.0, 31.0, 31.0, 24.0, 26.0, 15.0, 16.0, 10.0, 15.0, 10.0, 12.0, 5.0, 4.0, 12.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09185791015625, -0.08912944793701172, -0.08640098571777344, -0.08367252349853516, -0.08094406127929688, -0.0782155990600586, -0.07548713684082031, -0.07275867462158203, -0.07003021240234375, -0.06730175018310547, -0.06457328796386719, -0.061844825744628906, -0.059116363525390625, -0.056387901306152344, -0.05365943908691406, -0.05093097686767578, -0.0482025146484375, -0.04547405242919922, -0.04274559020996094, -0.040017127990722656, -0.037288665771484375, -0.034560203552246094, -0.03183174133300781, -0.02910327911376953, -0.02637481689453125, -0.02364635467529297, -0.020917892456054688, -0.018189430236816406, -0.015460968017578125, -0.012732505798339844, -0.010004043579101562, -0.007275581359863281, -0.004547119140625, -0.0018186569213867188, 0.0009098052978515625, 0.0036382675170898438, 0.006366729736328125, 0.009095191955566406, 0.011823654174804688, 0.014552116394042969, 0.01728057861328125, 0.02000904083251953, 0.022737503051757812, 0.025465965270996094, 0.028194427490234375, 0.030922889709472656, 0.03365135192871094, 0.03637981414794922, 0.0391082763671875, 0.04183673858642578, 0.04456520080566406, 0.047293663024902344, 0.050022125244140625, 0.052750587463378906, 0.05547904968261719, 0.05820751190185547, 0.06093597412109375, 0.06366443634033203, 0.06639289855957031, 0.0691213607788086, 0.07184982299804688, 0.07457828521728516, 0.07730674743652344, 0.08003520965576172, 0.082763671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 15.0, 18.0, 30.0, 25.0, 48.0, 76.0, 146.0, 289.0, 649.0, 1697.0, 6374.0, 29110.0, 235719.0, 3274532.0, 581802.0, 50274.0, 9452.0, 2420.0, 780.0, 323.0, 169.0, 107.0, 67.0, 39.0, 26.0, 13.0, 25.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3093910217285156, -0.29895782470703125, -0.2885246276855469, -0.2780914306640625, -0.2676582336425781, -0.25722503662109375, -0.24679183959960938, -0.236358642578125, -0.22592544555664062, -0.21549224853515625, -0.20505905151367188, -0.1946258544921875, -0.18419265747070312, -0.17375946044921875, -0.16332626342773438, -0.15289306640625, -0.14245986938476562, -0.13202667236328125, -0.12159347534179688, -0.1111602783203125, -0.10072708129882812, -0.09029388427734375, -0.07986068725585938, -0.069427490234375, -0.058994293212890625, -0.04856109619140625, -0.038127899169921875, -0.0276947021484375, -0.017261505126953125, -0.00682830810546875, 0.003604888916015625, 0.0140380859375, 0.024471282958984375, 0.03490447998046875, 0.045337677001953125, 0.0557708740234375, 0.06620407104492188, 0.07663726806640625, 0.08707046508789062, 0.097503662109375, 0.10793685913085938, 0.11837005615234375, 0.12880325317382812, 0.1392364501953125, 0.14966964721679688, 0.16010284423828125, 0.17053604125976562, 0.18096923828125, 0.19140243530273438, 0.20183563232421875, 0.21226882934570312, 0.2227020263671875, 0.23313522338867188, 0.24356842041015625, 0.2540016174316406, 0.264434814453125, 0.2748680114746094, 0.28530120849609375, 0.2957344055175781, 0.3061676025390625, 0.3166007995605469, 0.32703399658203125, 0.3374671936035156, 0.347900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 4.0, 6.0, 10.0, 10.0, 9.0, 12.0, 16.0, 17.0, 30.0, 39.0, 48.0, 64.0, 94.0, 108.0, 138.0, 209.0, 265.0, 387.0, 471.0, 447.0, 426.0, 318.0, 233.0, 173.0, 130.0, 95.0, 59.0, 49.0, 35.0, 31.0, 32.0, 19.0, 10.0, 14.0, 13.0, 16.0, 2.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.208740234375, -0.20246315002441406, -0.19618606567382812, -0.1899089813232422, -0.18363189697265625, -0.1773548126220703, -0.17107772827148438, -0.16480064392089844, -0.1585235595703125, -0.15224647521972656, -0.14596939086914062, -0.1396923065185547, -0.13341522216796875, -0.1271381378173828, -0.12086105346679688, -0.11458396911621094, -0.108306884765625, -0.10202980041503906, -0.09575271606445312, -0.08947563171386719, -0.08319854736328125, -0.07692146301269531, -0.07064437866210938, -0.06436729431152344, -0.0580902099609375, -0.05181312561035156, -0.045536041259765625, -0.03925895690917969, -0.03298187255859375, -0.026704788208007812, -0.020427703857421875, -0.014150619506835938, -0.00787353515625, -0.0015964508056640625, 0.004680633544921875, 0.010957717895507812, 0.01723480224609375, 0.023511886596679688, 0.029788970947265625, 0.03606605529785156, 0.0423431396484375, 0.04862022399902344, 0.054897308349609375, 0.06117439270019531, 0.06745147705078125, 0.07372856140136719, 0.08000564575195312, 0.08628273010253906, 0.092559814453125, 0.09883689880371094, 0.10511398315429688, 0.11139106750488281, 0.11766815185546875, 0.12394523620605469, 0.13022232055664062, 0.13649940490722656, 0.1427764892578125, 0.14905357360839844, 0.15533065795898438, 0.1616077423095703, 0.16788482666015625, 0.1741619110107422, 0.18043899536132812, 0.18671607971191406, 0.1929931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 21.0, 50.0, 128.0, 189.0, 222.0, 190.0, 98.0, 33.0, 30.0, 10.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.001578330993652, -3.8913233280181885, -3.7810683250427246, -3.67081356048584, -3.560558557510376, -3.450303554534912, -3.3400485515594482, -3.2297935485839844, -3.1195385456085205, -3.0092835426330566, -2.8990285396575928, -2.788773536682129, -2.678518772125244, -2.5682637691497803, -2.4580087661743164, -2.3477537631988525, -2.2374987602233887, -2.127243757247925, -2.016988754272461, -1.9067338705062866, -1.7964788675308228, -1.6862239837646484, -1.5759689807891846, -1.4657139778137207, -1.355459213256836, -1.245204210281372, -1.1349493265151978, -1.0246943235397339, -0.91443932056427, -0.8041843771934509, -0.6939294338226318, -0.583674430847168, -0.4734194278717041, -0.3631644546985626, -0.25290948152542114, -0.14265453815460205, -0.03239956498146057, 0.07785540819168091, 0.1881103515625, 0.29836535453796387, 0.40862029790878296, 0.518875241279602, 0.6291302442550659, 0.739385187625885, 0.8496401309967041, 0.959895133972168, 1.0701501369476318, 1.1804051399230957, 1.29066002368927, 1.4009150266647339, 1.5111699104309082, 1.621424913406372, 1.731679916381836, 1.8419349193572998, 1.9521898031234741, 2.0624446868896484, 2.1726996898651123, 2.282954692840576, 2.39320969581604, 2.503464698791504, 2.6137194633483887, 2.7239744663238525, 2.8342294692993164, 2.9444844722747803, 3.054739475250244]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 3.0, 6.0, 21.0, 9.0, 13.0, 15.0, 10.0, 15.0, 27.0, 17.0, 27.0, 17.0, 30.0, 26.0, 24.0, 32.0, 40.0, 49.0, 50.0, 41.0, 48.0, 34.0, 28.0, 25.0, 43.0, 27.0, 36.0, 30.0, 27.0, 19.0, 20.0, 27.0, 25.0, 19.0, 19.0, 19.0, 12.0, 4.0, 8.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.9727334380149841, -0.9419143795967102, -0.911095380783081, -0.8802763223648071, -0.8494572639465332, -0.8186382055282593, -0.7878191471099854, -0.7570001482963562, -0.7261810898780823, -0.6953620314598083, -0.6645430326461792, -0.6337239742279053, -0.6029049158096313, -0.5720858573913574, -0.5412667989730835, -0.5104478001594543, -0.4796287417411804, -0.4488096833229065, -0.41799065470695496, -0.3871716260910034, -0.3563525676727295, -0.32553350925445557, -0.29471448063850403, -0.2638954520225525, -0.23307639360427856, -0.20225735008716583, -0.1714383065700531, -0.14061926305294037, -0.10980021953582764, -0.0789811760187149, -0.04816213250160217, -0.01734308898448944, 0.013475894927978516, 0.04429493844509125, 0.07511398196220398, 0.10593302547931671, 0.13675206899642944, 0.16757111251354218, 0.1983901560306549, 0.22920919954776764, 0.26002824306488037, 0.2908473014831543, 0.32166633009910583, 0.3524853587150574, 0.3833044171333313, 0.4141234755516052, 0.44494250416755676, 0.4757615327835083, 0.5065805912017822, 0.5373996496200562, 0.5682187080383301, 0.5990377068519592, 0.6298567652702332, 0.6606758236885071, 0.6914948225021362, 0.7223138809204102, 0.7531329393386841, 0.783951997756958, 0.8147710561752319, 0.8455900549888611, 0.876409113407135, 0.9072281718254089, 0.9380471706390381, 0.968866229057312, 0.9996852874755859]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 18.0, 19.0, 28.0, 49.0, 67.0, 80.0, 113.0, 154.0, 240.0, 386.0, 500.0, 780.0, 1275.0, 2041.0, 3319.0, 5835.0, 11634.0, 27507.0, 75728.0, 208970.0, 356553.0, 218206.0, 78832.0, 28612.0, 12245.0, 5960.0, 3436.0, 1982.0, 1324.0, 846.0, 562.0, 376.0, 284.0, 188.0, 112.0, 69.0, 56.0, 38.0, 37.0, 33.0, 10.0, 9.0, 2.0, 7.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.1357421875, -0.13169288635253906, -0.12764358520507812, -0.12359428405761719, -0.11954498291015625, -0.11549568176269531, -0.11144638061523438, -0.10739707946777344, -0.1033477783203125, -0.09929847717285156, -0.09524917602539062, -0.09119987487792969, -0.08715057373046875, -0.08310127258300781, -0.07905197143554688, -0.07500267028808594, -0.070953369140625, -0.06690406799316406, -0.06285476684570312, -0.05880546569824219, -0.05475616455078125, -0.05070686340332031, -0.046657562255859375, -0.04260826110839844, -0.0385589599609375, -0.03450965881347656, -0.030460357666015625, -0.026411056518554688, -0.02236175537109375, -0.018312454223632812, -0.014263153076171875, -0.010213851928710938, -0.00616455078125, -0.0021152496337890625, 0.001934051513671875, 0.0059833526611328125, 0.01003265380859375, 0.014081954956054688, 0.018131256103515625, 0.022180557250976562, 0.0262298583984375, 0.030279159545898438, 0.034328460693359375, 0.03837776184082031, 0.04242706298828125, 0.04647636413574219, 0.050525665283203125, 0.05457496643066406, 0.058624267578125, 0.06267356872558594, 0.06672286987304688, 0.07077217102050781, 0.07482147216796875, 0.07887077331542969, 0.08292007446289062, 0.08696937561035156, 0.0910186767578125, 0.09506797790527344, 0.09911727905273438, 0.10316658020019531, 0.10721588134765625, 0.11126518249511719, 0.11531448364257812, 0.11936378479003906, 0.1234130859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 3.0, 8.0, 7.0, 8.0, 12.0, 26.0, 20.0, 30.0, 29.0, 29.0, 35.0, 50.0, 46.0, 52.0, 49.0, 61.0, 43.0, 44.0, 42.0, 58.0, 42.0, 36.0, 37.0, 35.0, 34.0, 30.0, 20.0, 15.0, 24.0, 13.0, 14.0, 9.0, 10.0, 9.0, 2.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11265277862548828, -0.10921669006347656, -0.10578060150146484, -0.10234451293945312, -0.0989084243774414, -0.09547233581542969, -0.09203624725341797, -0.08860015869140625, -0.08516407012939453, -0.08172798156738281, -0.0782918930053711, -0.07485580444335938, -0.07141971588134766, -0.06798362731933594, -0.06454753875732422, -0.0611114501953125, -0.05767536163330078, -0.05423927307128906, -0.050803184509277344, -0.047367095947265625, -0.043931007385253906, -0.04049491882324219, -0.03705883026123047, -0.03362274169921875, -0.03018665313720703, -0.026750564575195312, -0.023314476013183594, -0.019878387451171875, -0.016442298889160156, -0.013006210327148438, -0.009570121765136719, -0.006134033203125, -0.0026979446411132812, 0.0007381439208984375, 0.004174232482910156, 0.007610321044921875, 0.011046409606933594, 0.014482498168945312, 0.01791858673095703, 0.02135467529296875, 0.02479076385498047, 0.028226852416992188, 0.031662940979003906, 0.035099029541015625, 0.038535118103027344, 0.04197120666503906, 0.04540729522705078, 0.0488433837890625, 0.05227947235107422, 0.05571556091308594, 0.059151649475097656, 0.06258773803710938, 0.0660238265991211, 0.06945991516113281, 0.07289600372314453, 0.07633209228515625, 0.07976818084716797, 0.08320426940917969, 0.0866403579711914, 0.09007644653320312, 0.09351253509521484, 0.09694862365722656, 0.10038471221923828, 0.10382080078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 10.0, 12.0, 9.0, 15.0, 27.0, 33.0, 53.0, 84.0, 132.0, 264.0, 495.0, 1064.0, 2671.0, 8138.0, 47748.0, 664711.0, 287364.0, 26294.0, 5546.0, 2041.0, 835.0, 380.0, 217.0, 124.0, 74.0, 58.0, 38.0, 24.0, 16.0, 13.0, 13.0, 8.0, 10.0, 5.0, 6.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.336669921875, -0.32642364501953125, -0.3161773681640625, -0.30593109130859375, -0.295684814453125, -0.28543853759765625, -0.2751922607421875, -0.26494598388671875, -0.25469970703125, -0.24445343017578125, -0.2342071533203125, -0.22396087646484375, -0.213714599609375, -0.20346832275390625, -0.1932220458984375, -0.18297576904296875, -0.1727294921875, -0.16248321533203125, -0.1522369384765625, -0.14199066162109375, -0.131744384765625, -0.12149810791015625, -0.1112518310546875, -0.10100555419921875, -0.09075927734375, -0.08051300048828125, -0.0702667236328125, -0.06002044677734375, -0.049774169921875, -0.03952789306640625, -0.0292816162109375, -0.01903533935546875, -0.0087890625, 0.00145721435546875, 0.0117034912109375, 0.02194976806640625, 0.032196044921875, 0.04244232177734375, 0.0526885986328125, 0.06293487548828125, 0.07318115234375, 0.08342742919921875, 0.0936737060546875, 0.10391998291015625, 0.114166259765625, 0.12441253662109375, 0.1346588134765625, 0.14490509033203125, 0.1551513671875, 0.16539764404296875, 0.1756439208984375, 0.18589019775390625, 0.196136474609375, 0.20638275146484375, 0.2166290283203125, 0.22687530517578125, 0.23712158203125, 0.24736785888671875, 0.2576141357421875, 0.26786041259765625, 0.278106689453125, 0.28835296630859375, 0.2985992431640625, 0.30884552001953125, 0.319091796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 14.0, 13.0, 22.0, 13.0, 19.0, 27.0, 34.0, 32.0, 45.0, 60.0, 47.0, 61.0, 86.0, 59.0, 62.0, 59.0, 69.0, 42.0, 35.0, 38.0, 35.0, 23.0, 16.0, 9.0, 9.0, 12.0, 4.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49811553955078125, -0.4820709228515625, -0.46602630615234375, -0.449981689453125, -0.43393707275390625, -0.4178924560546875, -0.40184783935546875, -0.38580322265625, -0.36975860595703125, -0.3537139892578125, -0.33766937255859375, -0.321624755859375, -0.30558013916015625, -0.2895355224609375, -0.27349090576171875, -0.2574462890625, -0.24140167236328125, -0.2253570556640625, -0.20931243896484375, -0.193267822265625, -0.17722320556640625, -0.1611785888671875, -0.14513397216796875, -0.12908935546875, -0.11304473876953125, -0.0970001220703125, -0.08095550537109375, -0.064910888671875, -0.04886627197265625, -0.0328216552734375, -0.01677703857421875, -0.000732421875, 0.01531219482421875, 0.0313568115234375, 0.04740142822265625, 0.063446044921875, 0.07949066162109375, 0.0955352783203125, 0.11157989501953125, 0.12762451171875, 0.14366912841796875, 0.1597137451171875, 0.17575836181640625, 0.191802978515625, 0.20784759521484375, 0.2238922119140625, 0.23993682861328125, 0.2559814453125, 0.27202606201171875, 0.2880706787109375, 0.30411529541015625, 0.320159912109375, 0.33620452880859375, 0.3522491455078125, 0.36829376220703125, 0.38433837890625, 0.40038299560546875, 0.4164276123046875, 0.43247222900390625, 0.448516845703125, 0.46456146240234375, 0.4806060791015625, 0.49665069580078125, 0.5126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 12.0, 14.0, 26.0, 35.0, 60.0, 127.0, 252.0, 554.0, 1418.0, 4677.0, 20803.0, 142456.0, 745483.0, 109505.0, 16982.0, 3862.0, 1275.0, 526.0, 214.0, 101.0, 69.0, 39.0, 25.0, 12.0, 8.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.124267578125, -0.11918258666992188, -0.11409759521484375, -0.10901260375976562, -0.1039276123046875, -0.09884262084960938, -0.09375762939453125, -0.08867263793945312, -0.083587646484375, -0.07850265502929688, -0.07341766357421875, -0.06833267211914062, -0.0632476806640625, -0.058162689208984375, -0.05307769775390625, -0.047992706298828125, -0.04290771484375, -0.037822723388671875, -0.03273773193359375, -0.027652740478515625, -0.0225677490234375, -0.017482757568359375, -0.01239776611328125, -0.007312774658203125, -0.002227783203125, 0.002857208251953125, 0.00794219970703125, 0.013027191162109375, 0.0181121826171875, 0.023197174072265625, 0.02828216552734375, 0.033367156982421875, 0.0384521484375, 0.043537139892578125, 0.04862213134765625, 0.053707122802734375, 0.0587921142578125, 0.06387710571289062, 0.06896209716796875, 0.07404708862304688, 0.079132080078125, 0.08421707153320312, 0.08930206298828125, 0.09438705444335938, 0.0994720458984375, 0.10455703735351562, 0.10964202880859375, 0.11472702026367188, 0.11981201171875, 0.12489700317382812, 0.12998199462890625, 0.13506698608398438, 0.1401519775390625, 0.14523696899414062, 0.15032196044921875, 0.15540695190429688, 0.160491943359375, 0.16557693481445312, 0.17066192626953125, 0.17574691772460938, 0.1808319091796875, 0.18591690063476562, 0.19100189208984375, 0.19608688354492188, 0.201171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 11.0, 18.0, 18.0, 35.0, 32.0, 28.0, 71.0, 74.0, 82.0, 101.0, 85.0, 98.0, 77.0, 70.0, 36.0, 28.0, 32.0, 29.0, 24.0, 7.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.607439041137695e-05, -4.481431096792221e-05, -4.355423152446747e-05, -4.2294152081012726e-05, -4.1034072637557983e-05, -3.977399319410324e-05, -3.85139137506485e-05, -3.7253834307193756e-05, -3.5993754863739014e-05, -3.473367542028427e-05, -3.347359597682953e-05, -3.2213516533374786e-05, -3.0953437089920044e-05, -2.96933576464653e-05, -2.843327820301056e-05, -2.7173198759555817e-05, -2.5913119316101074e-05, -2.4653039872646332e-05, -2.339296042919159e-05, -2.2132880985736847e-05, -2.0872801542282104e-05, -1.9612722098827362e-05, -1.835264265537262e-05, -1.7092563211917877e-05, -1.5832483768463135e-05, -1.4572404325008392e-05, -1.331232488155365e-05, -1.2052245438098907e-05, -1.0792165994644165e-05, -9.532086551189423e-06, -8.27200710773468e-06, -7.011927664279938e-06, -5.751848220825195e-06, -4.491768777370453e-06, -3.2316893339157104e-06, -1.971609890460968e-06, -7.115304470062256e-07, 5.485489964485168e-07, 1.8086284399032593e-06, 3.0687078833580017e-06, 4.328787326812744e-06, 5.5888667702674866e-06, 6.848946213722229e-06, 8.109025657176971e-06, 9.369105100631714e-06, 1.0629184544086456e-05, 1.1889263987541199e-05, 1.3149343430995941e-05, 1.4409422874450684e-05, 1.5669502317905426e-05, 1.692958176136017e-05, 1.818966120481491e-05, 1.9449740648269653e-05, 2.0709820091724396e-05, 2.1969899535179138e-05, 2.322997897863388e-05, 2.4490058422088623e-05, 2.5750137865543365e-05, 2.7010217308998108e-05, 2.827029675245285e-05, 2.9530376195907593e-05, 3.0790455639362335e-05, 3.205053508281708e-05, 3.331061452627182e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 12.0, 13.0, 21.0, 24.0, 51.0, 56.0, 87.0, 170.0, 355.0, 649.0, 1452.0, 3589.0, 11813.0, 49752.0, 288272.0, 590288.0, 77347.0, 16300.0, 4789.0, 1754.0, 819.0, 389.0, 195.0, 117.0, 82.0, 41.0, 29.0, 20.0, 15.0, 16.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.160400390625, -0.15619373321533203, -0.15198707580566406, -0.1477804183959961, -0.14357376098632812, -0.13936710357666016, -0.1351604461669922, -0.13095378875732422, -0.12674713134765625, -0.12254047393798828, -0.11833381652832031, -0.11412715911865234, -0.10992050170898438, -0.1057138442993164, -0.10150718688964844, -0.09730052947998047, -0.0930938720703125, -0.08888721466064453, -0.08468055725097656, -0.0804738998413086, -0.07626724243164062, -0.07206058502197266, -0.06785392761230469, -0.06364727020263672, -0.05944061279296875, -0.05523395538330078, -0.05102729797363281, -0.046820640563964844, -0.042613983154296875, -0.038407325744628906, -0.03420066833496094, -0.02999401092529297, -0.025787353515625, -0.02158069610595703, -0.017374038696289062, -0.013167381286621094, -0.008960723876953125, -0.004754066467285156, -0.0005474090576171875, 0.0036592483520507812, 0.00786590576171875, 0.012072563171386719, 0.016279220581054688, 0.020485877990722656, 0.024692535400390625, 0.028899192810058594, 0.03310585021972656, 0.03731250762939453, 0.0415191650390625, 0.04572582244873047, 0.04993247985839844, 0.054139137268066406, 0.058345794677734375, 0.06255245208740234, 0.06675910949707031, 0.07096576690673828, 0.07517242431640625, 0.07937908172607422, 0.08358573913574219, 0.08779239654541016, 0.09199905395507812, 0.0962057113647461, 0.10041236877441406, 0.10461902618408203, 0.10882568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 16.0, 26.0, 39.0, 52.0, 65.0, 71.0, 95.0, 104.0, 90.0, 91.0, 67.0, 54.0, 58.0, 38.0, 23.0, 13.0, 19.0, 7.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14571762084960938, -0.14165496826171875, -0.13759231567382812, -0.1335296630859375, -0.12946701049804688, -0.12540435791015625, -0.12134170532226562, -0.117279052734375, -0.11321640014648438, -0.10915374755859375, -0.10509109497070312, -0.1010284423828125, -0.09696578979492188, -0.09290313720703125, -0.08884048461914062, -0.08477783203125, -0.08071517944335938, -0.07665252685546875, -0.07258987426757812, -0.0685272216796875, -0.06446456909179688, -0.06040191650390625, -0.056339263916015625, -0.052276611328125, -0.048213958740234375, -0.04415130615234375, -0.040088653564453125, -0.0360260009765625, -0.031963348388671875, -0.02790069580078125, -0.023838043212890625, -0.019775390625, -0.015712738037109375, -0.01165008544921875, -0.007587432861328125, -0.0035247802734375, 0.000537872314453125, 0.00460052490234375, 0.008663177490234375, 0.012725830078125, 0.016788482666015625, 0.02085113525390625, 0.024913787841796875, 0.0289764404296875, 0.033039093017578125, 0.03710174560546875, 0.041164398193359375, 0.04522705078125, 0.049289703369140625, 0.05335235595703125, 0.057415008544921875, 0.0614776611328125, 0.06554031372070312, 0.06960296630859375, 0.07366561889648438, 0.077728271484375, 0.08179092407226562, 0.08585357666015625, 0.08991622924804688, 0.0939788818359375, 0.09804153442382812, 0.10210418701171875, 0.10616683959960938, 0.1102294921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 11.0, 14.0, 25.0, 52.0, 95.0, 136.0, 265.0, 177.0, 97.0, 58.0, 32.0, 8.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.548521041870117, -3.4740092754364014, -3.3994977474212646, -3.324985980987549, -3.250474214553833, -3.175962448120117, -3.1014509201049805, -3.0269391536712646, -2.952427387237549, -2.877915620803833, -2.8034040927886963, -2.7288923263549805, -2.6543805599212646, -2.579868793487549, -2.505357265472412, -2.4308454990386963, -2.3563339710235596, -2.2818222045898438, -2.207310676574707, -2.132798910140991, -2.0582871437072754, -1.9837754964828491, -1.9092638492584229, -1.834752082824707, -1.7602404356002808, -1.6857287883758545, -1.6112170219421387, -1.5367053747177124, -1.4621937274932861, -1.3876819610595703, -1.313170313835144, -1.2386586666107178, -1.1641470193862915, -1.0896353721618652, -1.0151236057281494, -0.9406119585037231, -0.8661002516746521, -0.791588544845581, -0.7170768976211548, -0.6425651907920837, -0.5680534839630127, -0.49354177713394165, -0.419030100107193, -0.34451842308044434, -0.2700067162513733, -0.19549500942230225, -0.12098333239555359, -0.04647165536880493, 0.028040051460266113, 0.10255174338817596, 0.17706343531608582, 0.2515751123428345, 0.3260868191719055, 0.40059852600097656, 0.4751102030277252, 0.5496218800544739, 0.6241335868835449, 0.698645293712616, 0.773157000541687, 0.8476686477661133, 0.9221803545951843, 0.9966920614242554, 1.0712037086486816, 1.1457154750823975, 1.2202271223068237]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 17.0, 19.0, 20.0, 17.0, 30.0, 31.0, 56.0, 41.0, 60.0, 93.0, 86.0, 73.0, 82.0, 62.0, 48.0, 31.0, 28.0, 24.0, 25.0, 15.0, 15.0, 14.0, 12.0, 15.0, 9.0, 9.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.151763916015625, -2.0883803367614746, -2.024996757507324, -1.9616132974624634, -1.8982298374176025, -1.8348462581634521, -1.7714626789093018, -1.7080790996551514, -1.6446956396102905, -1.5813120603561401, -1.5179286003112793, -1.454545021057129, -1.3911614418029785, -1.3277779817581177, -1.2643944025039673, -1.2010109424591064, -1.137627363204956, -1.0742437839508057, -1.0108603239059448, -0.9474767446517944, -0.8840932250022888, -0.8207097053527832, -0.7573261260986328, -0.6939426064491272, -0.6305590867996216, -0.567175567150116, -0.5037920475006104, -0.44040846824645996, -0.37702494859695435, -0.31364142894744873, -0.2502578794956207, -0.18687433004379272, -0.12349069118499756, -0.06010715663433075, 0.0032763779163360596, 0.06665991246700287, 0.13004344701766968, 0.1934269666671753, 0.2568105161190033, 0.3201940655708313, 0.3835775852203369, 0.44696110486984253, 0.5103446245193481, 0.5737282037734985, 0.6371117234230042, 0.7004952430725098, 0.7638788223266602, 0.8272623419761658, 0.8906458616256714, 0.954029381275177, 1.0174129009246826, 1.080796480178833, 1.1441800594329834, 1.2075635194778442, 1.2709470987319946, 1.3343305587768555, 1.3977141380310059, 1.4610977172851562, 1.524481177330017, 1.5878647565841675, 1.6512482166290283, 1.7146317958831787, 1.778015375137329, 1.8413989543914795, 1.9047824144363403]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 12.0, 27.0, 23.0, 43.0, 73.0, 113.0, 173.0, 313.0, 478.0, 824.0, 1417.0, 2629.0, 4741.0, 9433.0, 20248.0, 48136.0, 140285.0, 530389.0, 1851855.0, 1155840.0, 281993.0, 83610.0, 31713.0, 14273.0, 6908.0, 3727.0, 2065.0, 1109.0, 668.0, 436.0, 233.0, 185.0, 112.0, 69.0, 33.0, 35.0, 15.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1180419921875, -0.11474227905273438, -0.11144256591796875, -0.10814285278320312, -0.1048431396484375, -0.10154342651367188, -0.09824371337890625, -0.09494400024414062, -0.091644287109375, -0.08834457397460938, -0.08504486083984375, -0.08174514770507812, -0.0784454345703125, -0.07514572143554688, -0.07184600830078125, -0.06854629516601562, -0.06524658203125, -0.061946868896484375, -0.05864715576171875, -0.055347442626953125, -0.0520477294921875, -0.048748016357421875, -0.04544830322265625, -0.042148590087890625, -0.038848876953125, -0.035549163818359375, -0.03224945068359375, -0.028949737548828125, -0.0256500244140625, -0.022350311279296875, -0.01905059814453125, -0.015750885009765625, -0.012451171875, -0.009151458740234375, -0.00585174560546875, -0.002552032470703125, 0.0007476806640625, 0.004047393798828125, 0.00734710693359375, 0.010646820068359375, 0.013946533203125, 0.017246246337890625, 0.02054595947265625, 0.023845672607421875, 0.0271453857421875, 0.030445098876953125, 0.03374481201171875, 0.037044525146484375, 0.04034423828125, 0.043643951416015625, 0.04694366455078125, 0.050243377685546875, 0.0535430908203125, 0.056842803955078125, 0.06014251708984375, 0.06344223022460938, 0.066741943359375, 0.07004165649414062, 0.07334136962890625, 0.07664108276367188, 0.0799407958984375, 0.08324050903320312, 0.08654022216796875, 0.08983993530273438, 0.0931396484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 8.0, 10.0, 10.0, 11.0, 19.0, 13.0, 26.0, 27.0, 35.0, 35.0, 37.0, 48.0, 52.0, 46.0, 52.0, 47.0, 59.0, 45.0, 51.0, 55.0, 39.0, 45.0, 37.0, 33.0, 17.0, 24.0, 26.0, 17.0, 8.0, 18.0, 9.0, 14.0, 6.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10247802734375, -0.09899139404296875, -0.0955047607421875, -0.09201812744140625, -0.088531494140625, -0.08504486083984375, -0.0815582275390625, -0.07807159423828125, -0.0745849609375, -0.07109832763671875, -0.0676116943359375, -0.06412506103515625, -0.060638427734375, -0.05715179443359375, -0.0536651611328125, -0.05017852783203125, -0.04669189453125, -0.04320526123046875, -0.0397186279296875, -0.03623199462890625, -0.032745361328125, -0.02925872802734375, -0.0257720947265625, -0.02228546142578125, -0.018798828125, -0.01531219482421875, -0.0118255615234375, -0.00833892822265625, -0.004852294921875, -0.00136566162109375, 0.0021209716796875, 0.00560760498046875, 0.00909423828125, 0.01258087158203125, 0.0160675048828125, 0.01955413818359375, 0.023040771484375, 0.02652740478515625, 0.0300140380859375, 0.03350067138671875, 0.0369873046875, 0.04047393798828125, 0.0439605712890625, 0.04744720458984375, 0.050933837890625, 0.05442047119140625, 0.0579071044921875, 0.06139373779296875, 0.06488037109375, 0.06836700439453125, 0.0718536376953125, 0.07534027099609375, 0.078826904296875, 0.08231353759765625, 0.0858001708984375, 0.08928680419921875, 0.0927734375, 0.09626007080078125, 0.0997467041015625, 0.10323333740234375, 0.106719970703125, 0.11020660400390625, 0.1136932373046875, 0.11717987060546875, 0.12066650390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 9.0, 15.0, 24.0, 40.0, 77.0, 192.0, 479.0, 2534.0, 30734.0, 3126536.0, 1014953.0, 16496.0, 1540.0, 373.0, 105.0, 67.0, 37.0, 21.0, 16.0, 7.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6374435424804688, -0.6186370849609375, -0.5998306274414062, -0.581024169921875, -0.5622177124023438, -0.5434112548828125, -0.5246047973632812, -0.50579833984375, -0.48699188232421875, -0.4681854248046875, -0.44937896728515625, -0.430572509765625, -0.41176605224609375, -0.3929595947265625, -0.37415313720703125, -0.3553466796875, -0.33654022216796875, -0.3177337646484375, -0.29892730712890625, -0.280120849609375, -0.26131439208984375, -0.2425079345703125, -0.22370147705078125, -0.20489501953125, -0.18608856201171875, -0.1672821044921875, -0.14847564697265625, -0.129669189453125, -0.11086273193359375, -0.0920562744140625, -0.07324981689453125, -0.054443359375, -0.03563690185546875, -0.0168304443359375, 0.00197601318359375, 0.020782470703125, 0.03958892822265625, 0.0583953857421875, 0.07720184326171875, 0.09600830078125, 0.11481475830078125, 0.1336212158203125, 0.15242767333984375, 0.171234130859375, 0.19004058837890625, 0.2088470458984375, 0.22765350341796875, 0.2464599609375, 0.26526641845703125, 0.2840728759765625, 0.30287933349609375, 0.321685791015625, 0.34049224853515625, 0.3592987060546875, 0.37810516357421875, 0.39691162109375, 0.41571807861328125, 0.4345245361328125, 0.45333099365234375, 0.472137451171875, 0.49094390869140625, 0.5097503662109375, 0.5285568237304688, 0.54736328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 4.0, 4.0, 12.0, 11.0, 18.0, 23.0, 26.0, 40.0, 49.0, 92.0, 102.0, 147.0, 195.0, 360.0, 509.0, 575.0, 610.0, 379.0, 272.0, 165.0, 118.0, 92.0, 74.0, 38.0, 27.0, 29.0, 18.0, 17.0, 13.0, 9.0, 9.0, 6.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25914764404296875, -0.2516937255859375, -0.24423980712890625, -0.236785888671875, -0.22933197021484375, -0.2218780517578125, -0.21442413330078125, -0.20697021484375, -0.19951629638671875, -0.1920623779296875, -0.18460845947265625, -0.177154541015625, -0.16970062255859375, -0.1622467041015625, -0.15479278564453125, -0.1473388671875, -0.13988494873046875, -0.1324310302734375, -0.12497711181640625, -0.117523193359375, -0.11006927490234375, -0.1026153564453125, -0.09516143798828125, -0.08770751953125, -0.08025360107421875, -0.0727996826171875, -0.06534576416015625, -0.057891845703125, -0.05043792724609375, -0.0429840087890625, -0.03553009033203125, -0.028076171875, -0.02062225341796875, -0.0131683349609375, -0.00571441650390625, 0.001739501953125, 0.00919342041015625, 0.0166473388671875, 0.02410125732421875, 0.03155517578125, 0.03900909423828125, 0.0464630126953125, 0.05391693115234375, 0.061370849609375, 0.06882476806640625, 0.0762786865234375, 0.08373260498046875, 0.0911865234375, 0.09864044189453125, 0.1060943603515625, 0.11354827880859375, 0.121002197265625, 0.12845611572265625, 0.1359100341796875, 0.14336395263671875, 0.15081787109375, 0.15827178955078125, 0.1657257080078125, 0.17317962646484375, 0.180633544921875, 0.18808746337890625, 0.1955413818359375, 0.20299530029296875, 0.21044921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 12.0, 30.0, 71.0, 178.0, 270.0, 217.0, 127.0, 57.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.443475246429443, -4.325896739959717, -4.20831823348999, -4.090740203857422, -3.9731616973876953, -3.8555831909179688, -3.738004684448242, -3.6204264163970947, -3.5028481483459473, -3.3852696418762207, -3.2676913738250732, -3.1501128673553467, -3.032534599304199, -2.9149560928344727, -2.797377586364746, -2.6797993183135986, -2.562220811843872, -2.4446423053741455, -2.327064037322998, -2.2094855308532715, -2.091907262802124, -1.9743287563323975, -1.8567503690719604, -1.7391719818115234, -1.6215935945510864, -1.5040152072906494, -1.3864368200302124, -1.2688584327697754, -1.1512799263000488, -1.0337016582489014, -0.9161231517791748, -0.7985447645187378, -0.6809661388397217, -0.5633877515792847, -0.44580933451652527, -0.32823091745376587, -0.21065253019332886, -0.09307414293289185, 0.02450430393218994, 0.14208269119262695, 0.25966107845306396, 0.377239465713501, 0.4948178827762604, 0.6123962998390198, 0.7299746870994568, 0.8475530743598938, 0.9651315212249756, 1.0827099084854126, 1.2002882957458496, 1.3178666830062866, 1.4354450702667236, 1.5530235767364502, 1.6706018447875977, 1.7881803512573242, 1.9057587385177612, 2.0233371257781982, 2.1409153938293457, 2.2584939002990723, 2.3760721683502197, 2.4936506748199463, 2.6112289428710938, 2.7288074493408203, 2.846385955810547, 2.9639642238616943, 3.081542730331421]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 7.0, 12.0, 12.0, 15.0, 15.0, 23.0, 27.0, 23.0, 29.0, 31.0, 27.0, 27.0, 36.0, 43.0, 47.0, 38.0, 46.0, 53.0, 42.0, 40.0, 32.0, 43.0, 28.0, 33.0, 25.0, 29.0, 27.0, 23.0, 20.0, 17.0, 20.0, 18.0, 11.0, 12.0, 9.0, 12.0, 2.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9159272909164429, -0.8853943943977356, -0.8548614978790283, -0.824328601360321, -0.7937957048416138, -0.7632628083229065, -0.7327299118041992, -0.7021970152854919, -0.6716641187667847, -0.6411312222480774, -0.6105983257293701, -0.5800654292106628, -0.5495325326919556, -0.5189996361732483, -0.488466739654541, -0.45793384313583374, -0.4274009168148041, -0.3968680202960968, -0.3663351237773895, -0.33580222725868225, -0.305269330739975, -0.2747364044189453, -0.24420352280139923, -0.21367062628269196, -0.18313772976398468, -0.1526048332452774, -0.12207193672657013, -0.09153903275728226, -0.06100613623857498, -0.03047323226928711, 5.9664249420166016e-05, 0.03059256076812744, 0.06112545728683472, 0.09165835380554199, 0.12219125032424927, 0.15272414684295654, 0.18325704336166382, 0.2137899547815323, 0.24432285130023956, 0.27485573291778564, 0.3053886294364929, 0.3359215259552002, 0.36645442247390747, 0.39698731899261475, 0.427520215511322, 0.4580531120300293, 0.4885860085487366, 0.5191189050674438, 0.5496518611907959, 0.5801847577095032, 0.6107176542282104, 0.6412505507469177, 0.671783447265625, 0.7023163437843323, 0.7328492403030396, 0.7633821368217468, 0.7939150333404541, 0.8244479298591614, 0.8549808263778687, 0.8855137228965759, 0.9160466194152832, 0.9465795159339905, 0.9771124124526978, 1.0076453685760498, 1.0381782054901123]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 20.0, 28.0, 35.0, 43.0, 55.0, 124.0, 149.0, 228.0, 378.0, 565.0, 966.0, 1739.0, 3484.0, 7865.0, 21546.0, 79546.0, 345421.0, 431516.0, 109036.0, 27529.0, 9451.0, 3891.0, 2012.0, 1116.0, 676.0, 378.0, 248.0, 159.0, 106.0, 81.0, 49.0, 35.0, 21.0, 19.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20113372802734375, -0.1952362060546875, -0.18933868408203125, -0.183441162109375, -0.17754364013671875, -0.1716461181640625, -0.16574859619140625, -0.15985107421875, -0.15395355224609375, -0.1480560302734375, -0.14215850830078125, -0.136260986328125, -0.13036346435546875, -0.1244659423828125, -0.11856842041015625, -0.1126708984375, -0.10677337646484375, -0.1008758544921875, -0.09497833251953125, -0.089080810546875, -0.08318328857421875, -0.0772857666015625, -0.07138824462890625, -0.06549072265625, -0.05959320068359375, -0.0536956787109375, -0.04779815673828125, -0.041900634765625, -0.03600311279296875, -0.0301055908203125, -0.02420806884765625, -0.018310546875, -0.01241302490234375, -0.0065155029296875, -0.00061798095703125, 0.005279541015625, 0.01117706298828125, 0.0170745849609375, 0.02297210693359375, 0.02886962890625, 0.03476715087890625, 0.0406646728515625, 0.04656219482421875, 0.052459716796875, 0.05835723876953125, 0.0642547607421875, 0.07015228271484375, 0.0760498046875, 0.08194732666015625, 0.0878448486328125, 0.09374237060546875, 0.099639892578125, 0.10553741455078125, 0.1114349365234375, 0.11733245849609375, 0.12322998046875, 0.12912750244140625, 0.1350250244140625, 0.14092254638671875, 0.146820068359375, 0.15271759033203125, 0.1586151123046875, 0.16451263427734375, 0.17041015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 7.0, 18.0, 14.0, 17.0, 12.0, 17.0, 17.0, 18.0, 27.0, 34.0, 38.0, 27.0, 33.0, 35.0, 46.0, 36.0, 47.0, 42.0, 43.0, 34.0, 26.0, 43.0, 38.0, 48.0, 24.0, 29.0, 34.0, 27.0, 19.0, 9.0, 22.0, 13.0, 18.0, 10.0, 7.0, 11.0, 10.0, 4.0, 7.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.09228515625, -0.0894479751586914, -0.08661079406738281, -0.08377361297607422, -0.08093643188476562, -0.07809925079345703, -0.07526206970214844, -0.07242488861083984, -0.06958770751953125, -0.06675052642822266, -0.06391334533691406, -0.06107616424560547, -0.058238983154296875, -0.05540180206298828, -0.05256462097167969, -0.049727439880371094, -0.0468902587890625, -0.044053077697753906, -0.04121589660644531, -0.03837871551513672, -0.035541534423828125, -0.03270435333251953, -0.029867172241210938, -0.027029991149902344, -0.02419281005859375, -0.021355628967285156, -0.018518447875976562, -0.01568126678466797, -0.012844085693359375, -0.010006904602050781, -0.0071697235107421875, -0.004332542419433594, -0.001495361328125, 0.0013418197631835938, 0.0041790008544921875, 0.007016181945800781, 0.009853363037109375, 0.012690544128417969, 0.015527725219726562, 0.018364906311035156, 0.02120208740234375, 0.024039268493652344, 0.026876449584960938, 0.02971363067626953, 0.032550811767578125, 0.03538799285888672, 0.03822517395019531, 0.041062355041503906, 0.0438995361328125, 0.046736717224121094, 0.04957389831542969, 0.05241107940673828, 0.055248260498046875, 0.05808544158935547, 0.06092262268066406, 0.06375980377197266, 0.06659698486328125, 0.06943416595458984, 0.07227134704589844, 0.07510852813720703, 0.07794570922851562, 0.08078289031982422, 0.08362007141113281, 0.0864572525024414, 0.08929443359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 1.0, 6.0, 6.0, 11.0, 13.0, 22.0, 21.0, 27.0, 46.0, 57.0, 87.0, 120.0, 179.0, 343.0, 577.0, 1137.0, 2652.0, 8290.0, 41535.0, 590465.0, 355327.0, 35229.0, 7199.0, 2508.0, 1168.0, 568.0, 343.0, 198.0, 130.0, 87.0, 53.0, 34.0, 34.0, 20.0, 11.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.322998046875, -0.31375885009765625, -0.3045196533203125, -0.29528045654296875, -0.286041259765625, -0.27680206298828125, -0.2675628662109375, -0.25832366943359375, -0.24908447265625, -0.23984527587890625, -0.2306060791015625, -0.22136688232421875, -0.212127685546875, -0.20288848876953125, -0.1936492919921875, -0.18441009521484375, -0.1751708984375, -0.16593170166015625, -0.1566925048828125, -0.14745330810546875, -0.138214111328125, -0.12897491455078125, -0.1197357177734375, -0.11049652099609375, -0.10125732421875, -0.09201812744140625, -0.0827789306640625, -0.07353973388671875, -0.064300537109375, -0.05506134033203125, -0.0458221435546875, -0.03658294677734375, -0.02734375, -0.01810455322265625, -0.0088653564453125, 0.00037384033203125, 0.009613037109375, 0.01885223388671875, 0.0280914306640625, 0.03733062744140625, 0.04656982421875, 0.05580902099609375, 0.0650482177734375, 0.07428741455078125, 0.083526611328125, 0.09276580810546875, 0.1020050048828125, 0.11124420166015625, 0.1204833984375, 0.12972259521484375, 0.1389617919921875, 0.14820098876953125, 0.157440185546875, 0.16667938232421875, 0.1759185791015625, 0.18515777587890625, 0.19439697265625, 0.20363616943359375, 0.2128753662109375, 0.22211456298828125, 0.231353759765625, 0.24059295654296875, 0.2498321533203125, 0.25907135009765625, 0.268310546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 6.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 10.0, 23.0, 18.0, 27.0, 40.0, 37.0, 41.0, 52.0, 60.0, 62.0, 63.0, 63.0, 60.0, 58.0, 51.0, 40.0, 48.0, 42.0, 22.0, 21.0, 30.0, 14.0, 18.0, 15.0, 5.0, 6.0, 4.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5652580261230469, -0.5499496459960938, -0.5346412658691406, -0.5193328857421875, -0.5040245056152344, -0.48871612548828125, -0.4734077453613281, -0.458099365234375, -0.4427909851074219, -0.42748260498046875, -0.4121742248535156, -0.3968658447265625, -0.3815574645996094, -0.36624908447265625, -0.3509407043457031, -0.33563232421875, -0.3203239440917969, -0.30501556396484375, -0.2897071838378906, -0.2743988037109375, -0.2590904235839844, -0.24378204345703125, -0.22847366333007812, -0.213165283203125, -0.19785690307617188, -0.18254852294921875, -0.16724014282226562, -0.1519317626953125, -0.13662338256835938, -0.12131500244140625, -0.10600662231445312, -0.0906982421875, -0.07538986206054688, -0.06008148193359375, -0.044773101806640625, -0.0294647216796875, -0.014156341552734375, 0.00115203857421875, 0.016460418701171875, 0.031768798828125, 0.047077178955078125, 0.06238555908203125, 0.07769393920898438, 0.0930023193359375, 0.10831069946289062, 0.12361907958984375, 0.13892745971679688, 0.15423583984375, 0.16954421997070312, 0.18485260009765625, 0.20016098022460938, 0.2154693603515625, 0.23077774047851562, 0.24608612060546875, 0.2613945007324219, 0.276702880859375, 0.2920112609863281, 0.30731964111328125, 0.3226280212402344, 0.3379364013671875, 0.3532447814941406, 0.36855316162109375, 0.3838615417480469, 0.399169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 2.0, 3.0, 5.0, 14.0, 18.0, 22.0, 48.0, 72.0, 128.0, 227.0, 421.0, 825.0, 1903.0, 4791.0, 13562.0, 52784.0, 558532.0, 345092.0, 49111.0, 12910.0, 4508.0, 1820.0, 778.0, 414.0, 231.0, 134.0, 69.0, 39.0, 36.0, 22.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12782955169677734, -0.12406730651855469, -0.12030506134033203, -0.11654281616210938, -0.11278057098388672, -0.10901832580566406, -0.1052560806274414, -0.10149383544921875, -0.0977315902709961, -0.09396934509277344, -0.09020709991455078, -0.08644485473632812, -0.08268260955810547, -0.07892036437988281, -0.07515811920166016, -0.0713958740234375, -0.06763362884521484, -0.06387138366699219, -0.06010913848876953, -0.056346893310546875, -0.05258464813232422, -0.04882240295410156, -0.045060157775878906, -0.04129791259765625, -0.037535667419433594, -0.03377342224121094, -0.03001117706298828, -0.026248931884765625, -0.02248668670654297, -0.018724441528320312, -0.014962196350097656, -0.011199951171875, -0.007437705993652344, -0.0036754608154296875, 8.678436279296875e-05, 0.003849029541015625, 0.007611274719238281, 0.011373519897460938, 0.015135765075683594, 0.01889801025390625, 0.022660255432128906, 0.026422500610351562, 0.03018474578857422, 0.033946990966796875, 0.03770923614501953, 0.04147148132324219, 0.045233726501464844, 0.0489959716796875, 0.052758216857910156, 0.05652046203613281, 0.06028270721435547, 0.06404495239257812, 0.06780719757080078, 0.07156944274902344, 0.0753316879272461, 0.07909393310546875, 0.0828561782836914, 0.08661842346191406, 0.09038066864013672, 0.09414291381835938, 0.09790515899658203, 0.10166740417480469, 0.10542964935302734, 0.10919189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 1.0, 6.0, 3.0, 10.0, 7.0, 19.0, 21.0, 43.0, 38.0, 38.0, 67.0, 73.0, 113.0, 102.0, 82.0, 84.0, 77.0, 42.0, 40.0, 34.0, 24.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.68952751159668e-05, -3.5715289413928986e-05, -3.4535303711891174e-05, -3.335531800985336e-05, -3.217533230781555e-05, -3.099534660577774e-05, -2.981536090373993e-05, -2.8635375201702118e-05, -2.7455389499664307e-05, -2.6275403797626495e-05, -2.5095418095588684e-05, -2.3915432393550873e-05, -2.273544669151306e-05, -2.155546098947525e-05, -2.037547528743744e-05, -1.9195489585399628e-05, -1.8015503883361816e-05, -1.6835518181324005e-05, -1.5655532479286194e-05, -1.4475546777248383e-05, -1.3295561075210571e-05, -1.211557537317276e-05, -1.0935589671134949e-05, -9.755603969097137e-06, -8.575618267059326e-06, -7.395632565021515e-06, -6.215646862983704e-06, -5.035661160945892e-06, -3.855675458908081e-06, -2.6756897568702698e-06, -1.4957040548324585e-06, -3.157183527946472e-07, 8.642673492431641e-07, 2.0442530512809753e-06, 3.2242387533187866e-06, 4.404224455356598e-06, 5.584210157394409e-06, 6.7641958594322205e-06, 7.944181561470032e-06, 9.124167263507843e-06, 1.0304152965545654e-05, 1.1484138667583466e-05, 1.2664124369621277e-05, 1.3844110071659088e-05, 1.50240957736969e-05, 1.620408147573471e-05, 1.7384067177772522e-05, 1.8564052879810333e-05, 1.9744038581848145e-05, 2.0924024283885956e-05, 2.2104009985923767e-05, 2.328399568796158e-05, 2.446398138999939e-05, 2.56439670920372e-05, 2.6823952794075012e-05, 2.8003938496112823e-05, 2.9183924198150635e-05, 3.0363909900188446e-05, 3.154389560222626e-05, 3.272388130426407e-05, 3.390386700630188e-05, 3.508385270833969e-05, 3.62638384103775e-05, 3.7443824112415314e-05, 3.8623809814453125e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 19.0, 25.0, 39.0, 70.0, 168.0, 354.0, 874.0, 3299.0, 19379.0, 286796.0, 703163.0, 28185.0, 4348.0, 1128.0, 381.0, 140.0, 83.0, 49.0, 18.0, 12.0, 11.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15822601318359375, -0.1516571044921875, -0.14508819580078125, -0.138519287109375, -0.13195037841796875, -0.1253814697265625, -0.11881256103515625, -0.11224365234375, -0.10567474365234375, -0.0991058349609375, -0.09253692626953125, -0.085968017578125, -0.07939910888671875, -0.0728302001953125, -0.06626129150390625, -0.0596923828125, -0.05312347412109375, -0.0465545654296875, -0.03998565673828125, -0.033416748046875, -0.02684783935546875, -0.0202789306640625, -0.01371002197265625, -0.00714111328125, -0.00057220458984375, 0.0059967041015625, 0.01256561279296875, 0.019134521484375, 0.02570343017578125, 0.0322723388671875, 0.03884124755859375, 0.04541015625, 0.05197906494140625, 0.0585479736328125, 0.06511688232421875, 0.071685791015625, 0.07825469970703125, 0.0848236083984375, 0.09139251708984375, 0.09796142578125, 0.10453033447265625, 0.1110992431640625, 0.11766815185546875, 0.124237060546875, 0.13080596923828125, 0.1373748779296875, 0.14394378662109375, 0.1505126953125, 0.15708160400390625, 0.1636505126953125, 0.17021942138671875, 0.176788330078125, 0.18335723876953125, 0.1899261474609375, 0.19649505615234375, 0.20306396484375, 0.20963287353515625, 0.2162017822265625, 0.22277069091796875, 0.229339599609375, 0.23590850830078125, 0.2424774169921875, 0.24904632568359375, 0.255615234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 17.0, 12.0, 20.0, 25.0, 51.0, 68.0, 100.0, 129.0, 172.0, 131.0, 78.0, 61.0, 33.0, 22.0, 20.0, 12.0, 11.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1607666015625, -0.1559600830078125, -0.151153564453125, -0.1463470458984375, -0.14154052734375, -0.1367340087890625, -0.131927490234375, -0.1271209716796875, -0.122314453125, -0.1175079345703125, -0.112701416015625, -0.1078948974609375, -0.10308837890625, -0.0982818603515625, -0.093475341796875, -0.0886688232421875, -0.0838623046875, -0.0790557861328125, -0.074249267578125, -0.0694427490234375, -0.06463623046875, -0.0598297119140625, -0.055023193359375, -0.0502166748046875, -0.04541015625, -0.0406036376953125, -0.035797119140625, -0.0309906005859375, -0.02618408203125, -0.0213775634765625, -0.016571044921875, -0.0117645263671875, -0.0069580078125, -0.0021514892578125, 0.002655029296875, 0.0074615478515625, 0.01226806640625, 0.0170745849609375, 0.021881103515625, 0.0266876220703125, 0.031494140625, 0.0363006591796875, 0.041107177734375, 0.0459136962890625, 0.05072021484375, 0.0555267333984375, 0.060333251953125, 0.0651397705078125, 0.0699462890625, 0.0747528076171875, 0.079559326171875, 0.0843658447265625, 0.08917236328125, 0.0939788818359375, 0.098785400390625, 0.1035919189453125, 0.1083984375, 0.1132049560546875, 0.118011474609375, 0.1228179931640625, 0.12762451171875, 0.1324310302734375, 0.137237548828125, 0.1420440673828125, 0.1468505859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 55.0, 92.0, 208.0, 383.0, 155.0, 47.0, 28.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.750192165374756, -3.6341590881347656, -3.5181257724761963, -3.402092695236206, -3.286059617996216, -3.1700263023376465, -3.0539932250976562, -2.937960147857666, -2.821927070617676, -2.7058939933776855, -2.589860677719116, -2.473827600479126, -2.3577945232391357, -2.2417612075805664, -2.125728130340576, -2.009695053100586, -1.8936617374420166, -1.7776285409927368, -1.6615954637527466, -1.5455622673034668, -1.4295291900634766, -1.3134959936141968, -1.197462797164917, -1.0814297199249268, -0.965396523475647, -0.849363386631012, -0.733330249786377, -0.6172970533370972, -0.5012639164924622, -0.38523077964782715, -0.26919758319854736, -0.15316444635391235, -0.037131309509277344, 0.07890184223651886, 0.19493499398231506, 0.31096816062927246, 0.42700129747390747, 0.5430344343185425, 0.6590676307678223, 0.7751007676124573, 0.8911339044570923, 1.007167100906372, 1.1232001781463623, 1.239233374595642, 1.3552665710449219, 1.471299648284912, 1.587332844734192, 1.7033660411834717, 1.819399118423462, 1.9354323148727417, 2.0514655113220215, 2.1674985885620117, 2.283531665802002, 2.399564743041992, 2.5155980587005615, 2.6316311359405518, 2.747664451599121, 2.8636975288391113, 2.9797308444976807, 3.095763921737671, 3.211796998977661, 3.3278303146362305, 3.4438633918762207, 3.559896469116211, 3.675929546356201]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 12.0, 6.0, 13.0, 14.0, 24.0, 19.0, 27.0, 22.0, 28.0, 35.0, 32.0, 44.0, 45.0, 59.0, 71.0, 63.0, 67.0, 60.0, 45.0, 33.0, 26.0, 21.0, 21.0, 25.0, 21.0, 17.0, 22.0, 15.0, 8.0, 9.0, 15.0, 8.0, 14.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.4265739917755127, -1.3821661472320557, -1.3377584218978882, -1.2933505773544312, -1.2489428520202637, -1.2045350074768066, -1.1601271629333496, -1.1157194375991821, -1.0713117122650146, -1.0269038677215576, -0.9824961423873901, -0.9380882978439331, -0.8936805725097656, -0.8492727279663086, -0.8048649430274963, -0.7604571580886841, -0.716049313545227, -0.6716415286064148, -0.6272337436676025, -0.5828258991241455, -0.538418173789978, -0.4940103590488434, -0.44960254430770874, -0.4051947593688965, -0.36078697443008423, -0.316379189491272, -0.2719714045524597, -0.22756358981132507, -0.18315580487251282, -0.13874801993370056, -0.09434020519256592, -0.04993242025375366, -0.005524754524230957, 0.038883037865161896, 0.08329083025455475, 0.1276986300945282, 0.17210641503334045, 0.2165141999721527, 0.26092201471328735, 0.3053297996520996, 0.34973758459091187, 0.3941453695297241, 0.4385531544685364, 0.482960969209671, 0.5273687839508057, 0.5717765092849731, 0.6161843538284302, 0.6605921387672424, 0.7049999237060547, 0.7494077086448669, 0.7938154935836792, 0.8382233381271362, 0.8826310634613037, 0.9270389080047607, 0.971446692943573, 1.0158544778823853, 1.0602622032165527, 1.1046700477600098, 1.1490777730941772, 1.1934856176376343, 1.2378933429718018, 1.2823011875152588, 1.3267090320587158, 1.3711167573928833, 1.4155246019363403]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 14.0, 16.0, 37.0, 46.0, 74.0, 135.0, 179.0, 299.0, 475.0, 738.0, 1380.0, 2306.0, 4219.0, 8160.0, 16659.0, 37654.0, 97272.0, 298451.0, 1000340.0, 1762845.0, 653703.0, 190244.0, 65268.0, 26910.0, 12390.0, 6166.0, 3448.0, 1962.0, 1071.0, 722.0, 387.0, 246.0, 145.0, 102.0, 62.0, 48.0, 28.0, 22.0, 9.0, 12.0, 4.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.1021728515625, -0.09901142120361328, -0.09584999084472656, -0.09268856048583984, -0.08952713012695312, -0.0863656997680664, -0.08320426940917969, -0.08004283905029297, -0.07688140869140625, -0.07371997833251953, -0.07055854797363281, -0.0673971176147461, -0.06423568725585938, -0.061074256896972656, -0.05791282653808594, -0.05475139617919922, -0.0515899658203125, -0.04842853546142578, -0.04526710510253906, -0.042105674743652344, -0.038944244384765625, -0.035782814025878906, -0.03262138366699219, -0.02945995330810547, -0.02629852294921875, -0.02313709259033203, -0.019975662231445312, -0.016814231872558594, -0.013652801513671875, -0.010491371154785156, -0.0073299407958984375, -0.004168510437011719, -0.001007080078125, 0.0021543502807617188, 0.0053157806396484375, 0.008477210998535156, 0.011638641357421875, 0.014800071716308594, 0.017961502075195312, 0.02112293243408203, 0.02428436279296875, 0.02744579315185547, 0.030607223510742188, 0.033768653869628906, 0.036930084228515625, 0.040091514587402344, 0.04325294494628906, 0.04641437530517578, 0.0495758056640625, 0.05273723602294922, 0.05589866638183594, 0.059060096740722656, 0.062221527099609375, 0.0653829574584961, 0.06854438781738281, 0.07170581817626953, 0.07486724853515625, 0.07802867889404297, 0.08119010925292969, 0.0843515396118164, 0.08751296997070312, 0.09067440032958984, 0.09383583068847656, 0.09699726104736328, 0.10015869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 11.0, 22.0, 18.0, 14.0, 30.0, 29.0, 28.0, 26.0, 44.0, 61.0, 35.0, 47.0, 54.0, 43.0, 42.0, 48.0, 57.0, 36.0, 36.0, 48.0, 27.0, 31.0, 24.0, 23.0, 26.0, 16.0, 17.0, 18.0, 5.0, 10.0, 5.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.10357666015625, -0.10036563873291016, -0.09715461730957031, -0.09394359588623047, -0.09073257446289062, -0.08752155303955078, -0.08431053161621094, -0.0810995101928711, -0.07788848876953125, -0.0746774673461914, -0.07146644592285156, -0.06825542449951172, -0.06504440307617188, -0.06183338165283203, -0.05862236022949219, -0.055411338806152344, -0.0522003173828125, -0.048989295959472656, -0.04577827453613281, -0.04256725311279297, -0.039356231689453125, -0.03614521026611328, -0.03293418884277344, -0.029723167419433594, -0.02651214599609375, -0.023301124572753906, -0.020090103149414062, -0.01687908172607422, -0.013668060302734375, -0.010457038879394531, -0.0072460174560546875, -0.004034996032714844, -0.000823974609375, 0.0023870468139648438, 0.0055980682373046875, 0.008809089660644531, 0.012020111083984375, 0.015231132507324219, 0.018442153930664062, 0.021653175354003906, 0.02486419677734375, 0.028075218200683594, 0.03128623962402344, 0.03449726104736328, 0.037708282470703125, 0.04091930389404297, 0.04413032531738281, 0.047341346740722656, 0.0505523681640625, 0.053763389587402344, 0.05697441101074219, 0.06018543243408203, 0.06339645385742188, 0.06660747528076172, 0.06981849670410156, 0.0730295181274414, 0.07624053955078125, 0.0794515609741211, 0.08266258239746094, 0.08587360382080078, 0.08908462524414062, 0.09229564666748047, 0.09550666809082031, 0.09871768951416016, 0.1019287109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 15.0, 12.0, 26.0, 33.0, 43.0, 68.0, 115.0, 238.0, 465.0, 1390.0, 6516.0, 48851.0, 902653.0, 3084150.0, 132315.0, 13540.0, 2426.0, 655.0, 272.0, 157.0, 97.0, 60.0, 48.0, 17.0, 23.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26018524169921875, -0.2498626708984375, -0.23954010009765625, -0.229217529296875, -0.21889495849609375, -0.2085723876953125, -0.19824981689453125, -0.18792724609375, -0.17760467529296875, -0.1672821044921875, -0.15695953369140625, -0.146636962890625, -0.13631439208984375, -0.1259918212890625, -0.11566925048828125, -0.1053466796875, -0.09502410888671875, -0.0847015380859375, -0.07437896728515625, -0.064056396484375, -0.05373382568359375, -0.0434112548828125, -0.03308868408203125, -0.02276611328125, -0.01244354248046875, -0.0021209716796875, 0.00820159912109375, 0.018524169921875, 0.02884674072265625, 0.0391693115234375, 0.04949188232421875, 0.059814453125, 0.07013702392578125, 0.0804595947265625, 0.09078216552734375, 0.101104736328125, 0.11142730712890625, 0.1217498779296875, 0.13207244873046875, 0.14239501953125, 0.15271759033203125, 0.1630401611328125, 0.17336273193359375, 0.183685302734375, 0.19400787353515625, 0.2043304443359375, 0.21465301513671875, 0.2249755859375, 0.23529815673828125, 0.2456207275390625, 0.25594329833984375, 0.266265869140625, 0.27658843994140625, 0.2869110107421875, 0.29723358154296875, 0.30755615234375, 0.31787872314453125, 0.3282012939453125, 0.33852386474609375, 0.348846435546875, 0.35916900634765625, 0.3694915771484375, 0.37981414794921875, 0.39013671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 20.0, 22.0, 28.0, 43.0, 40.0, 66.0, 84.0, 113.0, 144.0, 203.0, 265.0, 355.0, 469.0, 502.0, 423.0, 310.0, 235.0, 177.0, 143.0, 83.0, 66.0, 64.0, 36.0, 20.0, 27.0, 16.0, 16.0, 9.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1950206756591797, -0.18899154663085938, -0.18296241760253906, -0.17693328857421875, -0.17090415954589844, -0.16487503051757812, -0.1588459014892578, -0.1528167724609375, -0.1467876434326172, -0.14075851440429688, -0.13472938537597656, -0.12870025634765625, -0.12267112731933594, -0.11664199829101562, -0.11061286926269531, -0.104583740234375, -0.09855461120605469, -0.09252548217773438, -0.08649635314941406, -0.08046722412109375, -0.07443809509277344, -0.06840896606445312, -0.06237983703613281, -0.0563507080078125, -0.05032157897949219, -0.044292449951171875, -0.03826332092285156, -0.03223419189453125, -0.026205062866210938, -0.020175933837890625, -0.014146804809570312, -0.00811767578125, -0.0020885467529296875, 0.003940582275390625, 0.009969711303710938, 0.01599884033203125, 0.022027969360351562, 0.028057098388671875, 0.03408622741699219, 0.0401153564453125, 0.04614448547363281, 0.052173614501953125, 0.05820274353027344, 0.06423187255859375, 0.07026100158691406, 0.07629013061523438, 0.08231925964355469, 0.088348388671875, 0.09437751770019531, 0.10040664672851562, 0.10643577575683594, 0.11246490478515625, 0.11849403381347656, 0.12452316284179688, 0.1305522918701172, 0.1365814208984375, 0.1426105499267578, 0.14863967895507812, 0.15466880798339844, 0.16069793701171875, 0.16672706604003906, 0.17275619506835938, 0.1787853240966797, 0.184814453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 10.0, 6.0, 21.0, 42.0, 90.0, 132.0, 186.0, 217.0, 149.0, 65.0, 39.0, 22.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.780270576477051, -4.6871161460876465, -4.593961715698242, -4.50080680847168, -4.407652378082275, -4.314497947692871, -4.221343517303467, -4.1281890869140625, -4.0350341796875, -3.9418797492980957, -3.8487250804901123, -3.755570650100708, -3.6624159812927246, -3.5692615509033203, -3.476107120513916, -3.3829524517059326, -3.2897980213165283, -3.196643590927124, -3.1034889221191406, -3.0103344917297363, -2.917179822921753, -2.8240253925323486, -2.7308707237243652, -2.637716293334961, -2.5445618629455566, -2.4514074325561523, -2.358252763748169, -2.2650983333587646, -2.1719436645507812, -2.078789234161377, -1.985634684562683, -1.8924801349639893, -1.7993252277374268, -1.706170678138733, -1.613016128540039, -1.5198616981506348, -1.4267070293426514, -1.333552598953247, -1.2403980493545532, -1.1472434997558594, -1.0540889501571655, -0.9609344005584717, -0.8677798509597778, -0.7746253609657288, -0.6814708113670349, -0.5883162617683411, -0.495161771774292, -0.40200722217559814, -0.3088526725769043, -0.21569813787937164, -0.12254360318183899, -0.02938908338546753, 0.06376546621322632, 0.15692001581192017, 0.25007450580596924, 0.3432290554046631, 0.43638360500335693, 0.5295381546020508, 0.6226927042007446, 0.7158471941947937, 0.8090017437934875, 0.9021562933921814, 0.9953107833862305, 1.0884653329849243, 1.1816198825836182]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 16.0, 20.0, 31.0, 38.0, 36.0, 40.0, 38.0, 41.0, 36.0, 44.0, 44.0, 54.0, 44.0, 39.0, 49.0, 52.0, 41.0, 41.0, 43.0, 41.0, 32.0, 26.0, 26.0, 16.0, 10.0, 12.0, 8.0, 11.0, 9.0, 6.0, 6.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.13295578956604, -1.0957857370376587, -1.058615803718567, -1.0214457511901855, -0.984275758266449, -0.9471057653427124, -0.909935712814331, -0.8727657198905945, -0.8355957269668579, -0.7984257340431213, -0.7612557411193848, -0.7240856885910034, -0.6869156956672668, -0.6497457027435303, -0.6125756502151489, -0.5754056572914124, -0.5382356643676758, -0.5010656714439392, -0.46389564871788025, -0.4267256259918213, -0.3895556330680847, -0.35238564014434814, -0.3152156174182892, -0.2780455946922302, -0.24087560176849365, -0.2037055939435959, -0.16653558611869812, -0.12936557829380035, -0.09219557046890259, -0.05502556264400482, -0.017855554819107056, 0.019314467906951904, 0.05648446083068848, 0.09365446865558624, 0.130824476480484, 0.16799448430538177, 0.20516449213027954, 0.2423344999551773, 0.2795045077800751, 0.31667453050613403, 0.3538445234298706, 0.3910145163536072, 0.42818453907966614, 0.4653545618057251, 0.5025245547294617, 0.5396945476531982, 0.5768646001815796, 0.6140345931053162, 0.6512045860290527, 0.6883745789527893, 0.7255445718765259, 0.7627146244049072, 0.7998846173286438, 0.8370546102523804, 0.8742246627807617, 0.9113946557044983, 0.9485646486282349, 0.9857346415519714, 1.022904634475708, 1.0600746870040894, 1.0972447395324707, 1.1344146728515625, 1.1715847253799438, 1.2087547779083252, 1.245924711227417]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 13.0, 15.0, 14.0, 30.0, 44.0, 66.0, 115.0, 126.0, 227.0, 374.0, 611.0, 1029.0, 1734.0, 3559.0, 7302.0, 16019.0, 39553.0, 112505.0, 335226.0, 341060.0, 116146.0, 40555.0, 16581.0, 7438.0, 3647.0, 1852.0, 1051.0, 562.0, 384.0, 238.0, 179.0, 110.0, 64.0, 44.0, 22.0, 21.0, 14.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12422752380371094, -0.11979293823242188, -0.11535835266113281, -0.11092376708984375, -0.10648918151855469, -0.10205459594726562, -0.09762001037597656, -0.0931854248046875, -0.08875083923339844, -0.08431625366210938, -0.07988166809082031, -0.07544708251953125, -0.07101249694824219, -0.06657791137695312, -0.06214332580566406, -0.057708740234375, -0.05327415466308594, -0.048839569091796875, -0.04440498352050781, -0.03997039794921875, -0.03553581237792969, -0.031101226806640625, -0.026666641235351562, -0.0222320556640625, -0.017797470092773438, -0.013362884521484375, -0.008928298950195312, -0.00449371337890625, -5.91278076171875e-05, 0.004375457763671875, 0.008810043334960938, 0.01324462890625, 0.017679214477539062, 0.022113800048828125, 0.026548385620117188, 0.03098297119140625, 0.03541755676269531, 0.039852142333984375, 0.04428672790527344, 0.0487213134765625, 0.05315589904785156, 0.057590484619140625, 0.06202507019042969, 0.06645965576171875, 0.07089424133300781, 0.07532882690429688, 0.07976341247558594, 0.084197998046875, 0.08863258361816406, 0.09306716918945312, 0.09750175476074219, 0.10193634033203125, 0.10637092590332031, 0.11080551147460938, 0.11524009704589844, 0.1196746826171875, 0.12410926818847656, 0.12854385375976562, 0.1329784393310547, 0.13741302490234375, 0.1418476104736328, 0.14628219604492188, 0.15071678161621094, 0.1551513671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 11.0, 19.0, 17.0, 24.0, 32.0, 19.0, 37.0, 38.0, 24.0, 42.0, 47.0, 48.0, 46.0, 68.0, 62.0, 56.0, 43.0, 46.0, 28.0, 36.0, 34.0, 36.0, 30.0, 29.0, 23.0, 25.0, 17.0, 13.0, 13.0, 4.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12385940551757812, -0.11991119384765625, -0.11596298217773438, -0.1120147705078125, -0.10806655883789062, -0.10411834716796875, -0.10017013549804688, -0.096221923828125, -0.09227371215820312, -0.08832550048828125, -0.08437728881835938, -0.0804290771484375, -0.07648086547851562, -0.07253265380859375, -0.06858444213867188, -0.06463623046875, -0.060688018798828125, -0.05673980712890625, -0.052791595458984375, -0.0488433837890625, -0.044895172119140625, -0.04094696044921875, -0.036998748779296875, -0.033050537109375, -0.029102325439453125, -0.02515411376953125, -0.021205902099609375, -0.0172576904296875, -0.013309478759765625, -0.00936126708984375, -0.005413055419921875, -0.00146484375, 0.002483367919921875, 0.00643157958984375, 0.010379791259765625, 0.0143280029296875, 0.018276214599609375, 0.02222442626953125, 0.026172637939453125, 0.030120849609375, 0.034069061279296875, 0.03801727294921875, 0.041965484619140625, 0.0459136962890625, 0.049861907958984375, 0.05381011962890625, 0.057758331298828125, 0.06170654296875, 0.06565475463867188, 0.06960296630859375, 0.07355117797851562, 0.0774993896484375, 0.08144760131835938, 0.08539581298828125, 0.08934402465820312, 0.093292236328125, 0.09724044799804688, 0.10118865966796875, 0.10513687133789062, 0.1090850830078125, 0.11303329467773438, 0.11698150634765625, 0.12092971801757812, 0.1248779296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 8.0, 20.0, 30.0, 32.0, 52.0, 80.0, 109.0, 167.0, 298.0, 505.0, 1014.0, 2421.0, 7933.0, 46813.0, 751485.0, 208703.0, 20823.0, 4562.0, 1634.0, 782.0, 385.0, 235.0, 146.0, 87.0, 66.0, 50.0, 37.0, 19.0, 7.0, 13.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2997550964355469, -0.28969573974609375, -0.2796363830566406, -0.2695770263671875, -0.2595176696777344, -0.24945831298828125, -0.23939895629882812, -0.229339599609375, -0.21928024291992188, -0.20922088623046875, -0.19916152954101562, -0.1891021728515625, -0.17904281616210938, -0.16898345947265625, -0.15892410278320312, -0.14886474609375, -0.13880538940429688, -0.12874603271484375, -0.11868667602539062, -0.1086273193359375, -0.09856796264648438, -0.08850860595703125, -0.07844924926757812, -0.068389892578125, -0.058330535888671875, -0.04827117919921875, -0.038211822509765625, -0.0281524658203125, -0.018093109130859375, -0.00803375244140625, 0.002025604248046875, 0.0120849609375, 0.022144317626953125, 0.03220367431640625, 0.042263031005859375, 0.0523223876953125, 0.062381744384765625, 0.07244110107421875, 0.08250045776367188, 0.092559814453125, 0.10261917114257812, 0.11267852783203125, 0.12273788452148438, 0.1327972412109375, 0.14285659790039062, 0.15291595458984375, 0.16297531127929688, 0.17303466796875, 0.18309402465820312, 0.19315338134765625, 0.20321273803710938, 0.2132720947265625, 0.22333145141601562, 0.23339080810546875, 0.24345016479492188, 0.253509521484375, 0.2635688781738281, 0.27362823486328125, 0.2836875915527344, 0.2937469482421875, 0.3038063049316406, 0.31386566162109375, 0.3239250183105469, 0.333984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 9.0, 3.0, 6.0, 11.0, 4.0, 14.0, 17.0, 23.0, 28.0, 24.0, 47.0, 37.0, 51.0, 39.0, 71.0, 76.0, 74.0, 75.0, 69.0, 56.0, 53.0, 37.0, 32.0, 40.0, 24.0, 26.0, 15.0, 12.0, 6.0, 11.0, 4.0, 2.0, 3.0, 6.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4389190673828125, -0.420318603515625, -0.4017181396484375, -0.38311767578125, -0.3645172119140625, -0.345916748046875, -0.3273162841796875, -0.3087158203125, -0.2901153564453125, -0.271514892578125, -0.2529144287109375, -0.23431396484375, -0.2157135009765625, -0.197113037109375, -0.1785125732421875, -0.159912109375, -0.1413116455078125, -0.122711181640625, -0.1041107177734375, -0.08551025390625, -0.0669097900390625, -0.048309326171875, -0.0297088623046875, -0.0111083984375, 0.0074920654296875, 0.026092529296875, 0.0446929931640625, 0.06329345703125, 0.0818939208984375, 0.100494384765625, 0.1190948486328125, 0.1376953125, 0.1562957763671875, 0.174896240234375, 0.1934967041015625, 0.21209716796875, 0.2306976318359375, 0.249298095703125, 0.2678985595703125, 0.2864990234375, 0.3050994873046875, 0.323699951171875, 0.3423004150390625, 0.36090087890625, 0.3795013427734375, 0.398101806640625, 0.4167022705078125, 0.435302734375, 0.4539031982421875, 0.472503662109375, 0.4911041259765625, 0.50970458984375, 0.5283050537109375, 0.546905517578125, 0.5655059814453125, 0.5841064453125, 0.6027069091796875, 0.621307373046875, 0.6399078369140625, 0.65850830078125, 0.6771087646484375, 0.695709228515625, 0.7143096923828125, 0.73291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 12.0, 17.0, 20.0, 27.0, 52.0, 73.0, 107.0, 165.0, 348.0, 785.0, 1903.0, 5516.0, 19496.0, 104913.0, 758454.0, 124819.0, 22042.0, 6027.0, 2071.0, 851.0, 393.0, 182.0, 109.0, 51.0, 39.0, 26.0, 19.0, 10.0, 10.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.09893798828125, -0.09623050689697266, -0.09352302551269531, -0.09081554412841797, -0.08810806274414062, -0.08540058135986328, -0.08269309997558594, -0.0799856185913086, -0.07727813720703125, -0.0745706558227539, -0.07186317443847656, -0.06915569305419922, -0.06644821166992188, -0.06374073028564453, -0.06103324890136719, -0.058325767517089844, -0.0556182861328125, -0.052910804748535156, -0.05020332336425781, -0.04749584197998047, -0.044788360595703125, -0.04208087921142578, -0.03937339782714844, -0.036665916442871094, -0.03395843505859375, -0.031250953674316406, -0.028543472290039062, -0.02583599090576172, -0.023128509521484375, -0.02042102813720703, -0.017713546752929688, -0.015006065368652344, -0.012298583984375, -0.009591102600097656, -0.0068836212158203125, -0.004176139831542969, -0.001468658447265625, 0.0012388229370117188, 0.0039463043212890625, 0.006653785705566406, 0.00936126708984375, 0.012068748474121094, 0.014776229858398438, 0.01748371124267578, 0.020191192626953125, 0.02289867401123047, 0.025606155395507812, 0.028313636779785156, 0.0310211181640625, 0.033728599548339844, 0.03643608093261719, 0.03914356231689453, 0.041851043701171875, 0.04455852508544922, 0.04726600646972656, 0.049973487854003906, 0.05268096923828125, 0.055388450622558594, 0.05809593200683594, 0.06080341339111328, 0.06351089477539062, 0.06621837615966797, 0.06892585754394531, 0.07163333892822266, 0.0743408203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 10.0, 10.0, 13.0, 30.0, 38.0, 46.0, 63.0, 103.0, 117.0, 131.0, 89.0, 77.0, 50.0, 50.0, 38.0, 35.0, 20.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1961669921875e-05, -4.0815211832523346e-05, -3.966875374317169e-05, -3.852229565382004e-05, -3.7375837564468384e-05, -3.622937947511673e-05, -3.5082921385765076e-05, -3.393646329641342e-05, -3.279000520706177e-05, -3.1643547117710114e-05, -3.049708902835846e-05, -2.9350630939006805e-05, -2.820417284965515e-05, -2.7057714760303497e-05, -2.5911256670951843e-05, -2.476479858160019e-05, -2.3618340492248535e-05, -2.247188240289688e-05, -2.1325424313545227e-05, -2.0178966224193573e-05, -1.903250813484192e-05, -1.7886050045490265e-05, -1.673959195613861e-05, -1.5593133866786957e-05, -1.4446675777435303e-05, -1.3300217688083649e-05, -1.2153759598731995e-05, -1.100730150938034e-05, -9.860843420028687e-06, -8.714385330677032e-06, -7.567927241325378e-06, -6.421469151973724e-06, -5.27501106262207e-06, -4.128552973270416e-06, -2.982094883918762e-06, -1.8356367945671082e-06, -6.891787052154541e-07, 4.5727938413619995e-07, 1.603737473487854e-06, 2.750195562839508e-06, 3.896653652191162e-06, 5.043111741542816e-06, 6.18956983089447e-06, 7.336027920246124e-06, 8.482486009597778e-06, 9.628944098949432e-06, 1.0775402188301086e-05, 1.192186027765274e-05, 1.3068318367004395e-05, 1.4214776456356049e-05, 1.5361234545707703e-05, 1.6507692635059357e-05, 1.765415072441101e-05, 1.8800608813762665e-05, 1.994706690311432e-05, 2.1093524992465973e-05, 2.2239983081817627e-05, 2.338644117116928e-05, 2.4532899260520935e-05, 2.567935734987259e-05, 2.6825815439224243e-05, 2.7972273528575897e-05, 2.911873161792755e-05, 3.0265189707279205e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 13.0, 20.0, 19.0, 28.0, 42.0, 47.0, 96.0, 127.0, 196.0, 336.0, 552.0, 1041.0, 2103.0, 4865.0, 13082.0, 41519.0, 158794.0, 646894.0, 125512.0, 33769.0, 11069.0, 4233.0, 1841.0, 969.0, 496.0, 275.0, 171.0, 140.0, 83.0, 57.0, 41.0, 31.0, 19.0, 16.0, 7.0, 13.0, 3.0, 11.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0679931640625, -0.06595849990844727, -0.06392383575439453, -0.0618891716003418, -0.05985450744628906, -0.05781984329223633, -0.055785179138183594, -0.05375051498413086, -0.051715850830078125, -0.04968118667602539, -0.047646522521972656, -0.04561185836791992, -0.04357719421386719, -0.04154253005981445, -0.03950786590576172, -0.037473201751708984, -0.03543853759765625, -0.033403873443603516, -0.03136920928955078, -0.029334545135498047, -0.027299880981445312, -0.025265216827392578, -0.023230552673339844, -0.02119588851928711, -0.019161224365234375, -0.01712656021118164, -0.015091896057128906, -0.013057231903076172, -0.011022567749023438, -0.008987903594970703, -0.006953239440917969, -0.004918575286865234, -0.0028839111328125, -0.0008492469787597656, 0.0011854171752929688, 0.003220081329345703, 0.0052547454833984375, 0.007289409637451172, 0.009324073791503906, 0.01135873794555664, 0.013393402099609375, 0.01542806625366211, 0.017462730407714844, 0.019497394561767578, 0.021532058715820312, 0.023566722869873047, 0.02560138702392578, 0.027636051177978516, 0.02967071533203125, 0.031705379486083984, 0.03374004364013672, 0.03577470779418945, 0.03780937194824219, 0.03984403610229492, 0.041878700256347656, 0.04391336441040039, 0.045948028564453125, 0.04798269271850586, 0.050017356872558594, 0.05205202102661133, 0.05408668518066406, 0.0561213493347168, 0.05815601348876953, 0.060190677642822266, 0.062225341796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 12.0, 14.0, 18.0, 28.0, 19.0, 24.0, 27.0, 61.0, 51.0, 83.0, 84.0, 90.0, 99.0, 85.0, 72.0, 49.0, 40.0, 26.0, 25.0, 16.0, 13.0, 10.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06919288635253906, -0.06654739379882812, -0.06390190124511719, -0.06125640869140625, -0.05861091613769531, -0.055965423583984375, -0.05331993103027344, -0.0506744384765625, -0.04802894592285156, -0.045383453369140625, -0.04273796081542969, -0.04009246826171875, -0.03744697570800781, -0.034801483154296875, -0.03215599060058594, -0.029510498046875, -0.026865005493164062, -0.024219512939453125, -0.021574020385742188, -0.01892852783203125, -0.016283035278320312, -0.013637542724609375, -0.010992050170898438, -0.0083465576171875, -0.0057010650634765625, -0.003055572509765625, -0.0004100799560546875, 0.00223541259765625, 0.0048809051513671875, 0.007526397705078125, 0.010171890258789062, 0.0128173828125, 0.015462875366210938, 0.018108367919921875, 0.020753860473632812, 0.02339935302734375, 0.026044845581054688, 0.028690338134765625, 0.03133583068847656, 0.0339813232421875, 0.03662681579589844, 0.039272308349609375, 0.04191780090332031, 0.04456329345703125, 0.04720878601074219, 0.049854278564453125, 0.05249977111816406, 0.055145263671875, 0.05779075622558594, 0.060436248779296875, 0.06308174133300781, 0.06572723388671875, 0.06837272644042969, 0.07101821899414062, 0.07366371154785156, 0.0763092041015625, 0.07895469665527344, 0.08160018920898438, 0.08424568176269531, 0.08689117431640625, 0.08953666687011719, 0.09218215942382812, 0.09482765197753906, 0.09747314453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 29.0, 129.0, 453.0, 211.0, 88.0, 30.0, 15.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8410844802856445, -2.726147413253784, -2.611210584640503, -2.4962735176086426, -2.3813366889953613, -2.266399621963501, -2.1514627933502197, -2.0365257263183594, -1.9215888977050781, -1.8066519498825073, -1.6917150020599365, -1.5767780542373657, -1.461841106414795, -1.3469040393829346, -1.2319672107696533, -1.117030143737793, -1.0020931959152222, -0.8871562480926514, -0.7722193002700806, -0.6572823524475098, -0.542345404624939, -0.4274083971977234, -0.3124714493751526, -0.1975345015525818, -0.08259755373001099, 0.03233940154314041, 0.1472763568162918, 0.2622133195400238, 0.3771502673625946, 0.4920872449874878, 0.6070241928100586, 0.7219611406326294, 0.8368980884552002, 0.951835036277771, 1.0667719841003418, 1.1817089319229126, 1.2966458797454834, 1.4115829467773438, 1.526519775390625, 1.6414568424224854, 1.7563936710357666, 1.8713306188583374, 1.9862675666809082, 2.1012046337127686, 2.21614146232605, 2.33107852935791, 2.4460153579711914, 2.5609524250030518, 2.675889492034912, 2.7908265590667725, 2.9057633876800537, 3.020700454711914, 3.1356372833251953, 3.2505743503570557, 3.365511178970337, 3.4804482460021973, 3.5953850746154785, 3.710322141647339, 3.82525897026062, 3.9401960372924805, 4.055132865905762, 4.170069694519043, 4.285006999969482, 4.399943828582764, 4.514880657196045]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 11.0, 6.0, 4.0, 9.0, 11.0, 14.0, 16.0, 13.0, 15.0, 20.0, 19.0, 24.0, 23.0, 27.0, 54.0, 59.0, 77.0, 121.0, 99.0, 72.0, 51.0, 33.0, 29.0, 27.0, 18.0, 28.0, 21.0, 23.0, 10.0, 5.0, 13.0, 7.0, 8.0, 9.0, 4.0, 7.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8421064615249634, -1.7893468141555786, -1.7365871667861938, -1.683827519416809, -1.6310678720474243, -1.5783082246780396, -1.5255485773086548, -1.47278892993927, -1.4200292825698853, -1.3672696352005005, -1.3145099878311157, -1.261750340461731, -1.2089906930923462, -1.1562310457229614, -1.1034713983535767, -1.050711750984192, -0.9979521036148071, -0.9451924562454224, -0.8924328088760376, -0.8396731615066528, -0.7869135141372681, -0.7341538667678833, -0.6813942193984985, -0.6286345720291138, -0.575874924659729, -0.5231152772903442, -0.4703556299209595, -0.4175959825515747, -0.36483633518218994, -0.3120766878128052, -0.2593170404434204, -0.20655739307403564, -0.15379774570465088, -0.10103809833526611, -0.04827845096588135, 0.004481196403503418, 0.057240843772888184, 0.11000049114227295, 0.16276013851165771, 0.21551978588104248, 0.26827943325042725, 0.321039080619812, 0.3737987279891968, 0.42655837535858154, 0.4793180227279663, 0.5320776700973511, 0.5848373174667358, 0.6375969648361206, 0.6903566122055054, 0.7431162595748901, 0.7958759069442749, 0.8486355543136597, 0.9013952016830444, 0.9541548490524292, 1.006914496421814, 1.0596741437911987, 1.1124337911605835, 1.1651934385299683, 1.217953085899353, 1.2707127332687378, 1.3234723806381226, 1.3762320280075073, 1.428991675376892, 1.4817513227462769, 1.5345109701156616]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 14.0, 21.0, 34.0, 64.0, 80.0, 135.0, 246.0, 416.0, 784.0, 1401.0, 2919.0, 6328.0, 15285.0, 39835.0, 121174.0, 436136.0, 1440325.0, 1486981.0, 447735.0, 124885.0, 40458.0, 15601.0, 6734.0, 3225.0, 1526.0, 842.0, 433.0, 273.0, 140.0, 95.0, 67.0, 38.0, 20.0, 7.0, 10.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15314483642578125, -0.1474761962890625, -0.14180755615234375, -0.136138916015625, -0.13047027587890625, -0.1248016357421875, -0.11913299560546875, -0.11346435546875, -0.10779571533203125, -0.1021270751953125, -0.09645843505859375, -0.090789794921875, -0.08512115478515625, -0.0794525146484375, -0.07378387451171875, -0.068115234375, -0.06244659423828125, -0.0567779541015625, -0.05110931396484375, -0.045440673828125, -0.03977203369140625, -0.0341033935546875, -0.02843475341796875, -0.02276611328125, -0.01709747314453125, -0.0114288330078125, -0.00576019287109375, -9.1552734375e-05, 0.00557708740234375, 0.0112457275390625, 0.01691436767578125, 0.0225830078125, 0.02825164794921875, 0.0339202880859375, 0.03958892822265625, 0.045257568359375, 0.05092620849609375, 0.0565948486328125, 0.06226348876953125, 0.06793212890625, 0.07360076904296875, 0.0792694091796875, 0.08493804931640625, 0.090606689453125, 0.09627532958984375, 0.1019439697265625, 0.10761260986328125, 0.11328125, 0.11894989013671875, 0.1246185302734375, 0.13028717041015625, 0.135955810546875, 0.14162445068359375, 0.1472930908203125, 0.15296173095703125, 0.15863037109375, 0.16429901123046875, 0.1699676513671875, 0.17563629150390625, 0.181304931640625, 0.18697357177734375, 0.1926422119140625, 0.19831085205078125, 0.2039794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 5.0, 9.0, 8.0, 9.0, 11.0, 12.0, 14.0, 10.0, 20.0, 20.0, 28.0, 25.0, 35.0, 45.0, 30.0, 37.0, 35.0, 40.0, 38.0, 49.0, 49.0, 50.0, 38.0, 43.0, 36.0, 28.0, 35.0, 38.0, 20.0, 27.0, 20.0, 30.0, 16.0, 16.0, 13.0, 11.0, 13.0, 10.0, 5.0, 5.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09203910827636719, -0.08898544311523438, -0.08593177795410156, -0.08287811279296875, -0.07982444763183594, -0.07677078247070312, -0.07371711730957031, -0.0706634521484375, -0.06760978698730469, -0.06455612182617188, -0.06150245666503906, -0.05844879150390625, -0.05539512634277344, -0.052341461181640625, -0.04928779602050781, -0.046234130859375, -0.04318046569824219, -0.040126800537109375, -0.03707313537597656, -0.03401947021484375, -0.030965805053710938, -0.027912139892578125, -0.024858474731445312, -0.0218048095703125, -0.018751144409179688, -0.015697479248046875, -0.012643814086914062, -0.00959014892578125, -0.0065364837646484375, -0.003482818603515625, -0.0004291534423828125, 0.00262451171875, 0.0056781768798828125, 0.008731842041015625, 0.011785507202148438, 0.01483917236328125, 0.017892837524414062, 0.020946502685546875, 0.024000167846679688, 0.0270538330078125, 0.030107498168945312, 0.033161163330078125, 0.03621482849121094, 0.03926849365234375, 0.04232215881347656, 0.045375823974609375, 0.04842948913574219, 0.051483154296875, 0.05453681945800781, 0.057590484619140625, 0.06064414978027344, 0.06369781494140625, 0.06675148010253906, 0.06980514526367188, 0.07285881042480469, 0.0759124755859375, 0.07896614074707031, 0.08201980590820312, 0.08507347106933594, 0.08812713623046875, 0.09118080139160156, 0.09423446655273438, 0.09728813171386719, 0.100341796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 8.0, 14.0, 25.0, 33.0, 40.0, 78.0, 143.0, 270.0, 572.0, 1414.0, 6135.0, 188943.0, 3957168.0, 34109.0, 3303.0, 998.0, 435.0, 230.0, 132.0, 81.0, 47.0, 36.0, 12.0, 13.0, 9.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.233551025390625, -1.20050048828125, -1.167449951171875, -1.1343994140625, -1.101348876953125, -1.06829833984375, -1.035247802734375, -1.002197265625, -0.969146728515625, -0.93609619140625, -0.903045654296875, -0.8699951171875, -0.836944580078125, -0.80389404296875, -0.770843505859375, -0.73779296875, -0.704742431640625, -0.67169189453125, -0.638641357421875, -0.6055908203125, -0.572540283203125, -0.53948974609375, -0.506439208984375, -0.473388671875, -0.440338134765625, -0.40728759765625, -0.374237060546875, -0.3411865234375, -0.308135986328125, -0.27508544921875, -0.242034912109375, -0.208984375, -0.175933837890625, -0.14288330078125, -0.109832763671875, -0.0767822265625, -0.043731689453125, -0.01068115234375, 0.022369384765625, 0.055419921875, 0.088470458984375, 0.12152099609375, 0.154571533203125, 0.1876220703125, 0.220672607421875, 0.25372314453125, 0.286773681640625, 0.31982421875, 0.352874755859375, 0.38592529296875, 0.418975830078125, 0.4520263671875, 0.485076904296875, 0.51812744140625, 0.551177978515625, 0.584228515625, 0.617279052734375, 0.65032958984375, 0.683380126953125, 0.7164306640625, 0.749481201171875, 0.78253173828125, 0.815582275390625, 0.8486328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 3.0, 12.0, 12.0, 24.0, 25.0, 21.0, 36.0, 56.0, 70.0, 107.0, 147.0, 175.0, 217.0, 301.0, 382.0, 503.0, 485.0, 347.0, 272.0, 242.0, 171.0, 130.0, 80.0, 71.0, 40.0, 39.0, 40.0, 16.0, 5.0, 6.0, 5.0, 8.0, 3.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.29645538330078125, -0.2845611572265625, -0.27266693115234375, -0.260772705078125, -0.24887847900390625, -0.2369842529296875, -0.22509002685546875, -0.21319580078125, -0.20130157470703125, -0.1894073486328125, -0.17751312255859375, -0.165618896484375, -0.15372467041015625, -0.1418304443359375, -0.12993621826171875, -0.1180419921875, -0.10614776611328125, -0.0942535400390625, -0.08235931396484375, -0.070465087890625, -0.05857086181640625, -0.0466766357421875, -0.03478240966796875, -0.02288818359375, -0.01099395751953125, 0.0009002685546875, 0.01279449462890625, 0.024688720703125, 0.03658294677734375, 0.0484771728515625, 0.06037139892578125, 0.072265625, 0.08415985107421875, 0.0960540771484375, 0.10794830322265625, 0.119842529296875, 0.13173675537109375, 0.1436309814453125, 0.15552520751953125, 0.16741943359375, 0.17931365966796875, 0.1912078857421875, 0.20310211181640625, 0.214996337890625, 0.22689056396484375, 0.2387847900390625, 0.25067901611328125, 0.2625732421875, 0.27446746826171875, 0.2863616943359375, 0.29825592041015625, 0.310150146484375, 0.32204437255859375, 0.3339385986328125, 0.34583282470703125, 0.35772705078125, 0.36962127685546875, 0.3815155029296875, 0.39340972900390625, 0.405303955078125, 0.41719818115234375, 0.4290924072265625, 0.44098663330078125, 0.452880859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 10.0, 12.0, 24.0, 52.0, 103.0, 202.0, 258.0, 167.0, 86.0, 36.0, 21.0, 14.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-11.689427375793457, -11.461386680603027, -11.233345031738281, -11.005304336547852, -10.777262687683105, -10.549221992492676, -10.32118034362793, -10.0931396484375, -9.865097999572754, -9.637057304382324, -9.409015655517578, -9.180974960327148, -8.952933311462402, -8.724892616271973, -8.496850967407227, -8.268810272216797, -8.040769577026367, -7.812728404998779, -7.584687232971191, -7.3566460609436035, -7.128604888916016, -6.900563716888428, -6.67252254486084, -6.44448184967041, -6.216440200805664, -5.988399028778076, -5.760357856750488, -5.5323166847229, -5.3042755126953125, -5.076234340667725, -4.848193168640137, -4.620152473449707, -4.392110347747803, -4.164069175720215, -3.936028003692627, -3.707986831665039, -3.479945659637451, -3.2519044876098633, -3.0238635540008545, -2.7958223819732666, -2.5677812099456787, -2.339740037918091, -2.111698865890503, -1.8836578130722046, -1.6556166410446167, -1.4275754690170288, -1.1995344161987305, -0.9714932441711426, -0.7434520721435547, -0.5154109001159668, -0.2873697876930237, -0.059328675270080566, 0.16871249675750732, 0.3967536687850952, 0.6247947216033936, 0.8528358936309814, 1.0808770656585693, 1.3089182376861572, 1.5369594097137451, 1.7650004625320435, 1.9930416345596313, 2.2210826873779297, 2.4491238594055176, 2.6771650314331055, 2.9052062034606934]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 18.0, 15.0, 23.0, 30.0, 35.0, 23.0, 33.0, 25.0, 44.0, 28.0, 47.0, 51.0, 52.0, 65.0, 51.0, 52.0, 40.0, 43.0, 39.0, 17.0, 35.0, 23.0, 30.0, 17.0, 18.0, 17.0, 14.0, 5.0, 9.0, 7.0, 10.0, 8.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.046013832092285, -1.9810378551483154, -1.9160618782043457, -1.8510857820510864, -1.7861098051071167, -1.721133828163147, -1.6561577320098877, -1.591181755065918, -1.5262057781219482, -1.4612298011779785, -1.3962538242340088, -1.3312777280807495, -1.2663017511367798, -1.20132577419281, -1.1363496780395508, -1.071373701095581, -1.0063977241516113, -0.9414217472076416, -0.8764457106590271, -0.8114696741104126, -0.7464936971664429, -0.6815177202224731, -0.6165416836738586, -0.5515656471252441, -0.4865896701812744, -0.4216136634349823, -0.3566376566886902, -0.29166164994239807, -0.22668564319610596, -0.16170963644981384, -0.09673362970352173, -0.031757622957229614, 0.0332183837890625, 0.09819439053535461, 0.16317039728164673, 0.22814640402793884, 0.29312241077423096, 0.35809841752052307, 0.4230744242668152, 0.4880504310131073, 0.5530264377593994, 0.6180024147033691, 0.6829784512519836, 0.7479544878005981, 0.8129304647445679, 0.8779064416885376, 0.9428824782371521, 1.0078585147857666, 1.0728344917297363, 1.137810468673706, 1.2027864456176758, 1.267762541770935, 1.3327385187149048, 1.3977144956588745, 1.4626905918121338, 1.5276665687561035, 1.5926425457000732, 1.657618522644043, 1.7225944995880127, 1.787570595741272, 1.8525465726852417, 1.9175225496292114, 1.9824986457824707, 2.0474746227264404, 2.11245059967041]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 7.0, 5.0, 10.0, 5.0, 10.0, 17.0, 31.0, 47.0, 74.0, 132.0, 234.0, 453.0, 857.0, 1784.0, 4133.0, 11067.0, 34835.0, 145195.0, 606868.0, 180520.0, 41037.0, 12549.0, 4658.0, 2014.0, 910.0, 496.0, 255.0, 148.0, 79.0, 55.0, 29.0, 24.0, 10.0, 6.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139404296875, -0.13262557983398438, -0.12584686279296875, -0.11906814575195312, -0.1122894287109375, -0.10551071166992188, -0.09873199462890625, -0.09195327758789062, -0.085174560546875, -0.07839584350585938, -0.07161712646484375, -0.06483840942382812, -0.0580596923828125, -0.051280975341796875, -0.04450225830078125, -0.037723541259765625, -0.03094482421875, -0.024166107177734375, -0.01738739013671875, -0.010608673095703125, -0.0038299560546875, 0.002948760986328125, 0.00972747802734375, 0.016506195068359375, 0.023284912109375, 0.030063629150390625, 0.03684234619140625, 0.043621063232421875, 0.0503997802734375, 0.057178497314453125, 0.06395721435546875, 0.07073593139648438, 0.0775146484375, 0.08429336547851562, 0.09107208251953125, 0.09785079956054688, 0.1046295166015625, 0.11140823364257812, 0.11818695068359375, 0.12496566772460938, 0.131744384765625, 0.13852310180664062, 0.14530181884765625, 0.15208053588867188, 0.1588592529296875, 0.16563796997070312, 0.17241668701171875, 0.17919540405273438, 0.18597412109375, 0.19275283813476562, 0.19953155517578125, 0.20631027221679688, 0.2130889892578125, 0.21986770629882812, 0.22664642333984375, 0.23342514038085938, 0.240203857421875, 0.24698257446289062, 0.25376129150390625, 0.2605400085449219, 0.2673187255859375, 0.2740974426269531, 0.28087615966796875, 0.2876548767089844, 0.29443359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 3.0, 12.0, 12.0, 22.0, 21.0, 21.0, 23.0, 33.0, 33.0, 49.0, 50.0, 57.0, 51.0, 59.0, 63.0, 67.0, 60.0, 61.0, 40.0, 39.0, 33.0, 30.0, 23.0, 18.0, 24.0, 20.0, 13.0, 13.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2159423828125, -0.20929527282714844, -0.20264816284179688, -0.1960010528564453, -0.18935394287109375, -0.1827068328857422, -0.17605972290039062, -0.16941261291503906, -0.1627655029296875, -0.15611839294433594, -0.14947128295898438, -0.1428241729736328, -0.13617706298828125, -0.1295299530029297, -0.12288284301757812, -0.11623573303222656, -0.109588623046875, -0.10294151306152344, -0.09629440307617188, -0.08964729309082031, -0.08300018310546875, -0.07635307312011719, -0.06970596313476562, -0.06305885314941406, -0.0564117431640625, -0.04976463317871094, -0.043117523193359375, -0.03647041320800781, -0.02982330322265625, -0.023176193237304688, -0.016529083251953125, -0.009881973266601562, -0.00323486328125, 0.0034122467041015625, 0.010059356689453125, 0.016706466674804688, 0.02335357666015625, 0.030000686645507812, 0.036647796630859375, 0.04329490661621094, 0.0499420166015625, 0.05658912658691406, 0.06323623657226562, 0.06988334655761719, 0.07653045654296875, 0.08317756652832031, 0.08982467651367188, 0.09647178649902344, 0.103118896484375, 0.10976600646972656, 0.11641311645507812, 0.12306022644042969, 0.12970733642578125, 0.1363544464111328, 0.14300155639648438, 0.14964866638183594, 0.1562957763671875, 0.16294288635253906, 0.16958999633789062, 0.1762371063232422, 0.18288421630859375, 0.1895313262939453, 0.19617843627929688, 0.20282554626464844, 0.20947265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 10.0, 10.0, 18.0, 27.0, 30.0, 30.0, 43.0, 60.0, 110.0, 146.0, 260.0, 483.0, 979.0, 2443.0, 7386.0, 32771.0, 664987.0, 297607.0, 29973.0, 6668.0, 2313.0, 995.0, 419.0, 268.0, 160.0, 92.0, 54.0, 47.0, 43.0, 30.0, 26.0, 13.0, 9.0, 11.0, 9.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.277587890625, -0.2691688537597656, -0.26074981689453125, -0.2523307800292969, -0.2439117431640625, -0.23549270629882812, -0.22707366943359375, -0.21865463256835938, -0.210235595703125, -0.20181655883789062, -0.19339752197265625, -0.18497848510742188, -0.1765594482421875, -0.16814041137695312, -0.15972137451171875, -0.15130233764648438, -0.14288330078125, -0.13446426391601562, -0.12604522705078125, -0.11762619018554688, -0.1092071533203125, -0.10078811645507812, -0.09236907958984375, -0.08395004272460938, -0.075531005859375, -0.06711196899414062, -0.05869293212890625, -0.050273895263671875, -0.0418548583984375, -0.033435821533203125, -0.02501678466796875, -0.016597747802734375, -0.0081787109375, 0.000240325927734375, 0.00865936279296875, 0.017078399658203125, 0.0254974365234375, 0.033916473388671875, 0.04233551025390625, 0.050754547119140625, 0.059173583984375, 0.06759262084960938, 0.07601165771484375, 0.08443069458007812, 0.0928497314453125, 0.10126876831054688, 0.10968780517578125, 0.11810684204101562, 0.12652587890625, 0.13494491577148438, 0.14336395263671875, 0.15178298950195312, 0.1602020263671875, 0.16862106323242188, 0.17704010009765625, 0.18545913696289062, 0.193878173828125, 0.20229721069335938, 0.21071624755859375, 0.21913528442382812, 0.2275543212890625, 0.23597335815429688, 0.24439239501953125, 0.2528114318847656, 0.26123046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 16.0, 31.0, 25.0, 37.0, 33.0, 35.0, 61.0, 70.0, 70.0, 76.0, 76.0, 73.0, 61.0, 45.0, 36.0, 30.0, 25.0, 19.0, 22.0, 12.0, 5.0, 12.0, 9.0, 11.0, 7.0, 5.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.83251953125, -0.8089370727539062, -0.7853546142578125, -0.7617721557617188, -0.738189697265625, -0.7146072387695312, -0.6910247802734375, -0.6674423217773438, -0.64385986328125, -0.6202774047851562, -0.5966949462890625, -0.5731124877929688, -0.549530029296875, -0.5259475708007812, -0.5023651123046875, -0.47878265380859375, -0.4552001953125, -0.43161773681640625, -0.4080352783203125, -0.38445281982421875, -0.360870361328125, -0.33728790283203125, -0.3137054443359375, -0.29012298583984375, -0.26654052734375, -0.24295806884765625, -0.2193756103515625, -0.19579315185546875, -0.172210693359375, -0.14862823486328125, -0.1250457763671875, -0.10146331787109375, -0.077880859375, -0.05429840087890625, -0.0307159423828125, -0.00713348388671875, 0.016448974609375, 0.04003143310546875, 0.0636138916015625, 0.08719635009765625, 0.11077880859375, 0.13436126708984375, 0.1579437255859375, 0.18152618408203125, 0.205108642578125, 0.22869110107421875, 0.2522735595703125, 0.27585601806640625, 0.2994384765625, 0.32302093505859375, 0.3466033935546875, 0.37018585205078125, 0.393768310546875, 0.41735076904296875, 0.4409332275390625, 0.46451568603515625, 0.48809814453125, 0.5116806030273438, 0.5352630615234375, 0.5588455200195312, 0.582427978515625, 0.6060104370117188, 0.6295928955078125, 0.6531753540039062, 0.6767578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 13.0, 7.0, 8.0, 9.0, 9.0, 28.0, 29.0, 53.0, 61.0, 93.0, 159.0, 228.0, 388.0, 766.0, 1595.0, 3891.0, 11011.0, 43135.0, 776931.0, 170505.0, 26236.0, 7699.0, 2879.0, 1216.0, 625.0, 361.0, 191.0, 119.0, 78.0, 57.0, 36.0, 26.0, 28.0, 10.0, 13.0, 10.0, 11.0, 6.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05914306640625, -0.0573420524597168, -0.055541038513183594, -0.05374002456665039, -0.05193901062011719, -0.050137996673583984, -0.04833698272705078, -0.04653596878051758, -0.044734954833984375, -0.04293394088745117, -0.04113292694091797, -0.039331912994384766, -0.03753089904785156, -0.03572988510131836, -0.033928871154785156, -0.03212785720825195, -0.03032684326171875, -0.028525829315185547, -0.026724815368652344, -0.02492380142211914, -0.023122787475585938, -0.021321773529052734, -0.01952075958251953, -0.017719745635986328, -0.015918731689453125, -0.014117717742919922, -0.012316703796386719, -0.010515689849853516, -0.008714675903320312, -0.006913661956787109, -0.005112648010253906, -0.003311634063720703, -0.0015106201171875, 0.0002903938293457031, 0.0020914077758789062, 0.0038924217224121094, 0.0056934356689453125, 0.007494449615478516, 0.009295463562011719, 0.011096477508544922, 0.012897491455078125, 0.014698505401611328, 0.01649951934814453, 0.018300533294677734, 0.020101547241210938, 0.02190256118774414, 0.023703575134277344, 0.025504589080810547, 0.02730560302734375, 0.029106616973876953, 0.030907630920410156, 0.03270864486694336, 0.03450965881347656, 0.036310672760009766, 0.03811168670654297, 0.03991270065307617, 0.041713714599609375, 0.04351472854614258, 0.04531574249267578, 0.047116756439208984, 0.04891777038574219, 0.05071878433227539, 0.052519798278808594, 0.0543208122253418, 0.056121826171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 8.0, 13.0, 10.0, 22.0, 21.0, 19.0, 33.0, 24.0, 37.0, 64.0, 76.0, 88.0, 79.0, 74.0, 84.0, 61.0, 52.0, 44.0, 28.0, 19.0, 25.0, 20.0, 15.0, 8.0, 9.0, 3.0, 9.0, 3.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.5277957320213318e-05, -2.4568289518356323e-05, -2.385862171649933e-05, -2.3148953914642334e-05, -2.243928611278534e-05, -2.1729618310928345e-05, -2.101995050907135e-05, -2.0310282707214355e-05, -1.960061490535736e-05, -1.8890947103500366e-05, -1.818127930164337e-05, -1.7471611499786377e-05, -1.6761943697929382e-05, -1.6052275896072388e-05, -1.5342608094215393e-05, -1.4632940292358398e-05, -1.3923272490501404e-05, -1.321360468864441e-05, -1.2503936886787415e-05, -1.179426908493042e-05, -1.1084601283073425e-05, -1.037493348121643e-05, -9.665265679359436e-06, -8.955597877502441e-06, -8.245930075645447e-06, -7.536262273788452e-06, -6.8265944719314575e-06, -6.116926670074463e-06, -5.407258868217468e-06, -4.697591066360474e-06, -3.987923264503479e-06, -3.2782554626464844e-06, -2.5685876607894897e-06, -1.8589198589324951e-06, -1.1492520570755005e-06, -4.3958425521850586e-07, 2.7008354663848877e-07, 9.797513484954834e-07, 1.689419150352478e-06, 2.3990869522094727e-06, 3.1087547540664673e-06, 3.818422555923462e-06, 4.5280903577804565e-06, 5.237758159637451e-06, 5.947425961494446e-06, 6.6570937633514404e-06, 7.366761565208435e-06, 8.07642936706543e-06, 8.786097168922424e-06, 9.495764970779419e-06, 1.0205432772636414e-05, 1.0915100574493408e-05, 1.1624768376350403e-05, 1.2334436178207397e-05, 1.3044103980064392e-05, 1.3753771781921387e-05, 1.4463439583778381e-05, 1.5173107385635376e-05, 1.588277518749237e-05, 1.6592442989349365e-05, 1.730211079120636e-05, 1.8011778593063354e-05, 1.872144639492035e-05, 1.9431114196777344e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 9.0, 5.0, 12.0, 17.0, 24.0, 30.0, 56.0, 95.0, 183.0, 324.0, 684.0, 1595.0, 4056.0, 12376.0, 50714.0, 803435.0, 139194.0, 24168.0, 6936.0, 2549.0, 1032.0, 465.0, 232.0, 136.0, 66.0, 59.0, 26.0, 20.0, 15.0, 5.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06637287139892578, -0.06414222717285156, -0.061911582946777344, -0.059680938720703125, -0.057450294494628906, -0.05521965026855469, -0.05298900604248047, -0.05075836181640625, -0.04852771759033203, -0.04629707336425781, -0.044066429138183594, -0.041835784912109375, -0.039605140686035156, -0.03737449645996094, -0.03514385223388672, -0.0329132080078125, -0.03068256378173828, -0.028451919555664062, -0.026221275329589844, -0.023990631103515625, -0.021759986877441406, -0.019529342651367188, -0.01729869842529297, -0.01506805419921875, -0.012837409973144531, -0.010606765747070312, -0.008376121520996094, -0.006145477294921875, -0.003914833068847656, -0.0016841888427734375, 0.0005464553833007812, 0.002777099609375, 0.005007743835449219, 0.0072383880615234375, 0.009469032287597656, 0.011699676513671875, 0.013930320739746094, 0.016160964965820312, 0.01839160919189453, 0.02062225341796875, 0.02285289764404297, 0.025083541870117188, 0.027314186096191406, 0.029544830322265625, 0.031775474548339844, 0.03400611877441406, 0.03623676300048828, 0.0384674072265625, 0.04069805145263672, 0.04292869567871094, 0.045159339904785156, 0.047389984130859375, 0.049620628356933594, 0.05185127258300781, 0.05408191680908203, 0.05631256103515625, 0.05854320526123047, 0.06077384948730469, 0.0630044937133789, 0.06523513793945312, 0.06746578216552734, 0.06969642639160156, 0.07192707061767578, 0.07415771484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 19.0, 11.0, 17.0, 25.0, 20.0, 34.0, 57.0, 71.0, 108.0, 168.0, 161.0, 77.0, 68.0, 41.0, 34.0, 17.0, 19.0, 11.0, 10.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13667869567871094, -0.13261032104492188, -0.1285419464111328, -0.12447357177734375, -0.12040519714355469, -0.11633682250976562, -0.11226844787597656, -0.1082000732421875, -0.10413169860839844, -0.10006332397460938, -0.09599494934082031, -0.09192657470703125, -0.08785820007324219, -0.08378982543945312, -0.07972145080566406, -0.075653076171875, -0.07158470153808594, -0.06751632690429688, -0.06344795227050781, -0.05937957763671875, -0.05531120300292969, -0.051242828369140625, -0.04717445373535156, -0.0431060791015625, -0.03903770446777344, -0.034969329833984375, -0.030900955200195312, -0.02683258056640625, -0.022764205932617188, -0.018695831298828125, -0.014627456665039062, -0.01055908203125, -0.0064907073974609375, -0.002422332763671875, 0.0016460418701171875, 0.00571441650390625, 0.009782791137695312, 0.013851165771484375, 0.017919540405273438, 0.0219879150390625, 0.026056289672851562, 0.030124664306640625, 0.03419303894042969, 0.03826141357421875, 0.04232978820800781, 0.046398162841796875, 0.05046653747558594, 0.054534912109375, 0.05860328674316406, 0.06267166137695312, 0.06674003601074219, 0.07080841064453125, 0.07487678527832031, 0.07894515991210938, 0.08301353454589844, 0.0870819091796875, 0.09115028381347656, 0.09521865844726562, 0.09928703308105469, 0.10335540771484375, 0.10742378234863281, 0.11149215698242188, 0.11556053161621094, 0.11962890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 12.0, 22.0, 83.0, 414.0, 313.0, 68.0, 37.0, 20.0, 9.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763082981109619, -2.6244237422943115, -2.485764741897583, -2.3471055030822754, -2.208446502685547, -2.0697872638702393, -1.9311280250549316, -1.7924689054489136, -1.6538097858428955, -1.5151506662368774, -1.3764915466308594, -1.2378323078155518, -1.0991731882095337, -0.9605140686035156, -0.8218548893928528, -0.6831957101821899, -0.5445365905761719, -0.4058774411678314, -0.26721829175949097, -0.1285591423511505, 0.010100007057189941, 0.148759126663208, 0.28741830587387085, 0.4260774850845337, 0.5647366046905518, 0.7033957242965698, 0.8420549035072327, 0.9807140827178955, 1.1193732023239136, 1.2580323219299316, 1.3966915607452393, 1.5353506803512573, 1.6740102767944336, 1.8126693964004517, 1.9513285160064697, 2.0899877548217773, 2.228646755218506, 2.3673059940338135, 2.505965232849121, 2.6446242332458496, 2.7832834720611572, 2.921942710876465, 3.0606017112731934, 3.199260950088501, 3.3379201889038086, 3.476579189300537, 3.6152384281158447, 3.7538976669311523, 3.892556667327881, 4.031215667724609, 4.169875144958496, 4.308534145355225, 4.447193145751953, 4.58585262298584, 4.724511623382568, 4.863170623779297, 5.001830101013184, 5.140489101409912, 5.279148578643799, 5.417807579040527, 5.556466579437256, 5.695125579833984, 5.833785057067871, 5.9724440574646, 6.111103057861328]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 4.0, 10.0, 10.0, 10.0, 7.0, 15.0, 14.0, 13.0, 16.0, 30.0, 41.0, 92.0, 175.0, 190.0, 82.0, 43.0, 35.0, 34.0, 21.0, 22.0, 23.0, 15.0, 21.0, 11.0, 10.0, 8.0, 14.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.523611545562744, -2.449512004852295, -2.375412702560425, -2.3013131618499756, -2.2272136211395264, -2.153114080429077, -2.079014778137207, -2.004915237426758, -1.9308156967163086, -1.856716275215149, -1.7826167345046997, -1.70851731300354, -1.6344177722930908, -1.5603183507919312, -1.4862189292907715, -1.4121193885803223, -1.3380199670791626, -1.263920545578003, -1.1898210048675537, -1.115721583366394, -1.0416220426559448, -0.9675226211547852, -0.8934231400489807, -0.8193236589431763, -0.7452241778373718, -0.6711246967315674, -0.5970252156257629, -0.5229257345199585, -0.44882628321647644, -0.374726802110672, -0.30062735080718994, -0.2265278697013855, -0.15242838859558105, -0.07832891494035721, -0.004229441285133362, 0.06987002491950989, 0.14396950602531433, 0.21806898713111877, 0.29216843843460083, 0.3662679195404053, 0.4403674006462097, 0.5144668817520142, 0.5885663628578186, 0.662665843963623, 0.7367652654647827, 0.8108648061752319, 0.8849642276763916, 0.959063708782196, 1.0331631898880005, 1.1072626113891602, 1.1813621520996094, 1.255461573600769, 1.3295611143112183, 1.403660535812378, 1.4777600765228271, 1.5518594980239868, 1.6259589195251465, 1.7000583410263062, 1.7741578817367554, 1.848257303237915, 1.9223568439483643, 1.996456265449524, 2.0705556869506836, 2.144655227661133, 2.218754768371582]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 2.0, 17.0, 7.0, 12.0, 20.0, 14.0, 8.0, 28.0, 28.0, 44.0, 32.0, 45.0, 50.0, 121.0, 172.0, 90.0, 46.0, 41.0, 37.0, 35.0, 27.0, 17.0, 18.0, 11.0, 12.0, 14.0, 7.0, 11.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2016143798828125, -0.194732666015625, -0.1878509521484375, -0.18096923828125, -0.1740875244140625, -0.167205810546875, -0.1603240966796875, -0.1534423828125, -0.1465606689453125, -0.139678955078125, -0.1327972412109375, -0.12591552734375, -0.1190338134765625, -0.112152099609375, -0.1052703857421875, -0.098388671875, -0.0915069580078125, -0.084625244140625, -0.0777435302734375, -0.07086181640625, -0.0639801025390625, -0.057098388671875, -0.0502166748046875, -0.0433349609375, -0.0364532470703125, -0.029571533203125, -0.0226898193359375, -0.01580810546875, -0.0089263916015625, -0.002044677734375, 0.0048370361328125, 0.01171875, 0.0186004638671875, 0.025482177734375, 0.0323638916015625, 0.03924560546875, 0.0461273193359375, 0.053009033203125, 0.0598907470703125, 0.0667724609375, 0.0736541748046875, 0.080535888671875, 0.0874176025390625, 0.09429931640625, 0.1011810302734375, 0.108062744140625, 0.1149444580078125, 0.121826171875, 0.1287078857421875, 0.135589599609375, 0.1424713134765625, 0.14935302734375, 0.1562347412109375, 0.163116455078125, 0.1699981689453125, 0.1768798828125, 0.1837615966796875, 0.190643310546875, 0.1975250244140625, 0.20440673828125, 0.2112884521484375, 0.218170166015625, 0.2250518798828125, 0.23193359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 10.0, 6.0, 15.0, 17.0, 25.0, 27.0, 44.0, 83.0, 149.0, 253.0, 599.0, 1613.0, 4864.0, 28140.0, 8319679.0, 25565.0, 4759.0, 1555.0, 546.0, 239.0, 142.0, 69.0, 44.0, 24.0, 30.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.9834104180335999, -0.9500563144683838, -0.916702151298523, -0.8833479881286621, -0.849993884563446, -0.81663978099823, -0.7832856178283691, -0.7499314546585083, -0.7165773510932922, -0.6832232475280762, -0.6498690843582153, -0.6165149211883545, -0.5831608176231384, -0.5498067140579224, -0.5164525508880615, -0.48309841752052307, -0.4497442841529846, -0.41639015078544617, -0.3830360174179077, -0.34968188405036926, -0.3163277506828308, -0.28297361731529236, -0.2496194839477539, -0.21626535058021545, -0.182911217212677, -0.14955708384513855, -0.1162029504776001, -0.08284881711006165, -0.04949468374252319, -0.01614055037498474, 0.01721358299255371, 0.05056771636009216, 0.08392179012298584, 0.11727592349052429, 0.15063005685806274, 0.1839841902256012, 0.21733832359313965, 0.2506924569606781, 0.28404659032821655, 0.317400723695755, 0.35075485706329346, 0.3841089904308319, 0.41746312379837036, 0.4508172571659088, 0.48417139053344727, 0.5175255537033081, 0.5508796572685242, 0.5842337608337402, 0.6175879240036011, 0.6509420871734619, 0.684296190738678, 0.717650294303894, 0.7510044574737549, 0.7843586206436157, 0.8177127242088318, 0.8510668277740479, 0.8844209909439087, 0.9177751541137695, 0.9511292576789856, 0.9844833612442017, 1.0178375244140625, 1.0511916875839233, 1.0845458507537842, 1.1178998947143555, 1.1512540578842163]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 4.0, 10.0, 0.0, 7.0, 4.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4420177936553955, -2.377901792526245, -2.3137857913970947, -2.2496697902679443, -2.185553550720215, -2.1214375495910645, -2.057321548461914, -1.9932055473327637, -1.9290895462036133, -1.864973545074463, -1.8008575439453125, -1.7367414236068726, -1.6726254224777222, -1.6085094213485718, -1.5443933010101318, -1.4802772998809814, -1.416161298751831, -1.3520452976226807, -1.2879292964935303, -1.2238131761550903, -1.15969717502594, -1.0955811738967896, -1.0314650535583496, -0.9673490524291992, -0.9032330513000488, -0.8391170501708984, -0.7750009894371033, -0.7108849287033081, -0.6467689275741577, -0.5826529264450073, -0.5185368657112122, -0.4544208347797394, -0.3903048038482666, -0.3261887729167938, -0.26207274198532104, -0.19795671105384827, -0.1338406801223755, -0.06972464919090271, -0.005608618259429932, 0.05850741267204285, 0.12262344360351562, 0.1867394745349884, 0.2508555054664612, 0.31497153639793396, 0.37908756732940674, 0.4432035982608795, 0.5073196291923523, 0.5714356899261475, 0.6355516910552979, 0.6996676921844482, 0.7637837529182434, 0.8278998136520386, 0.892015814781189, 0.9561318159103394, 1.0202479362487793, 1.0843639373779297, 1.14847993850708, 1.2125959396362305, 1.2767119407653809, 1.3408280611038208, 1.4049440622329712, 1.4690600633621216, 1.5331761837005615, 1.597292184829712, 1.6614081859588623]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 12.0, 15.0, 10.0, 13.0, 19.0, 29.0, 19.0, 53.0, 50.0, 61.0, 67.0, 73.0, 66.0, 73.0, 61.0, 72.0, 52.0, 37.0, 41.0, 33.0, 23.0, 27.0, 19.0, 20.0, 8.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.2451915740966797, -0.23818588256835938, -0.23118019104003906, -0.22417449951171875, -0.21716880798339844, -0.21016311645507812, -0.2031574249267578, -0.1961517333984375, -0.1891460418701172, -0.18214035034179688, -0.17513465881347656, -0.16812896728515625, -0.16112327575683594, -0.15411758422851562, -0.1471118927001953, -0.140106201171875, -0.1331005096435547, -0.12609481811523438, -0.11908912658691406, -0.11208343505859375, -0.10507774353027344, -0.09807205200195312, -0.09106636047363281, -0.0840606689453125, -0.07705497741699219, -0.07004928588867188, -0.06304359436035156, -0.05603790283203125, -0.04903221130371094, -0.042026519775390625, -0.03502082824707031, -0.02801513671875, -0.021009445190429688, -0.014003753662109375, -0.0069980621337890625, 7.62939453125e-06, 0.0070133209228515625, 0.014019012451171875, 0.021024703979492188, 0.0280303955078125, 0.03503608703613281, 0.042041778564453125, 0.04904747009277344, 0.05605316162109375, 0.06305885314941406, 0.07006454467773438, 0.07707023620605469, 0.084075927734375, 0.09108161926269531, 0.09808731079101562, 0.10509300231933594, 0.11209869384765625, 0.11910438537597656, 0.12611007690429688, 0.1331157684326172, 0.1401214599609375, 0.1471271514892578, 0.15413284301757812, 0.16113853454589844, 0.16814422607421875, 0.17514991760253906, 0.18215560913085938, 0.1891613006591797, 0.1961669921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 14.0, 23.0, 39.0, 44.0, 72.0, 87.0, 172.0, 287.0, 504.0, 897.0, 1760.0, 3382.0, 6829.0, 14535.0, 31699.0, 69050.0, 132932.0, 133537.0, 68603.0, 30965.0, 14308.0, 6928.0, 3462.0, 1791.0, 913.0, 542.0, 297.0, 214.0, 118.0, 63.0, 47.0, 40.0, 28.0, 18.0, 8.0, 9.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.884765625, -0.8601913452148438, -0.8356170654296875, -0.8110427856445312, -0.786468505859375, -0.7618942260742188, -0.7373199462890625, -0.7127456665039062, -0.68817138671875, -0.6635971069335938, -0.6390228271484375, -0.6144485473632812, -0.589874267578125, -0.5652999877929688, -0.5407257080078125, -0.5161514282226562, -0.4915771484375, -0.46700286865234375, -0.4424285888671875, -0.41785430908203125, -0.393280029296875, -0.36870574951171875, -0.3441314697265625, -0.31955718994140625, -0.29498291015625, -0.27040863037109375, -0.2458343505859375, -0.22126007080078125, -0.196685791015625, -0.17211151123046875, -0.1475372314453125, -0.12296295166015625, -0.098388671875, -0.07381439208984375, -0.0492401123046875, -0.02466583251953125, -9.1552734375e-05, 0.02448272705078125, 0.0490570068359375, 0.07363128662109375, 0.09820556640625, 0.12277984619140625, 0.1473541259765625, 0.17192840576171875, 0.196502685546875, 0.22107696533203125, 0.2456512451171875, 0.27022552490234375, 0.2947998046875, 0.31937408447265625, 0.3439483642578125, 0.36852264404296875, 0.393096923828125, 0.41767120361328125, 0.4422454833984375, 0.46681976318359375, 0.49139404296875, 0.5159683227539062, 0.5405426025390625, 0.5651168823242188, 0.589691162109375, 0.6142654418945312, 0.6388397216796875, 0.6634140014648438, 0.68798828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 3.0, 8.0, 20.0, 29.0, 33.0, 45.0, 59.0, 70.0, 85.0, 102.0, 100.0, 95.0, 84.0, 55.0, 59.0, 51.0, 34.0, 28.0, 14.0, 7.0, 13.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.3847827911376953, -0.3755226135253906, -0.36626243591308594, -0.35700225830078125, -0.34774208068847656, -0.3384819030761719, -0.3292217254638672, -0.3199615478515625, -0.3107013702392578, -0.3014411926269531, -0.29218101501464844, -0.28292083740234375, -0.27366065979003906, -0.2644004821777344, -0.2551403045654297, -0.245880126953125, -0.2366199493408203, -0.22735977172851562, -0.21809959411621094, -0.20883941650390625, -0.19957923889160156, -0.19031906127929688, -0.1810588836669922, -0.1717987060546875, -0.1625385284423828, -0.15327835083007812, -0.14401817321777344, -0.13475799560546875, -0.12549781799316406, -0.11623764038085938, -0.10697746276855469, -0.09771728515625, -0.08845710754394531, -0.07919692993164062, -0.06993675231933594, -0.06067657470703125, -0.05141639709472656, -0.042156219482421875, -0.03289604187011719, -0.0236358642578125, -0.014375686645507812, -0.005115509033203125, 0.0041446685791015625, 0.01340484619140625, 0.022665023803710938, 0.031925201416015625, 0.04118537902832031, 0.050445556640625, 0.05970573425292969, 0.06896591186523438, 0.07822608947753906, 0.08748626708984375, 0.09674644470214844, 0.10600662231445312, 0.11526679992675781, 0.1245269775390625, 0.1337871551513672, 0.14304733276367188, 0.15230751037597656, 0.16156768798828125, 0.17082786560058594, 0.18008804321289062, 0.1893482208251953, 0.1986083984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 19.0, 70.0, 171.0, 124.0, 30.0, 16.0, 9.0, 9.0, 2.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.052302837371826, -2.983961343765259, -2.9156198501586914, -2.847278356552124, -2.7789368629455566, -2.7105953693389893, -2.642253875732422, -2.5739126205444336, -2.505570888519287, -2.4372293949127197, -2.3688879013061523, -2.300546407699585, -2.2322049140930176, -2.16386342048645, -2.095521926879883, -2.0271806716918945, -1.9588391780853271, -1.8904976844787598, -1.8221561908721924, -1.753814697265625, -1.6854732036590576, -1.6171317100524902, -1.5487903356552124, -1.480448842048645, -1.4121073484420776, -1.3437658548355103, -1.2754243612289429, -1.2070828676223755, -1.1387414932250977, -1.0703999996185303, -1.002058506011963, -0.9337170124053955, -0.8653757572174072, -0.7970342636108398, -0.7286927700042725, -0.6603513360023499, -0.5920098423957825, -0.5236683487892151, -0.4553268849849701, -0.3869854211807251, -0.3186439275741577, -0.25030243396759033, -0.18196097016334534, -0.11361949145793915, -0.04527801275253296, 0.023063480854034424, 0.09140494465827942, 0.15974640846252441, 0.2280879020690918, 0.2964293956756592, 0.3647708594799042, 0.43311232328414917, 0.5014538168907166, 0.5697953104972839, 0.6381367444992065, 0.7064782381057739, 0.7748197317123413, 0.8431612253189087, 0.9115027189254761, 0.9798441529273987, 1.0481855869293213, 1.1165270805358887, 1.184868574142456, 1.2532100677490234, 1.3215515613555908]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 1.0, 2.0, 12.0, 6.0, 12.0, 20.0, 47.0, 112.0, 107.0, 71.0, 23.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0941205024719238, -1.0543020963668823, -1.0144836902618408, -0.9746652841567993, -0.9348468780517578, -0.8950284719467163, -0.8552101254463196, -0.8153917193412781, -0.7755733132362366, -0.7357549071311951, -0.6959365010261536, -0.6561180949211121, -0.6162997484207153, -0.5764813423156738, -0.5366629362106323, -0.4968445301055908, -0.4570261240005493, -0.4172077178955078, -0.3773893117904663, -0.3375709354877472, -0.2977525293827057, -0.2579341232776642, -0.21811573207378387, -0.17829734086990356, -0.13847893476486206, -0.09866053611040115, -0.05884213745594025, -0.01902373880147934, 0.020794659852981567, 0.06061306595802307, 0.10043145716190338, 0.1402498483657837, 0.18006813526153564, 0.21988654136657715, 0.25970494747161865, 0.29952332377433777, 0.3393417298793793, 0.3791601359844208, 0.4189785122871399, 0.4587969183921814, 0.4986153244972229, 0.5384337306022644, 0.5782521367073059, 0.6180705428123474, 0.6578888893127441, 0.6977072954177856, 0.7375257015228271, 0.7773441076278687, 0.8171625137329102, 0.8569809198379517, 0.8967993259429932, 0.9366177320480347, 0.9764361381530762, 1.0162545442581177, 1.0560729503631592, 1.0958912372589111, 1.1357097625732422, 1.1755281686782837, 1.2153465747833252, 1.2551649808883667, 1.2949833869934082, 1.3348017930984497, 1.3746201992034912, 1.4144384860992432, 1.4542568922042847]}, "eval/loss": 0.3589690625667572, "eval/wer": 0.09641015470051567, "eval/runtime": 570.6282, "eval/samples_per_second": 4.63, "eval/steps_per_second": 0.58, "train/train_runtime": 51756.4072, "train/train_samples_per_second": 5.514, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 1.290548439615828} \ No newline at end of file +{"train/loss": 0.0134, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 10.0, "train/global_step": 2230, "_runtime": 52767, "_timestamp": 1648367457, "_step": 2235, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 30.0, 111.0, 200.0, 305.0, 216.0, 87.0, 40.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3592593669891357, -2.3074288368225098, -2.255598545074463, -2.203768014907837, -2.151937484741211, -2.100106954574585, -2.048276662826538, -1.996446132659912, -1.9446156024932861, -1.8927851915359497, -1.8409546613693237, -1.7891242504119873, -1.7372937202453613, -1.685463309288025, -1.633632779121399, -1.5818023681640625, -1.5299718379974365, -1.4781414270401, -1.4263108968734741, -1.3744804859161377, -1.3226499557495117, -1.2708195447921753, -1.2189890146255493, -1.167158603668213, -1.1153281927108765, -1.06349778175354, -1.011667251586914, -0.9598367810249329, -0.9080063104629517, -0.8561758995056152, -0.8043453693389893, -0.7525149583816528, -0.7006843686103821, -0.6488538980484009, -0.5970234274864197, -0.5451929569244385, -0.4933624863624573, -0.44153204560279846, -0.38970157504081726, -0.33787110447883606, -0.28604063391685486, -0.23421016335487366, -0.18237969279289246, -0.13054923713207245, -0.07871876657009125, -0.02688831090927124, 0.02494215965270996, 0.07677263021469116, 0.12860310077667236, 0.18043357133865356, 0.23226404190063477, 0.28409451246261597, 0.33592498302459717, 0.387755423784256, 0.4395858943462372, 0.4914163649082184, 0.543246865272522, 0.5950773358345032, 0.6469078063964844, 0.6987382769584656, 0.7505687475204468, 0.8023991584777832, 0.8542296886444092, 0.9060600996017456, 0.9578905701637268]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 19.0, 22.0, 24.0, 39.0, 22.0, 38.0, 43.0, 41.0, 48.0, 48.0, 49.0, 51.0, 56.0, 44.0, 49.0, 42.0, 36.0, 39.0, 35.0, 28.0, 34.0, 18.0, 24.0, 25.0, 18.0, 17.0, 13.0, 6.0, 10.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4530882239341736, -0.4375229775905609, -0.42195773124694824, -0.40639248490333557, -0.3908272385597229, -0.37526199221611023, -0.35969674587249756, -0.3441315293312073, -0.3285662531852722, -0.31300100684165955, -0.2974357604980469, -0.2818705141544342, -0.26630526781082153, -0.25074002146720886, -0.23517479002475739, -0.21960954368114471, -0.20404431223869324, -0.18847906589508057, -0.1729138195514679, -0.15734857320785522, -0.14178332686424255, -0.12621808052062988, -0.1106528490781784, -0.09508760273456573, -0.07952235639095306, -0.0639571100473404, -0.04839186742901802, -0.03282662481069565, -0.017261378467082977, -0.0016961321234703064, 0.013869106769561768, 0.02943435311317444, 0.04499959945678711, 0.06056484580039978, 0.07613009214401245, 0.09169533103704453, 0.1072605773806572, 0.12282582372426987, 0.13839106261730194, 0.1539563089609146, 0.16952155530452728, 0.18508680164813995, 0.20065204799175262, 0.2162172794342041, 0.23178252577781677, 0.24734777212142944, 0.2629130184650421, 0.2784782648086548, 0.29404351115226746, 0.3096087574958801, 0.3251740038394928, 0.34073925018310547, 0.35630449652671814, 0.3718697428703308, 0.3874349594116211, 0.40300023555755615, 0.41856545209884644, 0.4341306984424591, 0.4496959447860718, 0.46526119112968445, 0.4808264374732971, 0.4963916838169098, 0.5119569301605225, 0.5275221467018127, 0.5430874228477478]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 14.0, 13.0, 14.0, 21.0, 30.0, 36.0, 48.0, 62.0, 98.0, 147.0, 212.0, 322.0, 507.0, 747.0, 1173.0, 1811.0, 3182.0, 6017.0, 12088.0, 30614.0, 128466.0, 602238.0, 2024053.0, 1052782.0, 239315.0, 55238.0, 17617.0, 7380.0, 3974.0, 2237.0, 1354.0, 854.0, 546.0, 349.0, 221.0, 154.0, 102.0, 71.0, 47.0, 35.0, 37.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.86083984375, -0.835296630859375, -0.80975341796875, -0.784210205078125, -0.7586669921875, -0.733123779296875, -0.70758056640625, -0.682037353515625, -0.656494140625, -0.630950927734375, -0.60540771484375, -0.579864501953125, -0.5543212890625, -0.528778076171875, -0.50323486328125, -0.477691650390625, -0.4521484375, -0.426605224609375, -0.40106201171875, -0.375518798828125, -0.3499755859375, -0.324432373046875, -0.29888916015625, -0.273345947265625, -0.247802734375, -0.222259521484375, -0.19671630859375, -0.171173095703125, -0.1456298828125, -0.120086669921875, -0.09454345703125, -0.069000244140625, -0.04345703125, -0.017913818359375, 0.00762939453125, 0.033172607421875, 0.0587158203125, 0.084259033203125, 0.10980224609375, 0.135345458984375, 0.160888671875, 0.186431884765625, 0.21197509765625, 0.237518310546875, 0.2630615234375, 0.288604736328125, 0.31414794921875, 0.339691162109375, 0.365234375, 0.390777587890625, 0.41632080078125, 0.441864013671875, 0.4674072265625, 0.492950439453125, 0.51849365234375, 0.544036865234375, 0.569580078125, 0.595123291015625, 0.62066650390625, 0.646209716796875, 0.6717529296875, 0.697296142578125, 0.72283935546875, 0.748382568359375, 0.77392578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 2.0, 5.0, 15.0, 16.0, 10.0, 27.0, 24.0, 27.0, 25.0, 40.0, 51.0, 38.0, 33.0, 52.0, 66.0, 52.0, 44.0, 41.0, 41.0, 56.0, 35.0, 50.0, 41.0, 25.0, 27.0, 22.0, 25.0, 16.0, 19.0, 12.0, 14.0, 16.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69384765625, -0.668426513671875, -0.64300537109375, -0.617584228515625, -0.5921630859375, -0.566741943359375, -0.54132080078125, -0.515899658203125, -0.490478515625, -0.465057373046875, -0.43963623046875, -0.414215087890625, -0.3887939453125, -0.363372802734375, -0.33795166015625, -0.312530517578125, -0.287109375, -0.261688232421875, -0.23626708984375, -0.210845947265625, -0.1854248046875, -0.160003662109375, -0.13458251953125, -0.109161376953125, -0.083740234375, -0.058319091796875, -0.03289794921875, -0.007476806640625, 0.0179443359375, 0.043365478515625, 0.06878662109375, 0.094207763671875, 0.11962890625, 0.145050048828125, 0.17047119140625, 0.195892333984375, 0.2213134765625, 0.246734619140625, 0.27215576171875, 0.297576904296875, 0.322998046875, 0.348419189453125, 0.37384033203125, 0.399261474609375, 0.4246826171875, 0.450103759765625, 0.47552490234375, 0.500946044921875, 0.5263671875, 0.551788330078125, 0.57720947265625, 0.602630615234375, 0.6280517578125, 0.653472900390625, 0.67889404296875, 0.704315185546875, 0.729736328125, 0.755157470703125, 0.78057861328125, 0.805999755859375, 0.8314208984375, 0.856842041015625, 0.88226318359375, 0.907684326171875, 0.93310546875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 19.0, 37.0, 79.0, 590.0, 4178993.0, 14102.0, 338.0, 69.0, 27.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.251220703125, -16.42431640625, -15.597412109375, -14.7705078125, -13.943603515625, -13.11669921875, -12.289794921875, -11.462890625, -10.635986328125, -9.80908203125, -8.982177734375, -8.1552734375, -7.328369140625, -6.50146484375, -5.674560546875, -4.84765625, -4.020751953125, -3.19384765625, -2.366943359375, -1.5400390625, -0.713134765625, 0.11376953125, 0.940673828125, 1.767578125, 2.594482421875, 3.42138671875, 4.248291015625, 5.0751953125, 5.902099609375, 6.72900390625, 7.555908203125, 8.3828125, 9.209716796875, 10.03662109375, 10.863525390625, 11.6904296875, 12.517333984375, 13.34423828125, 14.171142578125, 14.998046875, 15.824951171875, 16.65185546875, 17.478759765625, 18.3056640625, 19.132568359375, 19.95947265625, 20.786376953125, 21.61328125, 22.440185546875, 23.26708984375, 24.093994140625, 24.9208984375, 25.747802734375, 26.57470703125, 27.401611328125, 28.228515625, 29.055419921875, 29.88232421875, 30.709228515625, 31.5361328125, 32.363037109375, 33.18994140625, 34.016845703125, 34.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 29.0, 38.0, 139.0, 570.0, 2697.0, 421.0, 114.0, 35.0, 13.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9287796020507812, -0.8922271728515625, -0.8556747436523438, -0.819122314453125, -0.7825698852539062, -0.7460174560546875, -0.7094650268554688, -0.67291259765625, -0.6363601684570312, -0.5998077392578125, -0.5632553100585938, -0.526702880859375, -0.49015045166015625, -0.4535980224609375, -0.41704559326171875, -0.3804931640625, -0.34394073486328125, -0.3073883056640625, -0.27083587646484375, -0.234283447265625, -0.19773101806640625, -0.1611785888671875, -0.12462615966796875, -0.08807373046875, -0.05152130126953125, -0.0149688720703125, 0.02158355712890625, 0.058135986328125, 0.09468841552734375, 0.1312408447265625, 0.16779327392578125, 0.204345703125, 0.24089813232421875, 0.2774505615234375, 0.31400299072265625, 0.350555419921875, 0.38710784912109375, 0.4236602783203125, 0.46021270751953125, 0.49676513671875, 0.5333175659179688, 0.5698699951171875, 0.6064224243164062, 0.642974853515625, 0.6795272827148438, 0.7160797119140625, 0.7526321411132812, 0.7891845703125, 0.8257369995117188, 0.8622894287109375, 0.8988418579101562, 0.935394287109375, 0.9719467163085938, 1.0084991455078125, 1.0450515747070312, 1.08160400390625, 1.1181564331054688, 1.1547088623046875, 1.1912612915039062, 1.227813720703125, 1.2643661499023438, 1.3009185791015625, 1.3374710083007812, 1.3740234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 11.0, 13.0, 15.0, 18.0, 31.0, 30.0, 35.0, 51.0, 69.0, 69.0, 78.0, 91.0, 106.0, 73.0, 57.0, 56.0, 46.0, 29.0, 34.0, 18.0, 14.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1353092193603516, -1.1050784587860107, -1.0748478174209595, -1.0446170568466187, -1.0143862962722778, -0.9841555953025818, -0.9539248943328857, -0.9236941337585449, -0.8934634327888489, -0.8632327318191528, -0.833001971244812, -0.802771270275116, -0.7725405693054199, -0.7423098087310791, -0.7120791077613831, -0.681848406791687, -0.6516176462173462, -0.6213869452476501, -0.5911561846733093, -0.5609254837036133, -0.5306947231292725, -0.5004640221595764, -0.47023332118988037, -0.44000259041786194, -0.4097718596458435, -0.3795411288738251, -0.34931039810180664, -0.3190796971321106, -0.28884896636009216, -0.25861823558807373, -0.2283875197172165, -0.19815680384635925, -0.16792601346969604, -0.1376952826976776, -0.10746456682682037, -0.07723384350538254, -0.0470031201839447, -0.01677238941192627, 0.01345832645893097, 0.04368904232978821, 0.07391977310180664, 0.10415049642324448, 0.1343812197446823, 0.16461193561553955, 0.19484266638755798, 0.22507339715957642, 0.25530409812927246, 0.2855348289012909, 0.3157655596733093, 0.34599629044532776, 0.3762270212173462, 0.40645772218704224, 0.43668845295906067, 0.4669191837310791, 0.49714988470077515, 0.5273805856704712, 0.557611346244812, 0.5878420472145081, 0.6180728077888489, 0.6483035087585449, 0.6785342693328857, 0.7087649703025818, 0.7389956712722778, 0.7692264318466187, 0.7994571328163147]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 8.0, 10.0, 8.0, 11.0, 26.0, 22.0, 29.0, 32.0, 23.0, 43.0, 37.0, 45.0, 41.0, 28.0, 50.0, 45.0, 46.0, 40.0, 44.0, 47.0, 35.0, 44.0, 53.0, 28.0, 36.0, 24.0, 25.0, 21.0, 9.0, 17.0, 11.0, 20.0, 9.0, 7.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6483617424964905, -0.6281723380088806, -0.607982873916626, -0.5877934694290161, -0.5676040053367615, -0.5474146008491516, -0.527225136756897, -0.5070357322692871, -0.48684626817703247, -0.4666568338871002, -0.44646739959716797, -0.4262779653072357, -0.40608853101730347, -0.3858990967273712, -0.36570966243743896, -0.3455202579498291, -0.32533082365989685, -0.3051413893699646, -0.28495195508003235, -0.2647625207901001, -0.24457308650016785, -0.2243836522102356, -0.20419423282146454, -0.1840047985315323, -0.16381536424160004, -0.14362592995166779, -0.12343649566173553, -0.10324706882238388, -0.08305763453245163, -0.06286820024251938, -0.042678773403167725, -0.022489339113235474, -0.0022999048233032227, 0.01788952760398388, 0.03807896003127098, 0.05826839059591293, 0.07845782488584518, 0.09864725917577744, 0.11883668601512909, 0.13902612030506134, 0.1592155545949936, 0.17940498888492584, 0.1995944231748581, 0.21978384256362915, 0.2399732768535614, 0.26016271114349365, 0.2803521454334259, 0.30054157972335815, 0.3207310140132904, 0.34092044830322266, 0.3611098825931549, 0.38129931688308716, 0.4014887511730194, 0.42167818546295166, 0.4418675899505615, 0.46205705404281616, 0.482246458530426, 0.5024358630180359, 0.5226253271102905, 0.5428147315979004, 0.563004195690155, 0.5831936001777649, 0.6033830642700195, 0.6235724687576294, 0.643761932849884]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 1.0, 7.0, 12.0, 21.0, 28.0, 34.0, 58.0, 73.0, 147.0, 208.0, 310.0, 539.0, 842.0, 1393.0, 2397.0, 4277.0, 7140.0, 12779.0, 23155.0, 42211.0, 77846.0, 141425.0, 236640.0, 218332.0, 125422.0, 68411.0, 37037.0, 20560.0, 11411.0, 6471.0, 3693.0, 2276.0, 1323.0, 760.0, 479.0, 308.0, 183.0, 101.0, 86.0, 43.0, 35.0, 21.0, 19.0, 14.0, 15.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.22359848022460938, -0.21636199951171875, -0.20912551879882812, -0.2018890380859375, -0.19465255737304688, -0.18741607666015625, -0.18017959594726562, -0.172943115234375, -0.16570663452148438, -0.15847015380859375, -0.15123367309570312, -0.1439971923828125, -0.13676071166992188, -0.12952423095703125, -0.12228775024414062, -0.11505126953125, -0.10781478881835938, -0.10057830810546875, -0.09334182739257812, -0.0861053466796875, -0.07886886596679688, -0.07163238525390625, -0.06439590454101562, -0.057159423828125, -0.049922943115234375, -0.04268646240234375, -0.035449981689453125, -0.0282135009765625, -0.020977020263671875, -0.01374053955078125, -0.006504058837890625, 0.000732421875, 0.007968902587890625, 0.01520538330078125, 0.022441864013671875, 0.0296783447265625, 0.036914825439453125, 0.04415130615234375, 0.051387786865234375, 0.058624267578125, 0.06586074829101562, 0.07309722900390625, 0.08033370971679688, 0.0875701904296875, 0.09480667114257812, 0.10204315185546875, 0.10927963256835938, 0.11651611328125, 0.12375259399414062, 0.13098907470703125, 0.13822555541992188, 0.1454620361328125, 0.15269851684570312, 0.15993499755859375, 0.16717147827148438, 0.174407958984375, 0.18164443969726562, 0.18888092041015625, 0.19611740112304688, 0.2033538818359375, 0.21059036254882812, 0.21782684326171875, 0.22506332397460938, 0.2322998046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 32.0, 21.0, 24.0, 29.0, 40.0, 30.0, 44.0, 37.0, 49.0, 35.0, 50.0, 51.0, 61.0, 40.0, 49.0, 45.0, 45.0, 35.0, 30.0, 40.0, 32.0, 22.0, 25.0, 19.0, 9.0, 11.0, 13.0, 11.0, 9.0, 6.0, 9.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.4424400329589844, -0.42833709716796875, -0.4142341613769531, -0.4001312255859375, -0.3860282897949219, -0.37192535400390625, -0.3578224182128906, -0.343719482421875, -0.3296165466308594, -0.31551361083984375, -0.3014106750488281, -0.2873077392578125, -0.2732048034667969, -0.25910186767578125, -0.24499893188476562, -0.23089599609375, -0.21679306030273438, -0.20269012451171875, -0.18858718872070312, -0.1744842529296875, -0.16038131713867188, -0.14627838134765625, -0.13217544555664062, -0.118072509765625, -0.10396957397460938, -0.08986663818359375, -0.07576370239257812, -0.0616607666015625, -0.047557830810546875, -0.03345489501953125, -0.019351959228515625, -0.0052490234375, 0.008853912353515625, 0.02295684814453125, 0.037059783935546875, 0.0511627197265625, 0.06526565551757812, 0.07936859130859375, 0.09347152709960938, 0.107574462890625, 0.12167739868164062, 0.13578033447265625, 0.14988327026367188, 0.1639862060546875, 0.17808914184570312, 0.19219207763671875, 0.20629501342773438, 0.22039794921875, 0.23450088500976562, 0.24860382080078125, 0.2627067565917969, 0.2768096923828125, 0.2909126281738281, 0.30501556396484375, 0.3191184997558594, 0.333221435546875, 0.3473243713378906, 0.36142730712890625, 0.3755302429199219, 0.3896331787109375, 0.4037361145019531, 0.41783905029296875, 0.4319419860839844, 0.446044921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 16.0, 13.0, 30.0, 28.0, 52.0, 66.0, 109.0, 234.0, 364.0, 769.0, 1422.0, 3143.0, 8148.0, 23704.0, 77312.0, 283738.0, 445985.0, 140916.0, 40421.0, 13068.0, 4750.0, 2090.0, 991.0, 468.0, 267.0, 173.0, 94.0, 56.0, 43.0, 23.0, 16.0, 12.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37480926513671875, -0.3624114990234375, -0.35001373291015625, -0.337615966796875, -0.32521820068359375, -0.3128204345703125, -0.30042266845703125, -0.28802490234375, -0.27562713623046875, -0.2632293701171875, -0.25083160400390625, -0.238433837890625, -0.22603607177734375, -0.2136383056640625, -0.20124053955078125, -0.1888427734375, -0.17644500732421875, -0.1640472412109375, -0.15164947509765625, -0.139251708984375, -0.12685394287109375, -0.1144561767578125, -0.10205841064453125, -0.08966064453125, -0.07726287841796875, -0.0648651123046875, -0.05246734619140625, -0.040069580078125, -0.02767181396484375, -0.0152740478515625, -0.00287628173828125, 0.009521484375, 0.02191925048828125, 0.0343170166015625, 0.04671478271484375, 0.059112548828125, 0.07151031494140625, 0.0839080810546875, 0.09630584716796875, 0.10870361328125, 0.12110137939453125, 0.1334991455078125, 0.14589691162109375, 0.158294677734375, 0.17069244384765625, 0.1830902099609375, 0.19548797607421875, 0.2078857421875, 0.22028350830078125, 0.2326812744140625, 0.24507904052734375, 0.257476806640625, 0.26987457275390625, 0.2822723388671875, 0.29467010498046875, 0.30706787109375, 0.31946563720703125, 0.3318634033203125, 0.34426116943359375, 0.356658935546875, 0.36905670166015625, 0.3814544677734375, 0.39385223388671875, 0.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 11.0, 11.0, 17.0, 12.0, 15.0, 14.0, 26.0, 29.0, 25.0, 29.0, 35.0, 21.0, 31.0, 49.0, 43.0, 46.0, 48.0, 44.0, 34.0, 36.0, 34.0, 32.0, 41.0, 32.0, 34.0, 25.0, 29.0, 26.0, 15.0, 24.0, 18.0, 17.0, 13.0, 12.0, 7.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7140655517578125, -0.688873291015625, -0.6636810302734375, -0.63848876953125, -0.6132965087890625, -0.588104248046875, -0.5629119873046875, -0.5377197265625, -0.5125274658203125, -0.487335205078125, -0.4621429443359375, -0.43695068359375, -0.4117584228515625, -0.386566162109375, -0.3613739013671875, -0.336181640625, -0.3109893798828125, -0.285797119140625, -0.2606048583984375, -0.23541259765625, -0.2102203369140625, -0.185028076171875, -0.1598358154296875, -0.1346435546875, -0.1094512939453125, -0.084259033203125, -0.0590667724609375, -0.03387451171875, -0.0086822509765625, 0.016510009765625, 0.0417022705078125, 0.06689453125, 0.0920867919921875, 0.117279052734375, 0.1424713134765625, 0.16766357421875, 0.1928558349609375, 0.218048095703125, 0.2432403564453125, 0.2684326171875, 0.2936248779296875, 0.318817138671875, 0.3440093994140625, 0.36920166015625, 0.3943939208984375, 0.419586181640625, 0.4447784423828125, 0.469970703125, 0.4951629638671875, 0.520355224609375, 0.5455474853515625, 0.57073974609375, 0.5959320068359375, 0.621124267578125, 0.6463165283203125, 0.6715087890625, 0.6967010498046875, 0.721893310546875, 0.7470855712890625, 0.77227783203125, 0.7974700927734375, 0.822662353515625, 0.8478546142578125, 0.873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 18.0, 31.0, 34.0, 57.0, 87.0, 134.0, 254.0, 420.0, 728.0, 1376.0, 2871.0, 5907.0, 13614.0, 37320.0, 123114.0, 424889.0, 309507.0, 81611.0, 26653.0, 10439.0, 4590.0, 2218.0, 1147.0, 629.0, 348.0, 219.0, 110.0, 88.0, 46.0, 32.0, 17.0, 12.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.06044912338256836, -0.05855083465576172, -0.05665254592895508, -0.05475425720214844, -0.0528559684753418, -0.050957679748535156, -0.049059391021728516, -0.047161102294921875, -0.045262813568115234, -0.043364524841308594, -0.04146623611450195, -0.03956794738769531, -0.03766965866088867, -0.03577136993408203, -0.03387308120727539, -0.03197479248046875, -0.03007650375366211, -0.02817821502685547, -0.026279926300048828, -0.024381637573242188, -0.022483348846435547, -0.020585060119628906, -0.018686771392822266, -0.016788482666015625, -0.014890193939208984, -0.012991905212402344, -0.011093616485595703, -0.009195327758789062, -0.007297039031982422, -0.005398750305175781, -0.0035004615783691406, -0.0016021728515625, 0.0002961158752441406, 0.0021944046020507812, 0.004092693328857422, 0.0059909820556640625, 0.007889270782470703, 0.009787559509277344, 0.011685848236083984, 0.013584136962890625, 0.015482425689697266, 0.017380714416503906, 0.019279003143310547, 0.021177291870117188, 0.023075580596923828, 0.02497386932373047, 0.02687215805053711, 0.02877044677734375, 0.03066873550415039, 0.03256702423095703, 0.03446531295776367, 0.03636360168457031, 0.03826189041137695, 0.040160179138183594, 0.042058467864990234, 0.043956756591796875, 0.045855045318603516, 0.047753334045410156, 0.0496516227722168, 0.05154991149902344, 0.05344820022583008, 0.05534648895263672, 0.05724477767944336, 0.05914306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 22.0, 22.0, 14.0, 27.0, 43.0, 65.0, 87.0, 124.0, 128.0, 106.0, 103.0, 56.0, 58.0, 25.0, 28.0, 16.0, 13.0, 9.0, 4.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.5666471123695374e-05, -4.364922642707825e-05, -4.163198173046112e-05, -3.9614737033843994e-05, -3.759749233722687e-05, -3.558024764060974e-05, -3.3563002943992615e-05, -3.154575824737549e-05, -2.9528513550758362e-05, -2.7511268854141235e-05, -2.549402415752411e-05, -2.3476779460906982e-05, -2.1459534764289856e-05, -1.944229006767273e-05, -1.7425045371055603e-05, -1.5407800674438477e-05, -1.339055597782135e-05, -1.1373311281204224e-05, -9.356066584587097e-06, -7.338821887969971e-06, -5.321577191352844e-06, -3.3043324947357178e-06, -1.2870877981185913e-06, 7.301568984985352e-07, 2.7474015951156616e-06, 4.764646291732788e-06, 6.7818909883499146e-06, 8.799135684967041e-06, 1.0816380381584167e-05, 1.2833625078201294e-05, 1.485086977481842e-05, 1.6868114471435547e-05, 1.8885359168052673e-05, 2.09026038646698e-05, 2.2919848561286926e-05, 2.4937093257904053e-05, 2.695433795452118e-05, 2.8971582651138306e-05, 3.098882734775543e-05, 3.300607204437256e-05, 3.5023316740989685e-05, 3.704056143760681e-05, 3.905780613422394e-05, 4.1075050830841064e-05, 4.309229552745819e-05, 4.510954022407532e-05, 4.7126784920692444e-05, 4.914402961730957e-05, 5.11612743139267e-05, 5.317851901054382e-05, 5.519576370716095e-05, 5.7213008403778076e-05, 5.92302531003952e-05, 6.124749779701233e-05, 6.326474249362946e-05, 6.528198719024658e-05, 6.729923188686371e-05, 6.931647658348083e-05, 7.133372128009796e-05, 7.335096597671509e-05, 7.536821067333221e-05, 7.738545536994934e-05, 7.940270006656647e-05, 8.14199447631836e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 18.0, 15.0, 24.0, 30.0, 33.0, 62.0, 62.0, 156.0, 288.0, 586.0, 1592.0, 4758.0, 17727.0, 106463.0, 641518.0, 232467.0, 31445.0, 7188.0, 2350.0, 918.0, 338.0, 174.0, 99.0, 63.0, 47.0, 32.0, 20.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09949684143066406, -0.09602737426757812, -0.09255790710449219, -0.08908843994140625, -0.08561897277832031, -0.08214950561523438, -0.07868003845214844, -0.0752105712890625, -0.07174110412597656, -0.06827163696289062, -0.06480216979980469, -0.06133270263671875, -0.05786323547363281, -0.054393768310546875, -0.05092430114746094, -0.047454833984375, -0.04398536682128906, -0.040515899658203125, -0.03704643249511719, -0.03357696533203125, -0.030107498168945312, -0.026638031005859375, -0.023168563842773438, -0.0196990966796875, -0.016229629516601562, -0.012760162353515625, -0.009290695190429688, -0.00582122802734375, -0.0023517608642578125, 0.001117706298828125, 0.0045871734619140625, 0.008056640625, 0.011526107788085938, 0.014995574951171875, 0.018465042114257812, 0.02193450927734375, 0.025403976440429688, 0.028873443603515625, 0.03234291076660156, 0.0358123779296875, 0.03928184509277344, 0.042751312255859375, 0.04622077941894531, 0.04969024658203125, 0.05315971374511719, 0.056629180908203125, 0.06009864807128906, 0.063568115234375, 0.06703758239746094, 0.07050704956054688, 0.07397651672363281, 0.07744598388671875, 0.08091545104980469, 0.08438491821289062, 0.08785438537597656, 0.0913238525390625, 0.09479331970214844, 0.09826278686523438, 0.10173225402832031, 0.10520172119140625, 0.10867118835449219, 0.11214065551757812, 0.11561012268066406, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 7.0, 5.0, 7.0, 11.0, 18.0, 15.0, 19.0, 21.0, 26.0, 30.0, 36.0, 51.0, 53.0, 56.0, 66.0, 68.0, 59.0, 71.0, 45.0, 57.0, 43.0, 45.0, 42.0, 28.0, 27.0, 17.0, 8.0, 5.0, 20.0, 7.0, 1.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179901123046875, -0.0174102783203125, -0.0168304443359375, -0.0162506103515625, -0.0156707763671875, -0.0150909423828125, -0.0145111083984375, -0.0139312744140625, -0.0133514404296875, -0.0127716064453125, -0.0121917724609375, -0.0116119384765625, -0.0110321044921875, -0.0104522705078125, -0.0098724365234375, -0.0092926025390625, -0.0087127685546875, -0.0081329345703125, -0.0075531005859375, -0.0069732666015625, -0.0063934326171875, -0.0058135986328125, -0.0052337646484375, -0.0046539306640625, -0.0040740966796875, -0.0034942626953125, -0.0029144287109375, -0.0023345947265625, -0.0017547607421875, -0.0011749267578125, -0.0005950927734375, -1.52587890625e-05, 0.0005645751953125, 0.0011444091796875, 0.0017242431640625, 0.0023040771484375, 0.0028839111328125, 0.0034637451171875, 0.0040435791015625, 0.0046234130859375, 0.0052032470703125, 0.0057830810546875, 0.0063629150390625, 0.0069427490234375, 0.0075225830078125, 0.0081024169921875, 0.0086822509765625, 0.0092620849609375, 0.0098419189453125, 0.0104217529296875, 0.0110015869140625, 0.0115814208984375, 0.0121612548828125, 0.0127410888671875, 0.0133209228515625, 0.0139007568359375, 0.0144805908203125, 0.0150604248046875, 0.0156402587890625, 0.0162200927734375, 0.0167999267578125, 0.0173797607421875, 0.0179595947265625, 0.0185394287109375, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 16.0, 23.0, 64.0, 117.0, 210.0, 237.0, 164.0, 92.0, 37.0, 24.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1237847805023193, -2.073493719100952, -2.023202896118164, -1.9729118347167969, -1.9226207733154297, -1.872329831123352, -1.8220388889312744, -1.7717478275299072, -1.7214568853378296, -1.671165943145752, -1.6208748817443848, -1.5705839395523071, -1.5202929973602295, -1.4700019359588623, -1.4197109937667847, -1.369420051574707, -1.3191289901733398, -1.2688380479812622, -1.218546986579895, -1.1682560443878174, -1.1179649829864502, -1.0676740407943726, -1.017383098602295, -0.9670920968055725, -0.9168010950088501, -0.8665100932121277, -0.8162190914154053, -0.7659281492233276, -0.7156371474266052, -0.6653461456298828, -0.6150552034378052, -0.5647642016410828, -0.5144731998443604, -0.46418219804763794, -0.4138912260532379, -0.3636002540588379, -0.3133092522621155, -0.26301825046539307, -0.21272727847099304, -0.16243630647659302, -0.1121453046798706, -0.06185431778430939, -0.011563330888748169, 0.03872765600681305, 0.08901864290237427, 0.13930964469909668, 0.1896006166934967, 0.23989158868789673, 0.29018259048461914, 0.34047359228134155, 0.3907645642757416, 0.4410555362701416, 0.491346538066864, 0.5416375398635864, 0.5919284820556641, 0.6422194838523865, 0.6925104856491089, 0.7428014874458313, 0.7930924892425537, 0.8433834314346313, 0.8936744332313538, 0.9439654350280762, 0.9942563772201538, 1.0445473194122314, 1.0948383808135986]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 10.0, 14.0, 13.0, 13.0, 21.0, 32.0, 25.0, 25.0, 43.0, 35.0, 39.0, 36.0, 36.0, 37.0, 44.0, 45.0, 39.0, 41.0, 40.0, 43.0, 40.0, 40.0, 40.0, 35.0, 34.0, 24.0, 21.0, 24.0, 17.0, 15.0, 11.0, 9.0, 11.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.4222990870475769, -0.41003358364105225, -0.3977680802345276, -0.38550257682800293, -0.37323707342147827, -0.3609715700149536, -0.34870606660842896, -0.3364405632019043, -0.32417505979537964, -0.311909556388855, -0.2996440529823303, -0.28737854957580566, -0.275113046169281, -0.26284754276275635, -0.2505820393562317, -0.23831652104854584, -0.22605100274085999, -0.21378549933433533, -0.20151999592781067, -0.189254492521286, -0.17698898911476135, -0.1647234857082367, -0.15245796740055084, -0.14019246399402618, -0.12792696058750153, -0.11566145718097687, -0.10339595377445221, -0.09113044291734695, -0.0788649395108223, -0.06659943610429764, -0.05433392524719238, -0.042068421840667725, -0.02980288863182068, -0.01753738336265087, -0.005271878093481064, 0.006993629038333893, 0.01925913244485855, 0.03152463585138321, 0.043790146708488464, 0.05605565011501312, 0.06832115352153778, 0.08058665692806244, 0.0928521603345871, 0.10511767119169235, 0.11738317459821701, 0.12964868545532227, 0.14191418886184692, 0.15417969226837158, 0.16644519567489624, 0.1787106990814209, 0.19097620248794556, 0.20324170589447021, 0.21550720930099487, 0.22777271270751953, 0.24003823101520538, 0.25230371952056885, 0.2645692229270935, 0.27683472633361816, 0.2891002297401428, 0.3013657331466675, 0.31363123655319214, 0.3258967399597168, 0.33816224336624146, 0.3504277467727661, 0.36269327998161316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 7.0, 15.0, 20.0, 26.0, 55.0, 78.0, 114.0, 155.0, 246.0, 389.0, 573.0, 1034.0, 1737.0, 3066.0, 5587.0, 10471.0, 22530.0, 57423.0, 212048.0, 499490.0, 149416.0, 45008.0, 18690.0, 9018.0, 4624.0, 2624.0, 1553.0, 992.0, 551.0, 370.0, 211.0, 143.0, 99.0, 59.0, 41.0, 36.0, 19.0, 15.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16472816467285156, -0.15892410278320312, -0.1531200408935547, -0.14731597900390625, -0.1415119171142578, -0.13570785522460938, -0.12990379333496094, -0.1240997314453125, -0.11829566955566406, -0.11249160766601562, -0.10668754577636719, -0.10088348388671875, -0.09507942199707031, -0.08927536010742188, -0.08347129821777344, -0.077667236328125, -0.07186317443847656, -0.06605911254882812, -0.06025505065917969, -0.05445098876953125, -0.04864692687988281, -0.042842864990234375, -0.03703880310058594, -0.0312347412109375, -0.025430679321289062, -0.019626617431640625, -0.013822555541992188, -0.00801849365234375, -0.0022144317626953125, 0.003589630126953125, 0.009393692016601562, 0.01519775390625, 0.021001815795898438, 0.026805877685546875, 0.03260993957519531, 0.03841400146484375, 0.04421806335449219, 0.050022125244140625, 0.05582618713378906, 0.0616302490234375, 0.06743431091308594, 0.07323837280273438, 0.07904243469238281, 0.08484649658203125, 0.09065055847167969, 0.09645462036132812, 0.10225868225097656, 0.108062744140625, 0.11386680603027344, 0.11967086791992188, 0.1254749298095703, 0.13127899169921875, 0.1370830535888672, 0.14288711547851562, 0.14869117736816406, 0.1544952392578125, 0.16029930114746094, 0.16610336303710938, 0.1719074249267578, 0.17771148681640625, 0.1835155487060547, 0.18931961059570312, 0.19512367248535156, 0.200927734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 18.0, 15.0, 9.0, 27.0, 25.0, 19.0, 23.0, 33.0, 33.0, 37.0, 33.0, 53.0, 38.0, 44.0, 32.0, 49.0, 47.0, 55.0, 28.0, 51.0, 46.0, 27.0, 40.0, 19.0, 34.0, 18.0, 23.0, 20.0, 14.0, 14.0, 13.0, 6.0, 12.0, 1.0, 5.0, 9.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6416015625, -0.6213302612304688, -0.6010589599609375, -0.5807876586914062, -0.560516357421875, -0.5402450561523438, -0.5199737548828125, -0.49970245361328125, -0.47943115234375, -0.45915985107421875, -0.4388885498046875, -0.41861724853515625, -0.398345947265625, -0.37807464599609375, -0.3578033447265625, -0.33753204345703125, -0.3172607421875, -0.29698944091796875, -0.2767181396484375, -0.25644683837890625, -0.236175537109375, -0.21590423583984375, -0.1956329345703125, -0.17536163330078125, -0.15509033203125, -0.13481903076171875, -0.1145477294921875, -0.09427642822265625, -0.074005126953125, -0.05373382568359375, -0.0334625244140625, -0.01319122314453125, 0.007080078125, 0.02735137939453125, 0.0476226806640625, 0.06789398193359375, 0.088165283203125, 0.10843658447265625, 0.1287078857421875, 0.14897918701171875, 0.16925048828125, 0.18952178955078125, 0.2097930908203125, 0.23006439208984375, 0.250335693359375, 0.27060699462890625, 0.2908782958984375, 0.31114959716796875, 0.3314208984375, 0.35169219970703125, 0.3719635009765625, 0.39223480224609375, 0.412506103515625, 0.43277740478515625, 0.4530487060546875, 0.47332000732421875, 0.49359130859375, 0.5138626098632812, 0.5341339111328125, 0.5544052124023438, 0.574676513671875, 0.5949478149414062, 0.6152191162109375, 0.6354904174804688, 0.65576171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 5.0, 7.0, 7.0, 11.0, 20.0, 20.0, 31.0, 45.0, 35.0, 64.0, 63.0, 105.0, 140.0, 230.0, 399.0, 907.0, 2536.0, 8960.0, 50186.0, 777342.0, 182263.0, 17903.0, 4347.0, 1399.0, 565.0, 298.0, 182.0, 116.0, 78.0, 53.0, 47.0, 47.0, 28.0, 34.0, 18.0, 17.0, 13.0, 5.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.51806640625, -0.5035667419433594, -0.48906707763671875, -0.4745674133300781, -0.4600677490234375, -0.4455680847167969, -0.43106842041015625, -0.4165687561035156, -0.402069091796875, -0.3875694274902344, -0.37306976318359375, -0.3585700988769531, -0.3440704345703125, -0.3295707702636719, -0.31507110595703125, -0.3005714416503906, -0.28607177734375, -0.2715721130371094, -0.25707244873046875, -0.24257278442382812, -0.2280731201171875, -0.21357345581054688, -0.19907379150390625, -0.18457412719726562, -0.170074462890625, -0.15557479858398438, -0.14107513427734375, -0.12657546997070312, -0.1120758056640625, -0.09757614135742188, -0.08307647705078125, -0.06857681274414062, -0.0540771484375, -0.039577484130859375, -0.02507781982421875, -0.010578155517578125, 0.0039215087890625, 0.018421173095703125, 0.03292083740234375, 0.047420501708984375, 0.061920166015625, 0.07641983032226562, 0.09091949462890625, 0.10541915893554688, 0.1199188232421875, 0.13441848754882812, 0.14891815185546875, 0.16341781616210938, 0.17791748046875, 0.19241714477539062, 0.20691680908203125, 0.22141647338867188, 0.2359161376953125, 0.2504158020019531, 0.26491546630859375, 0.2794151306152344, 0.293914794921875, 0.3084144592285156, 0.32291412353515625, 0.3374137878417969, 0.3519134521484375, 0.3664131164550781, 0.38091278076171875, 0.3954124450683594, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 8.0, 12.0, 12.0, 16.0, 28.0, 24.0, 14.0, 23.0, 31.0, 29.0, 35.0, 37.0, 33.0, 51.0, 57.0, 47.0, 51.0, 57.0, 47.0, 36.0, 50.0, 50.0, 36.0, 29.0, 27.0, 23.0, 30.0, 26.0, 10.0, 20.0, 7.0, 8.0, 7.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7721786499023438, -0.7489471435546875, -0.7257156372070312, -0.702484130859375, -0.6792526245117188, -0.6560211181640625, -0.6327896118164062, -0.60955810546875, -0.5863265991210938, -0.5630950927734375, -0.5398635864257812, -0.516632080078125, -0.49340057373046875, -0.4701690673828125, -0.44693756103515625, -0.4237060546875, -0.40047454833984375, -0.3772430419921875, -0.35401153564453125, -0.330780029296875, -0.30754852294921875, -0.2843170166015625, -0.26108551025390625, -0.23785400390625, -0.21462249755859375, -0.1913909912109375, -0.16815948486328125, -0.144927978515625, -0.12169647216796875, -0.0984649658203125, -0.07523345947265625, -0.052001953125, -0.02877044677734375, -0.0055389404296875, 0.01769256591796875, 0.040924072265625, 0.06415557861328125, 0.0873870849609375, 0.11061859130859375, 0.13385009765625, 0.15708160400390625, 0.1803131103515625, 0.20354461669921875, 0.226776123046875, 0.25000762939453125, 0.2732391357421875, 0.29647064208984375, 0.3197021484375, 0.34293365478515625, 0.3661651611328125, 0.38939666748046875, 0.412628173828125, 0.43585968017578125, 0.4590911865234375, 0.48232269287109375, 0.50555419921875, 0.5287857055664062, 0.5520172119140625, 0.5752487182617188, 0.598480224609375, 0.6217117309570312, 0.6449432373046875, 0.6681747436523438, 0.69140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 9.0, 12.0, 24.0, 27.0, 50.0, 88.0, 114.0, 242.0, 440.0, 1079.0, 2847.0, 10486.0, 65506.0, 848404.0, 99958.0, 13405.0, 3406.0, 1276.0, 535.0, 269.0, 148.0, 73.0, 55.0, 26.0, 18.0, 10.0, 10.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.1607503890991211, -0.1565837860107422, -0.15241718292236328, -0.14825057983398438, -0.14408397674560547, -0.13991737365722656, -0.13575077056884766, -0.13158416748046875, -0.12741756439208984, -0.12325096130371094, -0.11908435821533203, -0.11491775512695312, -0.11075115203857422, -0.10658454895019531, -0.1024179458618164, -0.0982513427734375, -0.0940847396850586, -0.08991813659667969, -0.08575153350830078, -0.08158493041992188, -0.07741832733154297, -0.07325172424316406, -0.06908512115478516, -0.06491851806640625, -0.060751914978027344, -0.05658531188964844, -0.05241870880126953, -0.048252105712890625, -0.04408550262451172, -0.03991889953613281, -0.035752296447753906, -0.031585693359375, -0.027419090270996094, -0.023252487182617188, -0.01908588409423828, -0.014919281005859375, -0.010752677917480469, -0.0065860748291015625, -0.0024194717407226562, 0.00174713134765625, 0.005913734436035156, 0.010080337524414062, 0.014246940612792969, 0.018413543701171875, 0.02258014678955078, 0.026746749877929688, 0.030913352966308594, 0.0350799560546875, 0.039246559143066406, 0.04341316223144531, 0.04757976531982422, 0.051746368408203125, 0.05591297149658203, 0.06007957458496094, 0.06424617767333984, 0.06841278076171875, 0.07257938385009766, 0.07674598693847656, 0.08091259002685547, 0.08507919311523438, 0.08924579620361328, 0.09341239929199219, 0.0975790023803711, 0.10174560546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 10.0, 10.0, 12.0, 16.0, 19.0, 28.0, 44.0, 75.0, 152.0, 149.0, 176.0, 83.0, 64.0, 38.0, 23.0, 27.0, 23.0, 7.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8656253814697266e-05, -1.815054565668106e-05, -1.7644837498664856e-05, -1.713912934064865e-05, -1.6633421182632446e-05, -1.612771302461624e-05, -1.5622004866600037e-05, -1.5116296708583832e-05, -1.4610588550567627e-05, -1.4104880392551422e-05, -1.3599172234535217e-05, -1.3093464076519012e-05, -1.2587755918502808e-05, -1.2082047760486603e-05, -1.1576339602470398e-05, -1.1070631444454193e-05, -1.0564923286437988e-05, -1.0059215128421783e-05, -9.553506970405579e-06, -9.047798812389374e-06, -8.542090654373169e-06, -8.036382496356964e-06, -7.530674338340759e-06, -7.0249661803245544e-06, -6.51925802230835e-06, -6.013549864292145e-06, -5.50784170627594e-06, -5.002133548259735e-06, -4.49642539024353e-06, -3.9907172322273254e-06, -3.4850090742111206e-06, -2.9793009161949158e-06, -2.473592758178711e-06, -1.967884600162506e-06, -1.4621764421463013e-06, -9.564682841300964e-07, -4.507601261138916e-07, 5.494803190231323e-08, 5.606561899185181e-07, 1.066364347934723e-06, 1.5720725059509277e-06, 2.0777806639671326e-06, 2.5834888219833374e-06, 3.0891969799995422e-06, 3.594905138015747e-06, 4.100613296031952e-06, 4.606321454048157e-06, 5.1120296120643616e-06, 5.617737770080566e-06, 6.123445928096771e-06, 6.629154086112976e-06, 7.134862244129181e-06, 7.640570402145386e-06, 8.14627856016159e-06, 8.651986718177795e-06, 9.157694876194e-06, 9.663403034210205e-06, 1.016911119222641e-05, 1.0674819350242615e-05, 1.118052750825882e-05, 1.1686235666275024e-05, 1.219194382429123e-05, 1.2697651982307434e-05, 1.3203360140323639e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 13.0, 8.0, 19.0, 37.0, 35.0, 71.0, 133.0, 259.0, 518.0, 1150.0, 3111.0, 9861.0, 45615.0, 672559.0, 275747.0, 28397.0, 6984.0, 2262.0, 848.0, 396.0, 192.0, 120.0, 70.0, 40.0, 23.0, 21.0, 8.0, 11.0, 7.0, 5.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.101806640625, -0.09839725494384766, -0.09498786926269531, -0.09157848358154297, -0.08816909790039062, -0.08475971221923828, -0.08135032653808594, -0.0779409408569336, -0.07453155517578125, -0.0711221694946289, -0.06771278381347656, -0.06430339813232422, -0.060894012451171875, -0.05748462677001953, -0.05407524108886719, -0.050665855407714844, -0.0472564697265625, -0.043847084045410156, -0.04043769836425781, -0.03702831268310547, -0.033618927001953125, -0.03020954132080078, -0.026800155639648438, -0.023390769958496094, -0.01998138427734375, -0.016571998596191406, -0.013162612915039062, -0.009753227233886719, -0.006343841552734375, -0.0029344558715820312, 0.0004749298095703125, 0.0038843154907226562, 0.007293701171875, 0.010703086853027344, 0.014112472534179688, 0.01752185821533203, 0.020931243896484375, 0.02434062957763672, 0.027750015258789062, 0.031159400939941406, 0.03456878662109375, 0.037978172302246094, 0.04138755798339844, 0.04479694366455078, 0.048206329345703125, 0.05161571502685547, 0.05502510070800781, 0.058434486389160156, 0.0618438720703125, 0.06525325775146484, 0.06866264343261719, 0.07207202911376953, 0.07548141479492188, 0.07889080047607422, 0.08230018615722656, 0.0857095718383789, 0.08911895751953125, 0.0925283432006836, 0.09593772888183594, 0.09934711456298828, 0.10275650024414062, 0.10616588592529297, 0.10957527160644531, 0.11298465728759766, 0.11639404296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 7.0, 9.0, 20.0, 24.0, 39.0, 44.0, 70.0, 94.0, 139.0, 147.0, 114.0, 70.0, 47.0, 38.0, 27.0, 18.0, 16.0, 11.0, 13.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.037109375, -0.03587675094604492, -0.034644126892089844, -0.033411502838134766, -0.03217887878417969, -0.03094625473022461, -0.02971363067626953, -0.028481006622314453, -0.027248382568359375, -0.026015758514404297, -0.02478313446044922, -0.02355051040649414, -0.022317886352539062, -0.021085262298583984, -0.019852638244628906, -0.018620014190673828, -0.01738739013671875, -0.016154766082763672, -0.014922142028808594, -0.013689517974853516, -0.012456893920898438, -0.01122426986694336, -0.009991645812988281, -0.008759021759033203, -0.007526397705078125, -0.006293773651123047, -0.005061149597167969, -0.0038285255432128906, -0.0025959014892578125, -0.0013632774353027344, -0.00013065338134765625, 0.0011019706726074219, 0.0023345947265625, 0.003567218780517578, 0.004799842834472656, 0.006032466888427734, 0.0072650909423828125, 0.00849771499633789, 0.009730339050292969, 0.010962963104248047, 0.012195587158203125, 0.013428211212158203, 0.014660835266113281, 0.01589345932006836, 0.017126083374023438, 0.018358707427978516, 0.019591331481933594, 0.020823955535888672, 0.02205657958984375, 0.023289203643798828, 0.024521827697753906, 0.025754451751708984, 0.026987075805664062, 0.02821969985961914, 0.02945232391357422, 0.030684947967529297, 0.031917572021484375, 0.03315019607543945, 0.03438282012939453, 0.03561544418334961, 0.03684806823730469, 0.038080692291259766, 0.039313316345214844, 0.04054594039916992, 0.041778564453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 23.0, 50.0, 110.0, 205.0, 255.0, 197.0, 95.0, 37.0, 19.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.405527591705322, -4.316229820251465, -4.226932048797607, -4.13763427734375, -4.048336505889893, -3.959038734436035, -3.8697409629821777, -3.780442953109741, -3.691145181655884, -3.6018474102020264, -3.512549638748169, -3.4232518672943115, -3.333954095840454, -3.2446560859680176, -3.15535831451416, -3.0660605430603027, -2.9767627716064453, -2.887465000152588, -2.7981672286987305, -2.708869457244873, -2.6195716857910156, -2.530273914337158, -2.440976142883301, -2.3516781330108643, -2.262380599975586, -2.1730828285217285, -2.083785057067871, -1.9944872856140137, -1.9051893949508667, -1.8158916234970093, -1.7265938520431519, -1.6372959613800049, -1.547998070716858, -1.4587002992630005, -1.369402527809143, -1.280104637145996, -1.1908068656921387, -1.1015090942382812, -1.0122113227844238, -0.9229134917259216, -0.8336157202720642, -0.7443179488182068, -0.6550201177597046, -0.5657223463058472, -0.47642454504966736, -0.38712674379348755, -0.2978289723396301, -0.20853114128112793, -0.11923336982727051, -0.029935576021671295, 0.05936221778392792, 0.14866000413894653, 0.23795780539512634, 0.32725560665130615, 0.4165533781051636, 0.5058512091636658, 0.5951489806175232, 0.6844467520713806, 0.7737445831298828, 0.8630423545837402, 0.9523401260375977, 1.041637897491455, 1.1309356689453125, 1.2202335596084595, 1.309531331062317]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 6.0, 2.0, 6.0, 12.0, 8.0, 7.0, 11.0, 10.0, 23.0, 15.0, 15.0, 23.0, 26.0, 38.0, 32.0, 45.0, 34.0, 37.0, 41.0, 34.0, 48.0, 40.0, 47.0, 47.0, 38.0, 29.0, 31.0, 35.0, 23.0, 21.0, 33.0, 28.0, 24.0, 20.0, 22.0, 13.0, 11.0, 12.0, 10.0, 8.0, 5.0, 7.0, 4.0, 10.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0377143621444702, -1.0079102516174316, -0.9781060218811035, -0.9483018517494202, -0.9184976816177368, -0.8886935710906982, -0.8588893413543701, -0.8290852308273315, -0.7992810606956482, -0.7694768905639648, -0.7396727204322815, -0.7098685503005981, -0.6800643801689148, -0.6502602100372314, -0.6204560995101929, -0.5906519293785095, -0.5608477592468262, -0.5310435891151428, -0.5012394189834595, -0.4714352488517761, -0.44163110852241516, -0.4118269383907318, -0.38202276825904846, -0.3522186279296875, -0.3224143981933594, -0.292610228061676, -0.2628060579299927, -0.23300190269947052, -0.20319774746894836, -0.17339357733726501, -0.14358940720558167, -0.11378525197505951, -0.08398109674453735, -0.0541769340634346, -0.02437276765704155, 0.0054313987493515015, 0.035235561430454254, 0.065039724111557, 0.09484389424324036, 0.12464804947376251, 0.15445221960544586, 0.1842563897371292, 0.21406054496765137, 0.24386471509933472, 0.27366888523101807, 0.3034730553627014, 0.33327722549438477, 0.3630813658237457, 0.3928855359554291, 0.4226897060871124, 0.4524938762187958, 0.48229801654815674, 0.5121021866798401, 0.5419063568115234, 0.5717105269432068, 0.6015146970748901, 0.6313188672065735, 0.6611230373382568, 0.6909272074699402, 0.7207313776016235, 0.7505355477333069, 0.7803397178649902, 0.8101438283920288, 0.8399479985237122, 0.8697521686553955]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 6.0, 11.0, 12.0, 20.0, 28.0, 38.0, 52.0, 101.0, 191.0, 368.0, 665.0, 1303.0, 2569.0, 5659.0, 14074.0, 48434.0, 298387.0, 2137336.0, 1473472.0, 161060.0, 30380.0, 10894.0, 4602.0, 2203.0, 1074.0, 563.0, 309.0, 161.0, 112.0, 62.0, 42.0, 22.0, 13.0, 17.0, 16.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66943359375, -0.6462478637695312, -0.6230621337890625, -0.5998764038085938, -0.576690673828125, -0.5535049438476562, -0.5303192138671875, -0.5071334838867188, -0.48394775390625, -0.46076202392578125, -0.4375762939453125, -0.41439056396484375, -0.391204833984375, -0.36801910400390625, -0.3448333740234375, -0.32164764404296875, -0.2984619140625, -0.27527618408203125, -0.2520904541015625, -0.22890472412109375, -0.205718994140625, -0.18253326416015625, -0.1593475341796875, -0.13616180419921875, -0.11297607421875, -0.08979034423828125, -0.0666046142578125, -0.04341888427734375, -0.020233154296875, 0.00295257568359375, 0.0261383056640625, 0.04932403564453125, 0.072509765625, 0.09569549560546875, 0.1188812255859375, 0.14206695556640625, 0.165252685546875, 0.18843841552734375, 0.2116241455078125, 0.23480987548828125, 0.25799560546875, 0.28118133544921875, 0.3043670654296875, 0.32755279541015625, 0.350738525390625, 0.37392425537109375, 0.3971099853515625, 0.42029571533203125, 0.4434814453125, 0.46666717529296875, 0.4898529052734375, 0.5130386352539062, 0.536224365234375, 0.5594100952148438, 0.5825958251953125, 0.6057815551757812, 0.62896728515625, 0.6521530151367188, 0.6753387451171875, 0.6985244750976562, 0.721710205078125, 0.7448959350585938, 0.7680816650390625, 0.7912673950195312, 0.814453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 8.0, 6.0, 12.0, 17.0, 36.0, 21.0, 36.0, 31.0, 43.0, 45.0, 47.0, 51.0, 50.0, 48.0, 64.0, 46.0, 59.0, 51.0, 44.0, 53.0, 45.0, 28.0, 23.0, 24.0, 21.0, 18.0, 12.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4658851623535156, -0.44959259033203125, -0.4333000183105469, -0.4170074462890625, -0.4007148742675781, -0.38442230224609375, -0.3681297302246094, -0.351837158203125, -0.3355445861816406, -0.31925201416015625, -0.3029594421386719, -0.2866668701171875, -0.2703742980957031, -0.25408172607421875, -0.23778915405273438, -0.22149658203125, -0.20520401000976562, -0.18891143798828125, -0.17261886596679688, -0.1563262939453125, -0.14003372192382812, -0.12374114990234375, -0.10744857788085938, -0.091156005859375, -0.07486343383789062, -0.05857086181640625, -0.042278289794921875, -0.0259857177734375, -0.009693145751953125, 0.00659942626953125, 0.022891998291015625, 0.0391845703125, 0.055477142333984375, 0.07176971435546875, 0.08806228637695312, 0.1043548583984375, 0.12064743041992188, 0.13694000244140625, 0.15323257446289062, 0.169525146484375, 0.18581771850585938, 0.20211029052734375, 0.21840286254882812, 0.2346954345703125, 0.2509880065917969, 0.26728057861328125, 0.2835731506347656, 0.29986572265625, 0.3161582946777344, 0.33245086669921875, 0.3487434387207031, 0.3650360107421875, 0.3813285827636719, 0.39762115478515625, 0.4139137268066406, 0.430206298828125, 0.4464988708496094, 0.46279144287109375, 0.4790840148925781, 0.4953765869140625, 0.5116691589355469, 0.5279617309570312, 0.5442543029785156, 0.560546875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 2.0, 11.0, 10.0, 20.0, 57.0, 127.0, 377.0, 2546.0, 721511.0, 3465932.0, 2991.0, 436.0, 130.0, 60.0, 23.0, 17.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.04296875, -6.871368408203125, -6.69976806640625, -6.528167724609375, -6.3565673828125, -6.184967041015625, -6.01336669921875, -5.841766357421875, -5.670166015625, -5.498565673828125, -5.32696533203125, -5.155364990234375, -4.9837646484375, -4.812164306640625, -4.64056396484375, -4.468963623046875, -4.29736328125, -4.125762939453125, -3.95416259765625, -3.782562255859375, -3.6109619140625, -3.439361572265625, -3.26776123046875, -3.096160888671875, -2.924560546875, -2.752960205078125, -2.58135986328125, -2.409759521484375, -2.2381591796875, -2.066558837890625, -1.89495849609375, -1.723358154296875, -1.5517578125, -1.380157470703125, -1.20855712890625, -1.036956787109375, -0.8653564453125, -0.693756103515625, -0.52215576171875, -0.350555419921875, -0.178955078125, -0.007354736328125, 0.16424560546875, 0.335845947265625, 0.5074462890625, 0.679046630859375, 0.85064697265625, 1.022247314453125, 1.19384765625, 1.365447998046875, 1.53704833984375, 1.708648681640625, 1.8802490234375, 2.051849365234375, 2.22344970703125, 2.395050048828125, 2.566650390625, 2.738250732421875, 2.90985107421875, 3.081451416015625, 3.2530517578125, 3.424652099609375, 3.59625244140625, 3.767852783203125, 3.939453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 8.0, 11.0, 21.0, 39.0, 69.0, 104.0, 168.0, 361.0, 755.0, 1198.0, 629.0, 297.0, 147.0, 83.0, 63.0, 29.0, 23.0, 12.0, 14.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.415283203125, -0.4035491943359375, -0.391815185546875, -0.3800811767578125, -0.36834716796875, -0.3566131591796875, -0.344879150390625, -0.3331451416015625, -0.3214111328125, -0.3096771240234375, -0.297943115234375, -0.2862091064453125, -0.27447509765625, -0.2627410888671875, -0.251007080078125, -0.2392730712890625, -0.2275390625, -0.2158050537109375, -0.204071044921875, -0.1923370361328125, -0.18060302734375, -0.1688690185546875, -0.157135009765625, -0.1454010009765625, -0.1336669921875, -0.1219329833984375, -0.110198974609375, -0.0984649658203125, -0.08673095703125, -0.0749969482421875, -0.063262939453125, -0.0515289306640625, -0.039794921875, -0.0280609130859375, -0.016326904296875, -0.0045928955078125, 0.00714111328125, 0.0188751220703125, 0.030609130859375, 0.0423431396484375, 0.0540771484375, 0.0658111572265625, 0.077545166015625, 0.0892791748046875, 0.10101318359375, 0.1127471923828125, 0.124481201171875, 0.1362152099609375, 0.14794921875, 0.1596832275390625, 0.171417236328125, 0.1831512451171875, 0.19488525390625, 0.2066192626953125, 0.218353271484375, 0.2300872802734375, 0.2418212890625, 0.2535552978515625, 0.265289306640625, 0.2770233154296875, 0.28875732421875, 0.3004913330078125, 0.312225341796875, 0.3239593505859375, 0.335693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 15.0, 23.0, 34.0, 37.0, 67.0, 96.0, 103.0, 117.0, 106.0, 96.0, 81.0, 77.0, 39.0, 31.0, 21.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5571964979171753, -1.5232477188110352, -1.4892988204956055, -1.4553499221801758, -1.4214011430740356, -1.3874523639678955, -1.3535034656524658, -1.3195545673370361, -1.285605788230896, -1.2516570091247559, -1.2177081108093262, -1.1837592124938965, -1.1498104333877563, -1.1158616542816162, -1.0819127559661865, -1.0479638576507568, -1.0140150785446167, -0.9800662398338318, -0.9461174011230469, -0.912168562412262, -0.878219723701477, -0.8442708849906921, -0.8103220462799072, -0.7763732075691223, -0.7424243688583374, -0.7084755301475525, -0.6745266914367676, -0.6405778527259827, -0.6066290140151978, -0.5726801753044128, -0.5387313365936279, -0.504782497882843, -0.47083377838134766, -0.43688493967056274, -0.40293610095977783, -0.3689872622489929, -0.335038423538208, -0.3010895848274231, -0.2671407461166382, -0.23319190740585327, -0.19924306869506836, -0.16529422998428345, -0.13134539127349854, -0.09739655256271362, -0.06344771385192871, -0.0294988751411438, 0.004449963569641113, 0.038398802280426025, 0.07234764099121094, 0.10629647970199585, 0.14024531841278076, 0.17419415712356567, 0.20814299583435059, 0.2420918345451355, 0.2760406732559204, 0.3099895119667053, 0.34393835067749023, 0.37788718938827515, 0.41183602809906006, 0.44578486680984497, 0.4797337055206299, 0.5136825442314148, 0.5476313829421997, 0.5815802216529846, 0.6155290603637695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 32.0, 41.0, 41.0, 33.0, 36.0, 41.0, 51.0, 58.0, 51.0, 48.0, 40.0, 44.0, 42.0, 41.0, 32.0, 35.0, 24.0, 30.0, 14.0, 20.0, 15.0, 22.0, 23.0, 14.0, 8.0, 8.0, 8.0, 10.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5627540349960327, -0.5461817383766174, -0.5296093821525574, -0.5130370855331421, -0.4964647889137268, -0.47989246249198914, -0.46332013607025146, -0.4467478394508362, -0.4301755130290985, -0.41360318660736084, -0.39703088998794556, -0.3804585635662079, -0.3638862371444702, -0.34731394052505493, -0.33074161410331726, -0.3141692876815796, -0.2975969910621643, -0.28102466464042664, -0.26445236802101135, -0.24788004159927368, -0.2313077300786972, -0.21473541855812073, -0.19816309213638306, -0.18159078061580658, -0.1650184690952301, -0.14844615757465363, -0.13187384605407715, -0.11530151963233948, -0.098729208111763, -0.08215689659118652, -0.06558457762002945, -0.049012258648872375, -0.03243991732597351, -0.015867602080106735, 0.0007047131657600403, 0.017277028411626816, 0.03384934365749359, 0.05042165517807007, 0.06699397414922714, 0.08356629312038422, 0.1001386046409607, 0.11671091616153717, 0.13328322768211365, 0.14985555410385132, 0.1664278656244278, 0.18300017714500427, 0.19957250356674194, 0.21614481508731842, 0.2327171266078949, 0.24928943812847137, 0.26586174964904785, 0.2824340760707855, 0.2990064024925232, 0.3155786991119385, 0.33215102553367615, 0.3487233519554138, 0.3652956485748291, 0.3818679749965668, 0.39844027161598206, 0.4150125980377197, 0.431584894657135, 0.4481572210788727, 0.46472954750061035, 0.48130184412002563, 0.4978741705417633]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 22.0, 34.0, 77.0, 107.0, 210.0, 367.0, 718.0, 1344.0, 2875.0, 5810.0, 13400.0, 31588.0, 76092.0, 184385.0, 356732.0, 217726.0, 90977.0, 37119.0, 15361.0, 7021.0, 3207.0, 1602.0, 818.0, 409.0, 243.0, 134.0, 63.0, 37.0, 23.0, 15.0, 11.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24895668029785156, -0.24107742309570312, -0.2331981658935547, -0.22531890869140625, -0.2174396514892578, -0.20956039428710938, -0.20168113708496094, -0.1938018798828125, -0.18592262268066406, -0.17804336547851562, -0.1701641082763672, -0.16228485107421875, -0.1544055938720703, -0.14652633666992188, -0.13864707946777344, -0.130767822265625, -0.12288856506347656, -0.11500930786132812, -0.10713005065917969, -0.09925079345703125, -0.09137153625488281, -0.08349227905273438, -0.07561302185058594, -0.0677337646484375, -0.05985450744628906, -0.051975250244140625, -0.04409599304199219, -0.03621673583984375, -0.028337478637695312, -0.020458221435546875, -0.012578964233398438, -0.00469970703125, 0.0031795501708984375, 0.011058807373046875, 0.018938064575195312, 0.02681732177734375, 0.03469657897949219, 0.042575836181640625, 0.05045509338378906, 0.0583343505859375, 0.06621360778808594, 0.07409286499023438, 0.08197212219238281, 0.08985137939453125, 0.09773063659667969, 0.10560989379882812, 0.11348915100097656, 0.121368408203125, 0.12924766540527344, 0.13712692260742188, 0.1450061798095703, 0.15288543701171875, 0.1607646942138672, 0.16864395141601562, 0.17652320861816406, 0.1844024658203125, 0.19228172302246094, 0.20016098022460938, 0.2080402374267578, 0.21591949462890625, 0.2237987518310547, 0.23167800903320312, 0.23955726623535156, 0.2474365234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 14.0, 16.0, 17.0, 17.0, 29.0, 29.0, 38.0, 32.0, 42.0, 41.0, 48.0, 56.0, 55.0, 64.0, 58.0, 48.0, 52.0, 45.0, 54.0, 42.0, 26.0, 30.0, 28.0, 19.0, 19.0, 23.0, 14.0, 10.0, 15.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.42119598388671875, -0.4080657958984375, -0.39493560791015625, -0.381805419921875, -0.36867523193359375, -0.3555450439453125, -0.34241485595703125, -0.32928466796875, -0.31615447998046875, -0.3030242919921875, -0.28989410400390625, -0.276763916015625, -0.26363372802734375, -0.2505035400390625, -0.23737335205078125, -0.2242431640625, -0.21111297607421875, -0.1979827880859375, -0.18485260009765625, -0.171722412109375, -0.15859222412109375, -0.1454620361328125, -0.13233184814453125, -0.11920166015625, -0.10607147216796875, -0.0929412841796875, -0.07981109619140625, -0.066680908203125, -0.05355072021484375, -0.0404205322265625, -0.02729034423828125, -0.01416015625, -0.00102996826171875, 0.0121002197265625, 0.02523040771484375, 0.038360595703125, 0.05149078369140625, 0.0646209716796875, 0.07775115966796875, 0.09088134765625, 0.10401153564453125, 0.1171417236328125, 0.13027191162109375, 0.143402099609375, 0.15653228759765625, 0.1696624755859375, 0.18279266357421875, 0.1959228515625, 0.20905303955078125, 0.2221832275390625, 0.23531341552734375, 0.248443603515625, 0.26157379150390625, 0.2747039794921875, 0.28783416748046875, 0.30096435546875, 0.31409454345703125, 0.3272247314453125, 0.34035491943359375, 0.353485107421875, 0.36661529541015625, 0.3797454833984375, 0.39287567138671875, 0.406005859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 12.0, 16.0, 27.0, 43.0, 70.0, 176.0, 423.0, 959.0, 3360.0, 13699.0, 78940.0, 528683.0, 358609.0, 50168.0, 9350.0, 2519.0, 848.0, 325.0, 137.0, 68.0, 44.0, 21.0, 24.0, 5.0, 7.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.5245552062988281, -0.5090713500976562, -0.4935874938964844, -0.4781036376953125, -0.4626197814941406, -0.44713592529296875, -0.4316520690917969, -0.416168212890625, -0.4006843566894531, -0.38520050048828125, -0.3697166442871094, -0.3542327880859375, -0.3387489318847656, -0.32326507568359375, -0.3077812194824219, -0.29229736328125, -0.2768135070800781, -0.26132965087890625, -0.24584579467773438, -0.2303619384765625, -0.21487808227539062, -0.19939422607421875, -0.18391036987304688, -0.168426513671875, -0.15294265747070312, -0.13745880126953125, -0.12197494506835938, -0.1064910888671875, -0.09100723266601562, -0.07552337646484375, -0.060039520263671875, -0.0445556640625, -0.029071807861328125, -0.01358795166015625, 0.001895904541015625, 0.0173797607421875, 0.032863616943359375, 0.04834747314453125, 0.06383132934570312, 0.079315185546875, 0.09479904174804688, 0.11028289794921875, 0.12576675415039062, 0.1412506103515625, 0.15673446655273438, 0.17221832275390625, 0.18770217895507812, 0.20318603515625, 0.21866989135742188, 0.23415374755859375, 0.24963760375976562, 0.2651214599609375, 0.2806053161621094, 0.29608917236328125, 0.3115730285644531, 0.327056884765625, 0.3425407409667969, 0.35802459716796875, 0.3735084533691406, 0.3889923095703125, 0.4044761657714844, 0.41996002197265625, 0.4354438781738281, 0.450927734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 3.0, 7.0, 11.0, 7.0, 12.0, 17.0, 25.0, 20.0, 22.0, 24.0, 35.0, 27.0, 35.0, 35.0, 24.0, 32.0, 35.0, 46.0, 37.0, 31.0, 44.0, 42.0, 39.0, 39.0, 37.0, 33.0, 46.0, 32.0, 29.0, 21.0, 22.0, 16.0, 18.0, 25.0, 7.0, 12.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.59521484375, -0.5749588012695312, -0.5547027587890625, -0.5344467163085938, -0.514190673828125, -0.49393463134765625, -0.4736785888671875, -0.45342254638671875, -0.43316650390625, -0.41291046142578125, -0.3926544189453125, -0.37239837646484375, -0.352142333984375, -0.33188629150390625, -0.3116302490234375, -0.29137420654296875, -0.2711181640625, -0.25086212158203125, -0.2306060791015625, -0.21035003662109375, -0.190093994140625, -0.16983795166015625, -0.1495819091796875, -0.12932586669921875, -0.10906982421875, -0.08881378173828125, -0.0685577392578125, -0.04830169677734375, -0.028045654296875, -0.00778961181640625, 0.0124664306640625, 0.03272247314453125, 0.052978515625, 0.07323455810546875, 0.0934906005859375, 0.11374664306640625, 0.134002685546875, 0.15425872802734375, 0.1745147705078125, 0.19477081298828125, 0.21502685546875, 0.23528289794921875, 0.2555389404296875, 0.27579498291015625, 0.296051025390625, 0.31630706787109375, 0.3365631103515625, 0.35681915283203125, 0.3770751953125, 0.39733123779296875, 0.4175872802734375, 0.43784332275390625, 0.458099365234375, 0.47835540771484375, 0.4986114501953125, 0.5188674926757812, 0.53912353515625, 0.5593795776367188, 0.5796356201171875, 0.5998916625976562, 0.620147705078125, 0.6404037475585938, 0.6606597900390625, 0.6809158325195312, 0.701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 15.0, 29.0, 51.0, 75.0, 135.0, 225.0, 364.0, 649.0, 1301.0, 2535.0, 5617.0, 13629.0, 40155.0, 158484.0, 516153.0, 224654.0, 53934.0, 17226.0, 6829.0, 3153.0, 1475.0, 788.0, 446.0, 255.0, 131.0, 96.0, 50.0, 28.0, 23.0, 14.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.0540165901184082, -0.052308082580566406, -0.05059957504272461, -0.04889106750488281, -0.047182559967041016, -0.04547405242919922, -0.04376554489135742, -0.042057037353515625, -0.04034852981567383, -0.03864002227783203, -0.036931514739990234, -0.03522300720214844, -0.03351449966430664, -0.031805992126464844, -0.030097484588623047, -0.02838897705078125, -0.026680469512939453, -0.024971961975097656, -0.02326345443725586, -0.021554946899414062, -0.019846439361572266, -0.01813793182373047, -0.016429424285888672, -0.014720916748046875, -0.013012409210205078, -0.011303901672363281, -0.009595394134521484, -0.007886886596679688, -0.006178379058837891, -0.004469871520996094, -0.002761363983154297, -0.0010528564453125, 0.0006556510925292969, 0.0023641586303710938, 0.004072666168212891, 0.0057811737060546875, 0.007489681243896484, 0.009198188781738281, 0.010906696319580078, 0.012615203857421875, 0.014323711395263672, 0.01603221893310547, 0.017740726470947266, 0.019449234008789062, 0.02115774154663086, 0.022866249084472656, 0.024574756622314453, 0.02628326416015625, 0.027991771697998047, 0.029700279235839844, 0.03140878677368164, 0.03311729431152344, 0.034825801849365234, 0.03653430938720703, 0.03824281692504883, 0.039951324462890625, 0.04165983200073242, 0.04336833953857422, 0.045076847076416016, 0.04678535461425781, 0.04849386215209961, 0.050202369689941406, 0.0519108772277832, 0.053619384765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 6.0, 15.0, 25.0, 29.0, 54.0, 97.0, 152.0, 173.0, 130.0, 108.0, 70.0, 31.0, 34.0, 17.0, 11.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.838010787963867e-05, -7.603969424962997e-05, -7.369928061962128e-05, -7.135886698961258e-05, -6.901845335960388e-05, -6.667803972959518e-05, -6.433762609958649e-05, -6.199721246957779e-05, -5.965679883956909e-05, -5.7316385209560394e-05, -5.49759715795517e-05, -5.2635557949543e-05, -5.02951443195343e-05, -4.7954730689525604e-05, -4.561431705951691e-05, -4.327390342950821e-05, -4.093348979949951e-05, -3.8593076169490814e-05, -3.625266253948212e-05, -3.391224890947342e-05, -3.157183527946472e-05, -2.9231421649456024e-05, -2.6891008019447327e-05, -2.455059438943863e-05, -2.221018075942993e-05, -1.9869767129421234e-05, -1.7529353499412537e-05, -1.5188939869403839e-05, -1.2848526239395142e-05, -1.0508112609386444e-05, -8.167698979377747e-06, -5.827285349369049e-06, -3.4868717193603516e-06, -1.146458089351654e-06, 1.1939555406570435e-06, 3.534369170665741e-06, 5.8747828006744385e-06, 8.215196430683136e-06, 1.0555610060691833e-05, 1.2896023690700531e-05, 1.5236437320709229e-05, 1.7576850950717926e-05, 1.9917264580726624e-05, 2.225767821073532e-05, 2.459809184074402e-05, 2.6938505470752716e-05, 2.9278919100761414e-05, 3.161933273077011e-05, 3.395974636077881e-05, 3.6300159990787506e-05, 3.8640573620796204e-05, 4.09809872508049e-05, 4.33214008808136e-05, 4.5661814510822296e-05, 4.8002228140830994e-05, 5.034264177083969e-05, 5.268305540084839e-05, 5.5023469030857086e-05, 5.7363882660865784e-05, 5.970429629087448e-05, 6.204470992088318e-05, 6.438512355089188e-05, 6.672553718090057e-05, 6.906595081090927e-05, 7.140636444091797e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 18.0, 27.0, 50.0, 78.0, 125.0, 231.0, 385.0, 850.0, 1974.0, 5439.0, 16495.0, 63447.0, 292651.0, 494909.0, 127484.0, 30042.0, 8807.0, 3065.0, 1239.0, 549.0, 283.0, 137.0, 77.0, 37.0, 37.0, 21.0, 22.0, 7.0, 9.0, 7.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.051788330078125, -0.04995393753051758, -0.048119544982910156, -0.046285152435302734, -0.04445075988769531, -0.04261636734008789, -0.04078197479248047, -0.03894758224487305, -0.037113189697265625, -0.0352787971496582, -0.03344440460205078, -0.03161001205444336, -0.029775619506835938, -0.027941226959228516, -0.026106834411621094, -0.024272441864013672, -0.02243804931640625, -0.020603656768798828, -0.018769264221191406, -0.016934871673583984, -0.015100479125976562, -0.01326608657836914, -0.011431694030761719, -0.009597301483154297, -0.007762908935546875, -0.005928516387939453, -0.004094123840332031, -0.0022597312927246094, -0.0004253387451171875, 0.0014090538024902344, 0.0032434463500976562, 0.005077838897705078, 0.0069122314453125, 0.008746623992919922, 0.010581016540527344, 0.012415409088134766, 0.014249801635742188, 0.01608419418334961, 0.01791858673095703, 0.019752979278564453, 0.021587371826171875, 0.023421764373779297, 0.02525615692138672, 0.02709054946899414, 0.028924942016601562, 0.030759334564208984, 0.032593727111816406, 0.03442811965942383, 0.03626251220703125, 0.03809690475463867, 0.039931297302246094, 0.041765689849853516, 0.04360008239746094, 0.04543447494506836, 0.04726886749267578, 0.0491032600402832, 0.050937652587890625, 0.05277204513549805, 0.05460643768310547, 0.05644083023071289, 0.05827522277832031, 0.060109615325927734, 0.061944007873535156, 0.06377840042114258, 0.06561279296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 13.0, 7.0, 10.0, 10.0, 16.0, 18.0, 17.0, 23.0, 28.0, 35.0, 46.0, 63.0, 69.0, 84.0, 90.0, 78.0, 87.0, 68.0, 48.0, 42.0, 25.0, 34.0, 21.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01470947265625, -0.014224767684936523, -0.013740062713623047, -0.01325535774230957, -0.012770652770996094, -0.012285947799682617, -0.01180124282836914, -0.011316537857055664, -0.010831832885742188, -0.010347127914428711, -0.009862422943115234, -0.009377717971801758, -0.008893013000488281, -0.008408308029174805, -0.007923603057861328, -0.0074388980865478516, -0.006954193115234375, -0.0064694881439208984, -0.005984783172607422, -0.005500078201293945, -0.005015373229980469, -0.004530668258666992, -0.004045963287353516, -0.003561258316040039, -0.0030765533447265625, -0.002591848373413086, -0.0021071434020996094, -0.0016224384307861328, -0.0011377334594726562, -0.0006530284881591797, -0.00016832351684570312, 0.00031638145446777344, 0.00080108642578125, 0.0012857913970947266, 0.0017704963684082031, 0.0022552013397216797, 0.0027399063110351562, 0.003224611282348633, 0.0037093162536621094, 0.004194021224975586, 0.0046787261962890625, 0.005163431167602539, 0.005648136138916016, 0.006132841110229492, 0.006617546081542969, 0.007102251052856445, 0.007586956024169922, 0.008071660995483398, 0.008556365966796875, 0.009041070938110352, 0.009525775909423828, 0.010010480880737305, 0.010495185852050781, 0.010979890823364258, 0.011464595794677734, 0.011949300765991211, 0.012434005737304688, 0.012918710708618164, 0.01340341567993164, 0.013888120651245117, 0.014372825622558594, 0.01485753059387207, 0.015342235565185547, 0.015826940536499023, 0.0163116455078125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 23.0, 39.0, 34.0, 76.0, 93.0, 108.0, 110.0, 120.0, 96.0, 72.0, 74.0, 31.0, 26.0, 23.0, 11.0, 12.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8066639304161072, -0.7877929210662842, -0.768921971321106, -0.750050961971283, -0.7311800122261047, -0.7123090028762817, -0.6934380531311035, -0.6745670437812805, -0.6556960344314575, -0.6368250250816345, -0.6179540753364563, -0.5990830659866333, -0.5802121162414551, -0.5613411068916321, -0.5424701571464539, -0.5235991477966309, -0.5047281980514526, -0.485857218503952, -0.4669862389564514, -0.4481152594089508, -0.4292442798614502, -0.4103732705116272, -0.3915022909641266, -0.372631311416626, -0.35376033186912537, -0.33488935232162476, -0.31601837277412415, -0.29714739322662354, -0.27827638387680054, -0.2594054341316223, -0.24053442478179932, -0.2216634452342987, -0.20279240608215332, -0.1839214265346527, -0.1650504469871521, -0.1461794525384903, -0.12730847299098969, -0.10843749344348907, -0.08956650644540787, -0.07069551944732666, -0.05182453989982605, -0.03295355662703514, -0.014082573354244232, 0.004788409918546677, 0.023659393191337585, 0.042530372738838196, 0.0614013597369194, 0.08027234673500061, 0.09914332628250122, 0.11801430583000183, 0.13688528537750244, 0.15575627982616425, 0.17462725937366486, 0.19349823892116547, 0.21236923336982727, 0.23124021291732788, 0.2501111924648285, 0.2689821720123291, 0.2878531515598297, 0.3067241311073303, 0.3255951404571533, 0.34446609020233154, 0.36333709955215454, 0.38220807909965515, 0.40107905864715576]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 5.0, 10.0, 14.0, 17.0, 21.0, 17.0, 23.0, 26.0, 46.0, 42.0, 36.0, 40.0, 46.0, 42.0, 57.0, 59.0, 51.0, 46.0, 54.0, 40.0, 42.0, 35.0, 39.0, 29.0, 19.0, 17.0, 29.0, 15.0, 20.0, 11.0, 11.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3913864493370056, -0.3797988295555115, -0.36821120977401733, -0.3566235899925232, -0.34503600001335144, -0.3334483802318573, -0.32186076045036316, -0.310273140668869, -0.2986855208873749, -0.28709790110588074, -0.2755102813243866, -0.26392269134521484, -0.2523350715637207, -0.24074745178222656, -0.22915983200073242, -0.21757221221923828, -0.20598460733890533, -0.1943969875574112, -0.18280938267707825, -0.1712217628955841, -0.15963414311408997, -0.14804652333259583, -0.13645891845226288, -0.12487129867076874, -0.1132836863398552, -0.10169607400894165, -0.09010845422744751, -0.07852084189653397, -0.06693322956562042, -0.05534560978412628, -0.04375799745321274, -0.0321703776717186, -0.020582765340805054, -0.008995150215923786, 0.0025924649089574814, 0.014180079102516174, 0.025767695158720016, 0.03735531121492386, 0.0489429235458374, 0.06053054332733154, 0.07211815565824509, 0.08370576798915863, 0.09529338777065277, 0.10688100010156631, 0.11846861243247986, 0.130056232213974, 0.14164385199546814, 0.15323147177696228, 0.16481907665729523, 0.17640669643878937, 0.18799430131912231, 0.19958192110061646, 0.2111695408821106, 0.22275716066360474, 0.23434476554393768, 0.24593238532543182, 0.25751999020576477, 0.2691076099872589, 0.28069522976875305, 0.2922828197479248, 0.30387043952941895, 0.3154580593109131, 0.3270456790924072, 0.33863329887390137, 0.3502209186553955]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 18.0, 23.0, 41.0, 65.0, 82.0, 124.0, 199.0, 296.0, 416.0, 618.0, 918.0, 1441.0, 2015.0, 3241.0, 5295.0, 8581.0, 14935.0, 27754.0, 57524.0, 145658.0, 393674.0, 224425.0, 78790.0, 35759.0, 18661.0, 10564.0, 6178.0, 3891.0, 2531.0, 1609.0, 1058.0, 703.0, 448.0, 317.0, 203.0, 144.0, 98.0, 71.0, 60.0, 34.0, 23.0, 27.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.20263671875, -0.197113037109375, -0.19158935546875, -0.186065673828125, -0.1805419921875, -0.175018310546875, -0.16949462890625, -0.163970947265625, -0.158447265625, -0.152923583984375, -0.14739990234375, -0.141876220703125, -0.1363525390625, -0.130828857421875, -0.12530517578125, -0.119781494140625, -0.1142578125, -0.108734130859375, -0.10321044921875, -0.097686767578125, -0.0921630859375, -0.086639404296875, -0.08111572265625, -0.075592041015625, -0.070068359375, -0.064544677734375, -0.05902099609375, -0.053497314453125, -0.0479736328125, -0.042449951171875, -0.03692626953125, -0.031402587890625, -0.02587890625, -0.020355224609375, -0.01483154296875, -0.009307861328125, -0.0037841796875, 0.001739501953125, 0.00726318359375, 0.012786865234375, 0.018310546875, 0.023834228515625, 0.02935791015625, 0.034881591796875, 0.0404052734375, 0.045928955078125, 0.05145263671875, 0.056976318359375, 0.0625, 0.068023681640625, 0.07354736328125, 0.079071044921875, 0.0845947265625, 0.090118408203125, 0.09564208984375, 0.101165771484375, 0.106689453125, 0.112213134765625, 0.11773681640625, 0.123260498046875, 0.1287841796875, 0.134307861328125, 0.13983154296875, 0.145355224609375, 0.15087890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 9.0, 16.0, 11.0, 16.0, 26.0, 20.0, 18.0, 34.0, 34.0, 41.0, 35.0, 40.0, 40.0, 57.0, 47.0, 55.0, 50.0, 46.0, 48.0, 52.0, 47.0, 25.0, 35.0, 30.0, 27.0, 26.0, 16.0, 17.0, 8.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7275390625, -0.70654296875, -0.685546875, -0.66455078125, -0.6435546875, -0.62255859375, -0.6015625, -0.58056640625, -0.5595703125, -0.53857421875, -0.517578125, -0.49658203125, -0.4755859375, -0.45458984375, -0.43359375, -0.41259765625, -0.3916015625, -0.37060546875, -0.349609375, -0.32861328125, -0.3076171875, -0.28662109375, -0.265625, -0.24462890625, -0.2236328125, -0.20263671875, -0.181640625, -0.16064453125, -0.1396484375, -0.11865234375, -0.09765625, -0.07666015625, -0.0556640625, -0.03466796875, -0.013671875, 0.00732421875, 0.0283203125, 0.04931640625, 0.0703125, 0.09130859375, 0.1123046875, 0.13330078125, 0.154296875, 0.17529296875, 0.1962890625, 0.21728515625, 0.23828125, 0.25927734375, 0.2802734375, 0.30126953125, 0.322265625, 0.34326171875, 0.3642578125, 0.38525390625, 0.40625, 0.42724609375, 0.4482421875, 0.46923828125, 0.490234375, 0.51123046875, 0.5322265625, 0.55322265625, 0.57421875, 0.59521484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 14.0, 18.0, 9.0, 9.0, 25.0, 26.0, 40.0, 60.0, 61.0, 74.0, 100.0, 223.0, 2284.0, 1000399.0, 44165.0, 484.0, 139.0, 87.0, 69.0, 59.0, 39.0, 42.0, 27.0, 26.0, 16.0, 15.0, 10.0, 7.0, 7.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.173736572265625, -2.10528564453125, -2.036834716796875, -1.9683837890625, -1.899932861328125, -1.83148193359375, -1.763031005859375, -1.694580078125, -1.626129150390625, -1.55767822265625, -1.489227294921875, -1.4207763671875, -1.352325439453125, -1.28387451171875, -1.215423583984375, -1.14697265625, -1.078521728515625, -1.01007080078125, -0.941619873046875, -0.8731689453125, -0.804718017578125, -0.73626708984375, -0.667816162109375, -0.599365234375, -0.530914306640625, -0.46246337890625, -0.394012451171875, -0.3255615234375, -0.257110595703125, -0.18865966796875, -0.120208740234375, -0.0517578125, 0.016693115234375, 0.08514404296875, 0.153594970703125, 0.2220458984375, 0.290496826171875, 0.35894775390625, 0.427398681640625, 0.495849609375, 0.564300537109375, 0.63275146484375, 0.701202392578125, 0.7696533203125, 0.838104248046875, 0.90655517578125, 0.975006103515625, 1.04345703125, 1.111907958984375, 1.18035888671875, 1.248809814453125, 1.3172607421875, 1.385711669921875, 1.45416259765625, 1.522613525390625, 1.591064453125, 1.659515380859375, 1.72796630859375, 1.796417236328125, 1.8648681640625, 1.933319091796875, 2.00177001953125, 2.070220947265625, 2.138671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 10.0, 16.0, 12.0, 11.0, 15.0, 14.0, 28.0, 30.0, 52.0, 51.0, 48.0, 41.0, 54.0, 57.0, 57.0, 65.0, 50.0, 47.0, 46.0, 47.0, 38.0, 38.0, 34.0, 26.0, 27.0, 18.0, 16.0, 15.0, 9.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8743362426757812, -0.8468170166015625, -0.8192977905273438, -0.791778564453125, -0.7642593383789062, -0.7367401123046875, -0.7092208862304688, -0.68170166015625, -0.6541824340820312, -0.6266632080078125, -0.5991439819335938, -0.571624755859375, -0.5441055297851562, -0.5165863037109375, -0.48906707763671875, -0.4615478515625, -0.43402862548828125, -0.4065093994140625, -0.37899017333984375, -0.351470947265625, -0.32395172119140625, -0.2964324951171875, -0.26891326904296875, -0.24139404296875, -0.21387481689453125, -0.1863555908203125, -0.15883636474609375, -0.131317138671875, -0.10379791259765625, -0.0762786865234375, -0.04875946044921875, -0.021240234375, 0.00627899169921875, 0.0337982177734375, 0.06131744384765625, 0.088836669921875, 0.11635589599609375, 0.1438751220703125, 0.17139434814453125, 0.19891357421875, 0.22643280029296875, 0.2539520263671875, 0.28147125244140625, 0.308990478515625, 0.33650970458984375, 0.3640289306640625, 0.39154815673828125, 0.4190673828125, 0.44658660888671875, 0.4741058349609375, 0.5016250610351562, 0.529144287109375, 0.5566635131835938, 0.5841827392578125, 0.6117019653320312, 0.63922119140625, 0.6667404174804688, 0.6942596435546875, 0.7217788696289062, 0.749298095703125, 0.7768173217773438, 0.8043365478515625, 0.8318557739257812, 0.859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 9.0, 20.0, 25.0, 30.0, 50.0, 80.0, 170.0, 472.0, 1888.0, 12088.0, 718777.0, 302768.0, 9614.0, 1701.0, 451.0, 163.0, 82.0, 40.0, 28.0, 15.0, 13.0, 9.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.434326171875, -0.41982269287109375, -0.4053192138671875, -0.39081573486328125, -0.376312255859375, -0.36180877685546875, -0.3473052978515625, -0.33280181884765625, -0.31829833984375, -0.30379486083984375, -0.2892913818359375, -0.27478790283203125, -0.260284423828125, -0.24578094482421875, -0.2312774658203125, -0.21677398681640625, -0.2022705078125, -0.18776702880859375, -0.1732635498046875, -0.15876007080078125, -0.144256591796875, -0.12975311279296875, -0.1152496337890625, -0.10074615478515625, -0.08624267578125, -0.07173919677734375, -0.0572357177734375, -0.04273223876953125, -0.028228759765625, -0.01372528076171875, 0.0007781982421875, 0.01528167724609375, 0.02978515625, 0.04428863525390625, 0.0587921142578125, 0.07329559326171875, 0.087799072265625, 0.10230255126953125, 0.1168060302734375, 0.13130950927734375, 0.14581298828125, 0.16031646728515625, 0.1748199462890625, 0.18932342529296875, 0.203826904296875, 0.21833038330078125, 0.2328338623046875, 0.24733734130859375, 0.2618408203125, 0.27634429931640625, 0.2908477783203125, 0.30535125732421875, 0.319854736328125, 0.33435821533203125, 0.3488616943359375, 0.36336517333984375, 0.37786865234375, 0.39237213134765625, 0.4068756103515625, 0.42137908935546875, 0.435882568359375, 0.45038604736328125, 0.4648895263671875, 0.47939300537109375, 0.493896484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 22.0, 28.0, 31.0, 64.0, 194.0, 343.0, 131.0, 58.0, 26.0, 23.0, 16.0, 7.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2498111724853516e-05, -4.1048042476177216e-05, -3.9597973227500916e-05, -3.8147903978824615e-05, -3.6697834730148315e-05, -3.5247765481472015e-05, -3.3797696232795715e-05, -3.2347626984119415e-05, -3.0897557735443115e-05, -2.9447488486766815e-05, -2.7997419238090515e-05, -2.6547349989414215e-05, -2.5097280740737915e-05, -2.3647211492061615e-05, -2.2197142243385315e-05, -2.0747072994709015e-05, -1.9297003746032715e-05, -1.7846934497356415e-05, -1.6396865248680115e-05, -1.4946796000003815e-05, -1.3496726751327515e-05, -1.2046657502651215e-05, -1.0596588253974915e-05, -9.146519005298615e-06, -7.696449756622314e-06, -6.246380507946014e-06, -4.796311259269714e-06, -3.3462420105934143e-06, -1.8961727619171143e-06, -4.461035132408142e-07, 1.0039657354354858e-06, 2.454034984111786e-06, 3.904104232788086e-06, 5.354173481464386e-06, 6.804242730140686e-06, 8.254311978816986e-06, 9.704381227493286e-06, 1.1154450476169586e-05, 1.2604519724845886e-05, 1.4054588973522186e-05, 1.5504658222198486e-05, 1.6954727470874786e-05, 1.8404796719551086e-05, 1.9854865968227386e-05, 2.1304935216903687e-05, 2.2755004465579987e-05, 2.4205073714256287e-05, 2.5655142962932587e-05, 2.7105212211608887e-05, 2.8555281460285187e-05, 3.0005350708961487e-05, 3.145541995763779e-05, 3.290548920631409e-05, 3.435555845499039e-05, 3.580562770366669e-05, 3.725569695234299e-05, 3.870576620101929e-05, 4.015583544969559e-05, 4.160590469837189e-05, 4.305597394704819e-05, 4.450604319572449e-05, 4.595611244440079e-05, 4.740618169307709e-05, 4.885625094175339e-05, 5.030632019042969e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 13.0, 11.0, 58.0, 116.0, 452.0, 3053.0, 166903.0, 872791.0, 4281.0, 585.0, 147.0, 54.0, 26.0, 21.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7360000610351562, -0.7097930908203125, -0.6835861206054688, -0.657379150390625, -0.6311721801757812, -0.6049652099609375, -0.5787582397460938, -0.55255126953125, -0.5263442993164062, -0.5001373291015625, -0.47393035888671875, -0.447723388671875, -0.42151641845703125, -0.3953094482421875, -0.36910247802734375, -0.3428955078125, -0.31668853759765625, -0.2904815673828125, -0.26427459716796875, -0.238067626953125, -0.21186065673828125, -0.1856536865234375, -0.15944671630859375, -0.13323974609375, -0.10703277587890625, -0.0808258056640625, -0.05461883544921875, -0.028411865234375, -0.00220489501953125, 0.0240020751953125, 0.05020904541015625, 0.076416015625, 0.10262298583984375, 0.1288299560546875, 0.15503692626953125, 0.181243896484375, 0.20745086669921875, 0.2336578369140625, 0.25986480712890625, 0.28607177734375, 0.31227874755859375, 0.3384857177734375, 0.36469268798828125, 0.390899658203125, 0.41710662841796875, 0.4433135986328125, 0.46952056884765625, 0.4957275390625, 0.5219345092773438, 0.5481414794921875, 0.5743484497070312, 0.600555419921875, 0.6267623901367188, 0.6529693603515625, 0.6791763305664062, 0.70538330078125, 0.7315902709960938, 0.7577972412109375, 0.7840042114257812, 0.810211181640625, 0.8364181518554688, 0.8626251220703125, 0.8888320922851562, 0.9150390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 15.0, 11.0, 21.0, 20.0, 47.0, 83.0, 164.0, 297.0, 132.0, 76.0, 42.0, 27.0, 11.0, 15.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.11989498138427734, -0.11607170104980469, -0.11224842071533203, -0.10842514038085938, -0.10460186004638672, -0.10077857971191406, -0.0969552993774414, -0.09313201904296875, -0.0893087387084961, -0.08548545837402344, -0.08166217803955078, -0.07783889770507812, -0.07401561737060547, -0.07019233703613281, -0.06636905670166016, -0.0625457763671875, -0.058722496032714844, -0.05489921569824219, -0.05107593536376953, -0.047252655029296875, -0.04342937469482422, -0.03960609436035156, -0.035782814025878906, -0.03195953369140625, -0.028136253356933594, -0.024312973022460938, -0.02048969268798828, -0.016666412353515625, -0.012843132019042969, -0.009019851684570312, -0.005196571350097656, -0.001373291015625, 0.0024499893188476562, 0.0062732696533203125, 0.010096549987792969, 0.013919830322265625, 0.01774311065673828, 0.021566390991210938, 0.025389671325683594, 0.02921295166015625, 0.033036231994628906, 0.03685951232910156, 0.04068279266357422, 0.044506072998046875, 0.04832935333251953, 0.05215263366699219, 0.055975914001464844, 0.0597991943359375, 0.06362247467041016, 0.06744575500488281, 0.07126903533935547, 0.07509231567382812, 0.07891559600830078, 0.08273887634277344, 0.0865621566772461, 0.09038543701171875, 0.0942087173461914, 0.09803199768066406, 0.10185527801513672, 0.10567855834960938, 0.10950183868408203, 0.11332511901855469, 0.11714839935302734, 0.1209716796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 374.0, 585.0, 39.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6702286005020142, -0.35472747683525085, -0.03922635316848755, 0.27627480030059814, 0.5917758941650391, 0.90727698802948, 1.2227782011032104, 1.5382791757583618, 1.8537803888320923, 2.169281482696533, 2.4847826957702637, 2.800283908843994, 3.1157848834991455, 3.431285858154297, 3.7467870712280273, 4.062288284301758, 4.377789497375488, 4.693290710449219, 5.008791923522949, 5.32429313659668, 5.639793872833252, 5.955295085906982, 6.270796298980713, 6.586297035217285, 6.901798248291016, 7.217299461364746, 7.532800674438477, 7.848301887512207, 8.163803100585938, 8.479303359985352, 8.794805526733398, 9.110305786132812, 9.425806999206543, 9.741308212280273, 10.056809425354004, 10.372310638427734, 10.687811851501465, 11.003313064575195, 11.31881332397461, 11.63431453704834, 11.94981575012207, 12.2653169631958, 12.580818176269531, 12.896319389343262, 13.211820602416992, 13.527320861816406, 13.842823028564453, 14.158323287963867, 14.473825454711914, 14.789326667785645, 15.104827880859375, 15.420329093933105, 15.735830307006836, 16.05133056640625, 16.366832733154297, 16.68233299255371, 16.997833251953125, 17.31333351135254, 17.628835678100586, 17.9443359375, 18.259838104248047, 18.57533836364746, 18.890840530395508, 19.206340789794922, 19.52184295654297]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 12.0, 7.0, 10.0, 18.0, 27.0, 20.0, 28.0, 29.0, 24.0, 35.0, 28.0, 31.0, 45.0, 41.0, 49.0, 50.0, 34.0, 34.0, 37.0, 52.0, 44.0, 39.0, 39.0, 33.0, 25.0, 29.0, 25.0, 21.0, 14.0, 17.0, 16.0, 12.0, 10.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.803426206111908, -0.7724162340164185, -0.7414062023162842, -0.7103962302207947, -0.6793862581253052, -0.6483762264251709, -0.6173662543296814, -0.5863562822341919, -0.5553462505340576, -0.5243362784385681, -0.49332624673843384, -0.46231627464294434, -0.43130627274513245, -0.40029627084732056, -0.36928629875183105, -0.33827629685401917, -0.3072662949562073, -0.2762562930583954, -0.2452463060617447, -0.214236319065094, -0.1832263171672821, -0.15221631526947021, -0.12120632827281952, -0.09019634127616882, -0.059186339378356934, -0.02817634493112564, 0.002833649516105652, 0.033843643963336945, 0.06485363841056824, 0.09586364030838013, 0.12687362730503082, 0.15788361430168152, 0.18889367580413818, 0.21990367770195007, 0.25091367959976196, 0.28192365169525146, 0.31293365359306335, 0.34394365549087524, 0.37495362758636475, 0.40596362948417664, 0.4369736313819885, 0.4679836332798004, 0.4989936351776123, 0.5300036072731018, 0.5610135793685913, 0.5920236110687256, 0.6230335831642151, 0.6540435552597046, 0.6850535869598389, 0.7160635590553284, 0.7470735907554626, 0.7780835628509521, 0.8090935945510864, 0.8401035666465759, 0.8711135387420654, 0.9021235704421997, 0.9331335425376892, 0.9641435146331787, 0.995153546333313, 1.0261635780334473, 1.057173490524292, 1.0881835222244263, 1.1191935539245605, 1.1502034664154053, 1.1812134981155396]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 12.0, 13.0, 24.0, 25.0, 26.0, 53.0, 60.0, 93.0, 160.0, 195.0, 295.0, 579.0, 948.0, 1631.0, 3216.0, 6991.0, 18275.0, 64984.0, 407807.0, 2128040.0, 1307615.0, 192519.0, 37977.0, 11951.0, 4904.0, 2497.0, 1314.0, 775.0, 475.0, 256.0, 172.0, 127.0, 65.0, 57.0, 46.0, 24.0, 23.0, 18.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5744781494140625, -0.555206298828125, -0.5359344482421875, -0.51666259765625, -0.4973907470703125, -0.478118896484375, -0.4588470458984375, -0.4395751953125, -0.4203033447265625, -0.401031494140625, -0.3817596435546875, -0.36248779296875, -0.3432159423828125, -0.323944091796875, -0.3046722412109375, -0.285400390625, -0.2661285400390625, -0.246856689453125, -0.2275848388671875, -0.20831298828125, -0.1890411376953125, -0.169769287109375, -0.1504974365234375, -0.1312255859375, -0.1119537353515625, -0.092681884765625, -0.0734100341796875, -0.05413818359375, -0.0348663330078125, -0.015594482421875, 0.0036773681640625, 0.02294921875, 0.0422210693359375, 0.061492919921875, 0.0807647705078125, 0.10003662109375, 0.1193084716796875, 0.138580322265625, 0.1578521728515625, 0.1771240234375, 0.1963958740234375, 0.215667724609375, 0.2349395751953125, 0.25421142578125, 0.2734832763671875, 0.292755126953125, 0.3120269775390625, 0.331298828125, 0.3505706787109375, 0.369842529296875, 0.3891143798828125, 0.40838623046875, 0.4276580810546875, 0.446929931640625, 0.4662017822265625, 0.4854736328125, 0.5047454833984375, 0.524017333984375, 0.5432891845703125, 0.56256103515625, 0.5818328857421875, 0.601104736328125, 0.6203765869140625, 0.6396484375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 9.0, 17.0, 14.0, 18.0, 29.0, 19.0, 27.0, 37.0, 30.0, 49.0, 42.0, 44.0, 38.0, 39.0, 53.0, 46.0, 53.0, 57.0, 46.0, 43.0, 53.0, 37.0, 27.0, 29.0, 23.0, 25.0, 16.0, 16.0, 11.0, 11.0, 2.0, 6.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.438720703125, -0.42501068115234375, -0.4113006591796875, -0.39759063720703125, -0.383880615234375, -0.37017059326171875, -0.3564605712890625, -0.34275054931640625, -0.32904052734375, -0.31533050537109375, -0.3016204833984375, -0.28791046142578125, -0.274200439453125, -0.26049041748046875, -0.2467803955078125, -0.23307037353515625, -0.2193603515625, -0.20565032958984375, -0.1919403076171875, -0.17823028564453125, -0.164520263671875, -0.15081024169921875, -0.1371002197265625, -0.12339019775390625, -0.10968017578125, -0.09597015380859375, -0.0822601318359375, -0.06855010986328125, -0.054840087890625, -0.04113006591796875, -0.0274200439453125, -0.01371002197265625, 0.0, 0.01371002197265625, 0.0274200439453125, 0.04113006591796875, 0.054840087890625, 0.06855010986328125, 0.0822601318359375, 0.09597015380859375, 0.10968017578125, 0.12339019775390625, 0.1371002197265625, 0.15081024169921875, 0.164520263671875, 0.17823028564453125, 0.1919403076171875, 0.20565032958984375, 0.2193603515625, 0.23307037353515625, 0.2467803955078125, 0.26049041748046875, 0.274200439453125, 0.28791046142578125, 0.3016204833984375, 0.31533050537109375, 0.32904052734375, 0.34275054931640625, 0.3564605712890625, 0.37017059326171875, 0.383880615234375, 0.39759063720703125, 0.4113006591796875, 0.42501068115234375, 0.438720703125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 14.0, 15.0, 34.0, 55.0, 122.0, 252.0, 713.0, 2180.0, 24322.0, 4040277.0, 120257.0, 4402.0, 924.0, 353.0, 166.0, 80.0, 42.0, 15.0, 15.0, 5.0, 9.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24212646484375, -2.1580810546875, -2.07403564453125, -1.989990234375, -1.90594482421875, -1.8218994140625, -1.73785400390625, -1.65380859375, -1.56976318359375, -1.4857177734375, -1.40167236328125, -1.317626953125, -1.23358154296875, -1.1495361328125, -1.06549072265625, -0.9814453125, -0.89739990234375, -0.8133544921875, -0.72930908203125, -0.645263671875, -0.56121826171875, -0.4771728515625, -0.39312744140625, -0.30908203125, -0.22503662109375, -0.1409912109375, -0.05694580078125, 0.027099609375, 0.11114501953125, 0.1951904296875, 0.27923583984375, 0.36328125, 0.44732666015625, 0.5313720703125, 0.61541748046875, 0.699462890625, 0.78350830078125, 0.8675537109375, 0.95159912109375, 1.03564453125, 1.11968994140625, 1.2037353515625, 1.28778076171875, 1.371826171875, 1.45587158203125, 1.5399169921875, 1.62396240234375, 1.7080078125, 1.79205322265625, 1.8760986328125, 1.96014404296875, 2.044189453125, 2.12823486328125, 2.2122802734375, 2.29632568359375, 2.38037109375, 2.46441650390625, 2.5484619140625, 2.63250732421875, 2.716552734375, 2.80059814453125, 2.8846435546875, 2.96868896484375, 3.052734375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 15.0, 21.0, 44.0, 90.0, 170.0, 389.0, 1061.0, 1315.0, 513.0, 208.0, 115.0, 58.0, 30.0, 15.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.5242156982421875, -0.508392333984375, -0.4925689697265625, -0.47674560546875, -0.4609222412109375, -0.445098876953125, -0.4292755126953125, -0.4134521484375, -0.3976287841796875, -0.381805419921875, -0.3659820556640625, -0.35015869140625, -0.3343353271484375, -0.318511962890625, -0.3026885986328125, -0.286865234375, -0.2710418701171875, -0.255218505859375, -0.2393951416015625, -0.22357177734375, -0.2077484130859375, -0.191925048828125, -0.1761016845703125, -0.1602783203125, -0.1444549560546875, -0.128631591796875, -0.1128082275390625, -0.09698486328125, -0.0811614990234375, -0.065338134765625, -0.0495147705078125, -0.03369140625, -0.0178680419921875, -0.002044677734375, 0.0137786865234375, 0.02960205078125, 0.0454254150390625, 0.061248779296875, 0.0770721435546875, 0.0928955078125, 0.1087188720703125, 0.124542236328125, 0.1403656005859375, 0.15618896484375, 0.1720123291015625, 0.187835693359375, 0.2036590576171875, 0.219482421875, 0.2353057861328125, 0.251129150390625, 0.2669525146484375, 0.28277587890625, 0.2985992431640625, 0.314422607421875, 0.3302459716796875, 0.3460693359375, 0.3618927001953125, 0.377716064453125, 0.3935394287109375, 0.40936279296875, 0.4251861572265625, 0.441009521484375, 0.4568328857421875, 0.47265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 12.0, 13.0, 16.0, 26.0, 34.0, 59.0, 51.0, 63.0, 95.0, 93.0, 92.0, 83.0, 72.0, 51.0, 61.0, 42.0, 28.0, 19.0, 11.0, 17.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.699211597442627, -0.6760556697845459, -0.6528997421264648, -0.6297438144683838, -0.6065878868103027, -0.5834318995475769, -0.5602759718894958, -0.5371200442314148, -0.5139641165733337, -0.4908081889152527, -0.46765226125717163, -0.4444963037967682, -0.42134037613868713, -0.3981844484806061, -0.37502849102020264, -0.3518725633621216, -0.3287166357040405, -0.3055607080459595, -0.2824047803878784, -0.259248822927475, -0.23609289526939392, -0.21293696761131287, -0.18978102505207062, -0.16662508249282837, -0.14346915483474731, -0.12031321972608566, -0.09715728461742401, -0.07400134950876236, -0.05084541440010071, -0.027689479291439056, -0.004533544182777405, 0.018622398376464844, 0.04177826642990112, 0.06493420153856277, 0.08809013664722443, 0.11124607175588608, 0.13440200686454773, 0.15755793452262878, 0.18071387708187103, 0.20386981964111328, 0.22702574729919434, 0.2501816749572754, 0.27333760261535645, 0.2964935600757599, 0.31964948773384094, 0.342805415391922, 0.36596137285232544, 0.3891173005104065, 0.41227322816848755, 0.4354291558265686, 0.45858508348464966, 0.4817410409450531, 0.5048969984054565, 0.5280529260635376, 0.5512088537216187, 0.5743647813796997, 0.5975207090377808, 0.6206766366958618, 0.6438325643539429, 0.6669884920120239, 0.690144419670105, 0.7133004069328308, 0.7364563345909119, 0.7596122622489929, 0.782768189907074]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 18.0, 17.0, 13.0, 20.0, 19.0, 27.0, 22.0, 26.0, 42.0, 40.0, 39.0, 38.0, 52.0, 40.0, 44.0, 44.0, 35.0, 49.0, 47.0, 43.0, 48.0, 30.0, 41.0, 33.0, 30.0, 16.0, 23.0, 23.0, 12.0, 18.0, 7.0, 9.0, 6.0, 0.0, 2.0, 7.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5059067606925964, -0.4903792440891266, -0.47485169768333435, -0.4593241810798645, -0.44379663467407227, -0.4282691180706024, -0.41274160146713257, -0.39721405506134033, -0.3816865384578705, -0.36615902185440063, -0.3506314754486084, -0.33510395884513855, -0.3195764422416687, -0.30404889583587646, -0.2885213792324066, -0.27299386262893677, -0.25746631622314453, -0.2419387847185135, -0.22641125321388245, -0.2108837366104126, -0.19535620510578156, -0.1798286736011505, -0.16430115699768066, -0.14877362549304962, -0.13324609398841858, -0.11771856248378754, -0.10219103842973709, -0.08666351437568665, -0.0711359828710556, -0.05560845136642456, -0.040080927312374115, -0.02455340325832367, -0.009025901556015015, 0.006501626223325729, 0.022029154002666473, 0.03755668178200722, 0.05308420956134796, 0.068611741065979, 0.08413926512002945, 0.0996667891740799, 0.11519432067871094, 0.13072185218334198, 0.14624938368797302, 0.16177690029144287, 0.1773044317960739, 0.19283196330070496, 0.2083594799041748, 0.22388701140880585, 0.2394145429134369, 0.25494205951690674, 0.270469605922699, 0.2859971225261688, 0.30152463912963867, 0.3170521855354309, 0.33257970213890076, 0.3481072187423706, 0.36363476514816284, 0.3791622817516327, 0.3946898281574249, 0.4102173447608948, 0.425744891166687, 0.44127240777015686, 0.4567999243736267, 0.47232747077941895, 0.4878549873828888]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 11.0, 28.0, 30.0, 43.0, 61.0, 84.0, 140.0, 201.0, 417.0, 671.0, 1205.0, 2156.0, 3900.0, 7597.0, 15276.0, 33023.0, 79385.0, 218782.0, 389526.0, 174699.0, 65599.0, 27926.0, 13227.0, 6635.0, 3494.0, 1833.0, 1033.0, 582.0, 398.0, 227.0, 119.0, 91.0, 53.0, 42.0, 21.0, 8.0, 7.0, 8.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2176513671875, -0.2111339569091797, -0.20461654663085938, -0.19809913635253906, -0.19158172607421875, -0.18506431579589844, -0.17854690551757812, -0.1720294952392578, -0.1655120849609375, -0.1589946746826172, -0.15247726440429688, -0.14595985412597656, -0.13944244384765625, -0.13292503356933594, -0.12640762329101562, -0.11989021301269531, -0.113372802734375, -0.10685539245605469, -0.10033798217773438, -0.09382057189941406, -0.08730316162109375, -0.08078575134277344, -0.07426834106445312, -0.06775093078613281, -0.0612335205078125, -0.05471611022949219, -0.048198699951171875, -0.04168128967285156, -0.03516387939453125, -0.028646469116210938, -0.022129058837890625, -0.015611648559570312, -0.00909423828125, -0.0025768280029296875, 0.003940582275390625, 0.010457992553710938, 0.01697540283203125, 0.023492813110351562, 0.030010223388671875, 0.03652763366699219, 0.0430450439453125, 0.04956245422363281, 0.056079864501953125, 0.06259727478027344, 0.06911468505859375, 0.07563209533691406, 0.08214950561523438, 0.08866691589355469, 0.095184326171875, 0.10170173645019531, 0.10821914672851562, 0.11473655700683594, 0.12125396728515625, 0.12777137756347656, 0.13428878784179688, 0.1408061981201172, 0.1473236083984375, 0.1538410186767578, 0.16035842895507812, 0.16687583923339844, 0.17339324951171875, 0.17991065979003906, 0.18642807006835938, 0.1929454803466797, 0.199462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 15.0, 11.0, 15.0, 21.0, 20.0, 21.0, 21.0, 43.0, 31.0, 45.0, 48.0, 60.0, 52.0, 61.0, 54.0, 48.0, 49.0, 46.0, 53.0, 35.0, 40.0, 35.0, 32.0, 25.0, 21.0, 21.0, 15.0, 16.0, 6.0, 8.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3002510070800781, -0.28971099853515625, -0.2791709899902344, -0.2686309814453125, -0.2580909729003906, -0.24755096435546875, -0.23701095581054688, -0.226470947265625, -0.21593093872070312, -0.20539093017578125, -0.19485092163085938, -0.1843109130859375, -0.17377090454101562, -0.16323089599609375, -0.15269088745117188, -0.14215087890625, -0.13161087036132812, -0.12107086181640625, -0.11053085327148438, -0.0999908447265625, -0.08945083618164062, -0.07891082763671875, -0.06837081909179688, -0.057830810546875, -0.047290802001953125, -0.03675079345703125, -0.026210784912109375, -0.0156707763671875, -0.005130767822265625, 0.00540924072265625, 0.015949249267578125, 0.0264892578125, 0.037029266357421875, 0.04756927490234375, 0.058109283447265625, 0.0686492919921875, 0.07918930053710938, 0.08972930908203125, 0.10026931762695312, 0.110809326171875, 0.12134933471679688, 0.13188934326171875, 0.14242935180664062, 0.1529693603515625, 0.16350936889648438, 0.17404937744140625, 0.18458938598632812, 0.19512939453125, 0.20566940307617188, 0.21620941162109375, 0.22674942016601562, 0.2372894287109375, 0.24782943725585938, 0.25836944580078125, 0.2689094543457031, 0.279449462890625, 0.2899894714355469, 0.30052947998046875, 0.3110694885253906, 0.3216094970703125, 0.3321495056152344, 0.34268951416015625, 0.3532295227050781, 0.36376953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 24.0, 28.0, 45.0, 54.0, 97.0, 164.0, 241.0, 348.0, 599.0, 1003.0, 1881.0, 3519.0, 7202.0, 16436.0, 39745.0, 112087.0, 337862.0, 341775.0, 113687.0, 40159.0, 16202.0, 7314.0, 3657.0, 1779.0, 1077.0, 555.0, 333.0, 211.0, 140.0, 96.0, 62.0, 41.0, 35.0, 25.0, 11.0, 13.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2132568359375, -0.20764541625976562, -0.20203399658203125, -0.19642257690429688, -0.1908111572265625, -0.18519973754882812, -0.17958831787109375, -0.17397689819335938, -0.168365478515625, -0.16275405883789062, -0.15714263916015625, -0.15153121948242188, -0.1459197998046875, -0.14030838012695312, -0.13469696044921875, -0.12908554077148438, -0.12347412109375, -0.11786270141601562, -0.11225128173828125, -0.10663986206054688, -0.1010284423828125, -0.09541702270507812, -0.08980560302734375, -0.08419418334960938, -0.078582763671875, -0.07297134399414062, -0.06735992431640625, -0.061748504638671875, -0.0561370849609375, -0.050525665283203125, -0.04491424560546875, -0.039302825927734375, -0.03369140625, -0.028079986572265625, -0.02246856689453125, -0.016857147216796875, -0.0112457275390625, -0.005634307861328125, -2.288818359375e-05, 0.005588531494140625, 0.011199951171875, 0.016811370849609375, 0.02242279052734375, 0.028034210205078125, 0.0336456298828125, 0.039257049560546875, 0.04486846923828125, 0.050479888916015625, 0.05609130859375, 0.061702728271484375, 0.06731414794921875, 0.07292556762695312, 0.0785369873046875, 0.08414840698242188, 0.08975982666015625, 0.09537124633789062, 0.100982666015625, 0.10659408569335938, 0.11220550537109375, 0.11781692504882812, 0.1234283447265625, 0.12903976440429688, 0.13465118408203125, 0.14026260375976562, 0.1458740234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 17.0, 10.0, 24.0, 22.0, 35.0, 29.0, 39.0, 47.0, 39.0, 45.0, 48.0, 58.0, 54.0, 49.0, 52.0, 48.0, 52.0, 57.0, 36.0, 32.0, 36.0, 32.0, 24.0, 13.0, 15.0, 14.0, 19.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74072265625, -0.7204437255859375, -0.700164794921875, -0.6798858642578125, -0.65960693359375, -0.6393280029296875, -0.619049072265625, -0.5987701416015625, -0.5784912109375, -0.5582122802734375, -0.537933349609375, -0.5176544189453125, -0.49737548828125, -0.4770965576171875, -0.456817626953125, -0.4365386962890625, -0.416259765625, -0.3959808349609375, -0.375701904296875, -0.3554229736328125, -0.33514404296875, -0.3148651123046875, -0.294586181640625, -0.2743072509765625, -0.2540283203125, -0.2337493896484375, -0.213470458984375, -0.1931915283203125, -0.17291259765625, -0.1526336669921875, -0.132354736328125, -0.1120758056640625, -0.091796875, -0.0715179443359375, -0.051239013671875, -0.0309600830078125, -0.01068115234375, 0.0095977783203125, 0.029876708984375, 0.0501556396484375, 0.0704345703125, 0.0907135009765625, 0.110992431640625, 0.1312713623046875, 0.15155029296875, 0.1718292236328125, 0.192108154296875, 0.2123870849609375, 0.232666015625, 0.2529449462890625, 0.273223876953125, 0.2935028076171875, 0.31378173828125, 0.3340606689453125, 0.354339599609375, 0.3746185302734375, 0.3948974609375, 0.4151763916015625, 0.435455322265625, 0.4557342529296875, 0.47601318359375, 0.4962921142578125, 0.516571044921875, 0.5368499755859375, 0.55712890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 25.0, 26.0, 35.0, 73.0, 129.0, 255.0, 559.0, 1359.0, 4002.0, 16515.0, 123834.0, 791252.0, 91163.0, 13523.0, 3487.0, 1230.0, 487.0, 265.0, 113.0, 64.0, 53.0, 24.0, 9.0, 14.0, 7.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17678070068359375, -0.1724090576171875, -0.16803741455078125, -0.163665771484375, -0.15929412841796875, -0.1549224853515625, -0.15055084228515625, -0.14617919921875, -0.14180755615234375, -0.1374359130859375, -0.13306427001953125, -0.128692626953125, -0.12432098388671875, -0.1199493408203125, -0.11557769775390625, -0.1112060546875, -0.10683441162109375, -0.1024627685546875, -0.09809112548828125, -0.093719482421875, -0.08934783935546875, -0.0849761962890625, -0.08060455322265625, -0.07623291015625, -0.07186126708984375, -0.0674896240234375, -0.06311798095703125, -0.058746337890625, -0.05437469482421875, -0.0500030517578125, -0.04563140869140625, -0.041259765625, -0.03688812255859375, -0.0325164794921875, -0.02814483642578125, -0.023773193359375, -0.01940155029296875, -0.0150299072265625, -0.01065826416015625, -0.00628662109375, -0.00191497802734375, 0.0024566650390625, 0.00682830810546875, 0.011199951171875, 0.01557159423828125, 0.0199432373046875, 0.02431488037109375, 0.0286865234375, 0.03305816650390625, 0.0374298095703125, 0.04180145263671875, 0.046173095703125, 0.05054473876953125, 0.0549163818359375, 0.05928802490234375, 0.06365966796875, 0.06803131103515625, 0.0724029541015625, 0.07677459716796875, 0.081146240234375, 0.08551788330078125, 0.0898895263671875, 0.09426116943359375, 0.0986328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 8.0, 11.0, 15.0, 20.0, 33.0, 26.0, 40.0, 74.0, 106.0, 164.0, 154.0, 105.0, 58.0, 37.0, 21.0, 29.0, 13.0, 12.0, 8.0, 10.0, 3.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.103515625e-05, -5.9118494391441345e-05, -5.720183253288269e-05, -5.5285170674324036e-05, -5.336850881576538e-05, -5.1451846957206726e-05, -4.953518509864807e-05, -4.7618523240089417e-05, -4.570186138153076e-05, -4.378519952297211e-05, -4.186853766441345e-05, -3.99518758058548e-05, -3.803521394729614e-05, -3.611855208873749e-05, -3.420189023017883e-05, -3.228522837162018e-05, -3.0368566513061523e-05, -2.845190465450287e-05, -2.6535242795944214e-05, -2.461858093738556e-05, -2.2701919078826904e-05, -2.078525722026825e-05, -1.8868595361709595e-05, -1.695193350315094e-05, -1.5035271644592285e-05, -1.311860978603363e-05, -1.1201947927474976e-05, -9.28528606891632e-06, -7.368624210357666e-06, -5.451962351799011e-06, -3.5353004932403564e-06, -1.6186386346817017e-06, 2.980232238769531e-07, 2.214685082435608e-06, 4.131346940994263e-06, 6.0480087995529175e-06, 7.964670658111572e-06, 9.881332516670227e-06, 1.1797994375228882e-05, 1.3714656233787537e-05, 1.563131809234619e-05, 1.7547979950904846e-05, 1.94646418094635e-05, 2.1381303668022156e-05, 2.329796552658081e-05, 2.5214627385139465e-05, 2.713128924369812e-05, 2.9047951102256775e-05, 3.096461296081543e-05, 3.2881274819374084e-05, 3.479793667793274e-05, 3.6714598536491394e-05, 3.863126039505005e-05, 4.0547922253608704e-05, 4.246458411216736e-05, 4.438124597072601e-05, 4.629790782928467e-05, 4.821456968784332e-05, 5.013123154640198e-05, 5.204789340496063e-05, 5.396455526351929e-05, 5.588121712207794e-05, 5.77978789806366e-05, 5.971454083919525e-05, 6.16312026977539e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 8.0, 13.0, 21.0, 25.0, 37.0, 43.0, 77.0, 118.0, 232.0, 377.0, 647.0, 1354.0, 3065.0, 10284.0, 61848.0, 773106.0, 170673.0, 18286.0, 4558.0, 1747.0, 892.0, 416.0, 254.0, 152.0, 97.0, 67.0, 42.0, 24.0, 26.0, 18.0, 11.0, 8.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.15673828125, -0.1522197723388672, -0.14770126342773438, -0.14318275451660156, -0.13866424560546875, -0.13414573669433594, -0.12962722778320312, -0.1251087188720703, -0.1205902099609375, -0.11607170104980469, -0.11155319213867188, -0.10703468322753906, -0.10251617431640625, -0.09799766540527344, -0.09347915649414062, -0.08896064758300781, -0.084442138671875, -0.07992362976074219, -0.07540512084960938, -0.07088661193847656, -0.06636810302734375, -0.06184959411621094, -0.057331085205078125, -0.05281257629394531, -0.0482940673828125, -0.04377555847167969, -0.039257049560546875, -0.03473854064941406, -0.03022003173828125, -0.025701522827148438, -0.021183013916015625, -0.016664505004882812, -0.01214599609375, -0.0076274871826171875, -0.003108978271484375, 0.0014095306396484375, 0.00592803955078125, 0.010446548461914062, 0.014965057373046875, 0.019483566284179688, 0.0240020751953125, 0.028520584106445312, 0.033039093017578125, 0.03755760192871094, 0.04207611083984375, 0.04659461975097656, 0.051113128662109375, 0.05563163757324219, 0.060150146484375, 0.06466865539550781, 0.06918716430664062, 0.07370567321777344, 0.07822418212890625, 0.08274269104003906, 0.08726119995117188, 0.09177970886230469, 0.0962982177734375, 0.10081672668457031, 0.10533523559570312, 0.10985374450683594, 0.11437225341796875, 0.11889076232910156, 0.12340927124023438, 0.1279277801513672, 0.1324462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 19.0, 19.0, 37.0, 38.0, 55.0, 105.0, 131.0, 189.0, 124.0, 87.0, 47.0, 45.0, 21.0, 17.0, 19.0, 10.0, 3.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0301666259765625, -0.029288768768310547, -0.028410911560058594, -0.02753305435180664, -0.026655197143554688, -0.025777339935302734, -0.02489948272705078, -0.024021625518798828, -0.023143768310546875, -0.022265911102294922, -0.02138805389404297, -0.020510196685791016, -0.019632339477539062, -0.01875448226928711, -0.017876625061035156, -0.016998767852783203, -0.01612091064453125, -0.015243053436279297, -0.014365196228027344, -0.01348733901977539, -0.012609481811523438, -0.011731624603271484, -0.010853767395019531, -0.009975910186767578, -0.009098052978515625, -0.008220195770263672, -0.007342338562011719, -0.006464481353759766, -0.0055866241455078125, -0.004708766937255859, -0.0038309097290039062, -0.002953052520751953, -0.0020751953125, -0.0011973381042480469, -0.00031948089599609375, 0.0005583763122558594, 0.0014362335205078125, 0.0023140907287597656, 0.0031919479370117188, 0.004069805145263672, 0.004947662353515625, 0.005825519561767578, 0.006703376770019531, 0.007581233978271484, 0.008459091186523438, 0.00933694839477539, 0.010214805603027344, 0.011092662811279297, 0.01197052001953125, 0.012848377227783203, 0.013726234436035156, 0.01460409164428711, 0.015481948852539062, 0.016359806060791016, 0.01723766326904297, 0.018115520477294922, 0.018993377685546875, 0.019871234893798828, 0.02074909210205078, 0.021626949310302734, 0.022504806518554688, 0.02338266372680664, 0.024260520935058594, 0.025138378143310547, 0.0260162353515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 16.0, 20.0, 27.0, 37.0, 44.0, 44.0, 59.0, 89.0, 73.0, 115.0, 107.0, 78.0, 61.0, 50.0, 39.0, 32.0, 25.0, 13.0, 9.0, 6.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45680394768714905, -0.44278910756111145, -0.42877423763275146, -0.41475939750671387, -0.40074455738067627, -0.3867296874523163, -0.3727148473262787, -0.3586999773979187, -0.3446851372718811, -0.3306702971458435, -0.3166554272174835, -0.3026405870914459, -0.28862571716308594, -0.27461087703704834, -0.26059603691101074, -0.24658118188381195, -0.23256632685661316, -0.21855147182941437, -0.20453661680221558, -0.19052177667617798, -0.1765069216489792, -0.1624920666217804, -0.1484772264957428, -0.134462371468544, -0.12044751644134521, -0.10643266141414642, -0.09241781383752823, -0.07840296626091003, -0.06438811123371124, -0.05037325620651245, -0.03635840862989426, -0.022343561053276062, -0.008328676223754883, 0.00568617507815361, 0.019701026380062103, 0.033715877681970596, 0.04773072898387909, 0.06174558401107788, 0.07576043158769608, 0.08977527916431427, 0.10379013419151306, 0.11780498921871185, 0.13181984424591064, 0.14583468437194824, 0.15984953939914703, 0.17386439442634583, 0.18787923455238342, 0.20189408957958221, 0.215908944606781, 0.2299237996339798, 0.2439386546611786, 0.2579534947872162, 0.27196836471557617, 0.28598320484161377, 0.29999804496765137, 0.31401288509368896, 0.32802775502204895, 0.34204259514808655, 0.35605746507644653, 0.37007230520248413, 0.38408714532852173, 0.3981020152568817, 0.4121168553829193, 0.4261317253112793, 0.4401465654373169]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 19.0, 24.0, 28.0, 22.0, 33.0, 34.0, 47.0, 45.0, 51.0, 53.0, 58.0, 54.0, 68.0, 53.0, 58.0, 52.0, 51.0, 36.0, 41.0, 32.0, 23.0, 23.0, 24.0, 20.0, 9.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3513355851173401, -0.34003373980522156, -0.328731894493103, -0.3174300789833069, -0.30612823367118835, -0.2948263883590698, -0.2835245728492737, -0.27222272753715515, -0.2609208822250366, -0.2496190369129181, -0.23831720650196075, -0.22701537609100342, -0.2157135307788849, -0.20441168546676636, -0.19310985505580902, -0.18180802464485168, -0.17050617933273315, -0.15920433402061462, -0.1479025036096573, -0.13660067319869995, -0.12529882788658142, -0.11399699002504349, -0.10269515216350555, -0.09139331430196762, -0.08009147644042969, -0.06878963857889175, -0.05748780071735382, -0.04618596285581589, -0.034884124994277954, -0.02358228713274002, -0.012280449271202087, -0.000978611409664154, 0.010323196649551392, 0.021625034511089325, 0.03292687237262726, 0.04422871023416519, 0.055530548095703125, 0.06683238595724106, 0.07813422381877899, 0.08943606168031693, 0.10073789954185486, 0.11203973740339279, 0.12334157526493073, 0.13464340567588806, 0.1459452509880066, 0.15724709630012512, 0.16854892671108246, 0.1798507571220398, 0.19115260243415833, 0.20245444774627686, 0.2137562781572342, 0.22505810856819153, 0.23635995388031006, 0.2476617991924286, 0.2589636445045471, 0.27026546001434326, 0.2815673053264618, 0.2928691506385803, 0.30417096614837646, 0.315472811460495, 0.3267746567726135, 0.33807650208473206, 0.3493783473968506, 0.36068016290664673, 0.37198200821876526]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 10.0, 14.0, 18.0, 54.0, 52.0, 110.0, 148.0, 262.0, 445.0, 807.0, 1521.0, 3102.0, 6527.0, 14966.0, 37959.0, 134551.0, 658078.0, 125997.0, 36655.0, 14495.0, 6435.0, 2963.0, 1481.0, 799.0, 419.0, 261.0, 142.0, 94.0, 64.0, 34.0, 18.0, 14.0, 16.0, 17.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0], "bins": [-0.537109375, -0.5231513977050781, -0.5091934204101562, -0.4952354431152344, -0.4812774658203125, -0.4673194885253906, -0.45336151123046875, -0.4394035339355469, -0.425445556640625, -0.4114875793457031, -0.39752960205078125, -0.3835716247558594, -0.3696136474609375, -0.3556556701660156, -0.34169769287109375, -0.3277397155761719, -0.31378173828125, -0.2998237609863281, -0.28586578369140625, -0.2719078063964844, -0.2579498291015625, -0.24399185180664062, -0.23003387451171875, -0.21607589721679688, -0.202117919921875, -0.18815994262695312, -0.17420196533203125, -0.16024398803710938, -0.1462860107421875, -0.13232803344726562, -0.11837005615234375, -0.10441207885742188, -0.0904541015625, -0.07649612426757812, -0.06253814697265625, -0.048580169677734375, -0.0346221923828125, -0.020664215087890625, -0.00670623779296875, 0.007251739501953125, 0.021209716796875, 0.035167694091796875, 0.04912567138671875, 0.06308364868164062, 0.0770416259765625, 0.09099960327148438, 0.10495758056640625, 0.11891555786132812, 0.13287353515625, 0.14683151245117188, 0.16078948974609375, 0.17474746704101562, 0.1887054443359375, 0.20266342163085938, 0.21662139892578125, 0.23057937622070312, 0.244537353515625, 0.2584953308105469, 0.27245330810546875, 0.2864112854003906, 0.3003692626953125, 0.3143272399902344, 0.32828521728515625, 0.3422431945800781, 0.356201171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 12.0, 16.0, 18.0, 28.0, 38.0, 33.0, 23.0, 43.0, 45.0, 60.0, 50.0, 55.0, 60.0, 62.0, 67.0, 50.0, 46.0, 44.0, 51.0, 35.0, 28.0, 22.0, 21.0, 16.0, 20.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.744140625, -0.7214736938476562, -0.6988067626953125, -0.6761398315429688, -0.653472900390625, -0.6308059692382812, -0.6081390380859375, -0.5854721069335938, -0.56280517578125, -0.5401382446289062, -0.5174713134765625, -0.49480438232421875, -0.472137451171875, -0.44947052001953125, -0.4268035888671875, -0.40413665771484375, -0.3814697265625, -0.35880279541015625, -0.3361358642578125, -0.31346893310546875, -0.290802001953125, -0.26813507080078125, -0.2454681396484375, -0.22280120849609375, -0.20013427734375, -0.17746734619140625, -0.1548004150390625, -0.13213348388671875, -0.109466552734375, -0.08679962158203125, -0.0641326904296875, -0.04146575927734375, -0.018798828125, 0.00386810302734375, 0.0265350341796875, 0.04920196533203125, 0.071868896484375, 0.09453582763671875, 0.1172027587890625, 0.13986968994140625, 0.16253662109375, 0.18520355224609375, 0.2078704833984375, 0.23053741455078125, 0.253204345703125, 0.27587127685546875, 0.2985382080078125, 0.32120513916015625, 0.3438720703125, 0.36653900146484375, 0.3892059326171875, 0.41187286376953125, 0.434539794921875, 0.45720672607421875, 0.4798736572265625, 0.5025405883789062, 0.52520751953125, 0.5478744506835938, 0.5705413818359375, 0.5932083129882812, 0.615875244140625, 0.6385421752929688, 0.6612091064453125, 0.6838760375976562, 0.70654296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 7.0, 5.0, 13.0, 5.0, 13.0, 16.0, 17.0, 17.0, 16.0, 26.0, 24.0, 35.0, 52.0, 57.0, 75.0, 187.0, 957.0, 26887.0, 1009751.0, 9382.0, 533.0, 128.0, 74.0, 42.0, 43.0, 31.0, 24.0, 20.0, 25.0, 16.0, 15.0, 14.0, 9.0, 13.0, 4.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.3345947265625, -2.255126953125, -2.1756591796875, -2.09619140625, -2.0167236328125, -1.937255859375, -1.8577880859375, -1.7783203125, -1.6988525390625, -1.619384765625, -1.5399169921875, -1.46044921875, -1.3809814453125, -1.301513671875, -1.2220458984375, -1.142578125, -1.0631103515625, -0.983642578125, -0.9041748046875, -0.82470703125, -0.7452392578125, -0.665771484375, -0.5863037109375, -0.5068359375, -0.4273681640625, -0.347900390625, -0.2684326171875, -0.18896484375, -0.1094970703125, -0.030029296875, 0.0494384765625, 0.12890625, 0.2083740234375, 0.287841796875, 0.3673095703125, 0.44677734375, 0.5262451171875, 0.605712890625, 0.6851806640625, 0.7646484375, 0.8441162109375, 0.923583984375, 1.0030517578125, 1.08251953125, 1.1619873046875, 1.241455078125, 1.3209228515625, 1.400390625, 1.4798583984375, 1.559326171875, 1.6387939453125, 1.71826171875, 1.7977294921875, 1.877197265625, 1.9566650390625, 2.0361328125, 2.1156005859375, 2.195068359375, 2.2745361328125, 2.35400390625, 2.4334716796875, 2.512939453125, 2.5924072265625, 2.671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 8.0, 18.0, 16.0, 16.0, 22.0, 31.0, 36.0, 35.0, 34.0, 46.0, 31.0, 37.0, 41.0, 50.0, 33.0, 48.0, 42.0, 45.0, 41.0, 40.0, 30.0, 26.0, 24.0, 31.0, 27.0, 19.0, 21.0, 20.0, 16.0, 12.0, 15.0, 12.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5302734375, -0.5126495361328125, -0.495025634765625, -0.4774017333984375, -0.45977783203125, -0.4421539306640625, -0.424530029296875, -0.4069061279296875, -0.3892822265625, -0.3716583251953125, -0.354034423828125, -0.3364105224609375, -0.31878662109375, -0.3011627197265625, -0.283538818359375, -0.2659149169921875, -0.248291015625, -0.2306671142578125, -0.213043212890625, -0.1954193115234375, -0.17779541015625, -0.1601715087890625, -0.142547607421875, -0.1249237060546875, -0.1072998046875, -0.0896759033203125, -0.072052001953125, -0.0544281005859375, -0.03680419921875, -0.0191802978515625, -0.001556396484375, 0.0160675048828125, 0.03369140625, 0.0513153076171875, 0.068939208984375, 0.0865631103515625, 0.10418701171875, 0.1218109130859375, 0.139434814453125, 0.1570587158203125, 0.1746826171875, 0.1923065185546875, 0.209930419921875, 0.2275543212890625, 0.24517822265625, 0.2628021240234375, 0.280426025390625, 0.2980499267578125, 0.315673828125, 0.3332977294921875, 0.350921630859375, 0.3685455322265625, 0.38616943359375, 0.4037933349609375, 0.421417236328125, 0.4390411376953125, 0.4566650390625, 0.4742889404296875, 0.491912841796875, 0.5095367431640625, 0.52716064453125, 0.5447845458984375, 0.562408447265625, 0.5800323486328125, 0.59765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 11.0, 10.0, 14.0, 19.0, 45.0, 78.0, 201.0, 520.0, 1743.0, 7682.0, 165736.0, 855921.0, 12883.0, 2512.0, 710.0, 225.0, 98.0, 41.0, 31.0, 16.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.508514404296875, -0.49163818359375, -0.474761962890625, -0.4578857421875, -0.441009521484375, -0.42413330078125, -0.407257080078125, -0.390380859375, -0.373504638671875, -0.35662841796875, -0.339752197265625, -0.3228759765625, -0.305999755859375, -0.28912353515625, -0.272247314453125, -0.25537109375, -0.238494873046875, -0.22161865234375, -0.204742431640625, -0.1878662109375, -0.170989990234375, -0.15411376953125, -0.137237548828125, -0.120361328125, -0.103485107421875, -0.08660888671875, -0.069732666015625, -0.0528564453125, -0.035980224609375, -0.01910400390625, -0.002227783203125, 0.0146484375, 0.031524658203125, 0.04840087890625, 0.065277099609375, 0.0821533203125, 0.099029541015625, 0.11590576171875, 0.132781982421875, 0.149658203125, 0.166534423828125, 0.18341064453125, 0.200286865234375, 0.2171630859375, 0.234039306640625, 0.25091552734375, 0.267791748046875, 0.28466796875, 0.301544189453125, 0.31842041015625, 0.335296630859375, 0.3521728515625, 0.369049072265625, 0.38592529296875, 0.402801513671875, 0.419677734375, 0.436553955078125, 0.45343017578125, 0.470306396484375, 0.4871826171875, 0.504058837890625, 0.52093505859375, 0.537811279296875, 0.5546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 17.0, 21.0, 32.0, 74.0, 234.0, 339.0, 100.0, 56.0, 30.0, 21.0, 14.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40614128112793e-05, -5.2072107791900635e-05, -5.008280277252197e-05, -4.809349775314331e-05, -4.610419273376465e-05, -4.4114887714385986e-05, -4.2125582695007324e-05, -4.013627767562866e-05, -3.814697265625e-05, -3.615766763687134e-05, -3.4168362617492676e-05, -3.2179057598114014e-05, -3.018975257873535e-05, -2.820044755935669e-05, -2.6211142539978027e-05, -2.4221837520599365e-05, -2.2232532501220703e-05, -2.024322748184204e-05, -1.825392246246338e-05, -1.6264617443084717e-05, -1.4275312423706055e-05, -1.2286007404327393e-05, -1.029670238494873e-05, -8.307397365570068e-06, -6.318092346191406e-06, -4.328787326812744e-06, -2.339482307434082e-06, -3.501772880554199e-07, 1.6391277313232422e-06, 3.6284327507019043e-06, 5.617737770080566e-06, 7.6070427894592285e-06, 9.59634780883789e-06, 1.1585652828216553e-05, 1.3574957847595215e-05, 1.5564262866973877e-05, 1.755356788635254e-05, 1.95428729057312e-05, 2.1532177925109863e-05, 2.3521482944488525e-05, 2.5510787963867188e-05, 2.750009298324585e-05, 2.9489398002624512e-05, 3.1478703022003174e-05, 3.3468008041381836e-05, 3.54573130607605e-05, 3.744661808013916e-05, 3.943592309951782e-05, 4.1425228118896484e-05, 4.3414533138275146e-05, 4.540383815765381e-05, 4.739314317703247e-05, 4.938244819641113e-05, 5.1371753215789795e-05, 5.336105823516846e-05, 5.535036325454712e-05, 5.733966827392578e-05, 5.932897329330444e-05, 6.13182783126831e-05, 6.330758333206177e-05, 6.529688835144043e-05, 6.728619337081909e-05, 6.927549839019775e-05, 7.126480340957642e-05, 7.325410842895508e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 10.0, 18.0, 23.0, 35.0, 60.0, 104.0, 198.0, 463.0, 1233.0, 4783.0, 39781.0, 944849.0, 49509.0, 5241.0, 1321.0, 446.0, 195.0, 117.0, 60.0, 36.0, 30.0, 7.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409423828125, -0.39556121826171875, -0.3816986083984375, -0.36783599853515625, -0.353973388671875, -0.34011077880859375, -0.3262481689453125, -0.31238555908203125, -0.29852294921875, -0.28466033935546875, -0.2707977294921875, -0.25693511962890625, -0.243072509765625, -0.22920989990234375, -0.2153472900390625, -0.20148468017578125, -0.1876220703125, -0.17375946044921875, -0.1598968505859375, -0.14603424072265625, -0.132171630859375, -0.11830902099609375, -0.1044464111328125, -0.09058380126953125, -0.07672119140625, -0.06285858154296875, -0.0489959716796875, -0.03513336181640625, -0.021270751953125, -0.00740814208984375, 0.0064544677734375, 0.02031707763671875, 0.0341796875, 0.04804229736328125, 0.0619049072265625, 0.07576751708984375, 0.089630126953125, 0.10349273681640625, 0.1173553466796875, 0.13121795654296875, 0.14508056640625, 0.15894317626953125, 0.1728057861328125, 0.18666839599609375, 0.200531005859375, 0.21439361572265625, 0.2282562255859375, 0.24211883544921875, 0.2559814453125, 0.26984405517578125, 0.2837066650390625, 0.29756927490234375, 0.311431884765625, 0.32529449462890625, 0.3391571044921875, 0.35301971435546875, 0.36688232421875, 0.38074493408203125, 0.3946075439453125, 0.40847015380859375, 0.422332763671875, 0.43619537353515625, 0.4500579833984375, 0.46392059326171875, 0.477783203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 22.0, 23.0, 43.0, 73.0, 187.0, 348.0, 123.0, 63.0, 42.0, 14.0, 14.0, 9.0, 3.0, 8.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.20142269134521484, -0.1965465545654297, -0.19167041778564453, -0.18679428100585938, -0.18191814422607422, -0.17704200744628906, -0.1721658706665039, -0.16728973388671875, -0.1624135971069336, -0.15753746032714844, -0.15266132354736328, -0.14778518676757812, -0.14290904998779297, -0.1380329132080078, -0.13315677642822266, -0.1282806396484375, -0.12340450286865234, -0.11852836608886719, -0.11365222930908203, -0.10877609252929688, -0.10389995574951172, -0.09902381896972656, -0.0941476821899414, -0.08927154541015625, -0.0843954086303711, -0.07951927185058594, -0.07464313507080078, -0.06976699829101562, -0.06489086151123047, -0.06001472473144531, -0.055138587951660156, -0.050262451171875, -0.045386314392089844, -0.04051017761230469, -0.03563404083251953, -0.030757904052734375, -0.02588176727294922, -0.021005630493164062, -0.016129493713378906, -0.01125335693359375, -0.006377220153808594, -0.0015010833740234375, 0.0033750534057617188, 0.008251190185546875, 0.013127326965332031, 0.018003463745117188, 0.022879600524902344, 0.0277557373046875, 0.032631874084472656, 0.03750801086425781, 0.04238414764404297, 0.047260284423828125, 0.05213642120361328, 0.05701255798339844, 0.061888694763183594, 0.06676483154296875, 0.0716409683227539, 0.07651710510253906, 0.08139324188232422, 0.08626937866210938, 0.09114551544189453, 0.09602165222167969, 0.10089778900146484, 0.10577392578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 32.0, 400.0, 524.0, 53.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85219407081604, -0.5773032307624817, -0.30241239070892334, -0.02752155065536499, 0.24736928939819336, 0.5222601890563965, 0.7971509695053101, 1.0720417499542236, 1.3469326496124268, 1.6218235492706299, 1.8967143297195435, 2.171605110168457, 2.44649600982666, 2.7213869094848633, 2.9962778091430664, 3.2711684703826904, 3.5460593700408936, 3.8209502696990967, 4.095840930938721, 4.370731830596924, 4.645622730255127, 4.92051362991333, 5.195404529571533, 5.470294952392578, 5.745185852050781, 6.020076751708984, 6.2949676513671875, 6.569858551025391, 6.844749450683594, 7.119640350341797, 7.394530773162842, 7.669421672821045, 7.944313049316406, 8.21920394897461, 8.494094848632812, 8.768985748291016, 9.043876647949219, 9.318767547607422, 9.593658447265625, 9.868549346923828, 10.143440246582031, 10.418331146240234, 10.693222045898438, 10.96811294555664, 11.243003845214844, 11.517894744873047, 11.79278564453125, 12.067676544189453, 12.34256649017334, 12.617457389831543, 12.892348289489746, 13.16723918914795, 13.442130088806152, 13.717020988464355, 13.991911888122559, 14.266801834106445, 14.541692733764648, 14.816583633422852, 15.091474533081055, 15.366365432739258, 15.641256332397461, 15.916147232055664, 16.191038131713867, 16.46592903137207, 16.740819931030273]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 7.0, 17.0, 20.0, 15.0, 29.0, 32.0, 33.0, 40.0, 47.0, 41.0, 46.0, 50.0, 44.0, 61.0, 50.0, 38.0, 57.0, 43.0, 49.0, 28.0, 34.0, 33.0, 25.0, 27.0, 20.0, 19.0, 9.0, 17.0, 10.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9638789892196655, -0.9347702264785767, -0.9056615233421326, -0.8765528202056885, -0.8474440574645996, -0.8183352947235107, -0.7892265915870667, -0.7601178884506226, -0.7310091257095337, -0.7019003629684448, -0.6727916598320007, -0.6436829566955566, -0.6145741939544678, -0.5854654312133789, -0.5563567280769348, -0.5272480249404907, -0.49813926219940186, -0.4690305292606354, -0.4399217963218689, -0.4108130633831024, -0.38170433044433594, -0.35259559750556946, -0.323486864566803, -0.2943781316280365, -0.26526939868927, -0.23616066575050354, -0.20705193281173706, -0.17794319987297058, -0.1488344669342041, -0.11972573399543762, -0.09061700105667114, -0.06150826811790466, -0.032399535179138184, -0.003290802240371704, 0.025817930698394775, 0.054926663637161255, 0.08403539657592773, 0.11314412951469421, 0.1422528624534607, 0.17136159539222717, 0.20047032833099365, 0.22957906126976013, 0.2586877942085266, 0.2877965271472931, 0.31690526008605957, 0.34601399302482605, 0.37512272596359253, 0.404231458902359, 0.4333401918411255, 0.46244892477989197, 0.49155765771865845, 0.5206663608551025, 0.5497751235961914, 0.5788838863372803, 0.6079925894737244, 0.6371012926101685, 0.6662100553512573, 0.6953188180923462, 0.7244275212287903, 0.7535362243652344, 0.7826449871063232, 0.8117537498474121, 0.8408624529838562, 0.8699711561203003, 0.8990799188613892]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 9.0, 30.0, 37.0, 48.0, 98.0, 162.0, 312.0, 675.0, 1693.0, 5115.0, 23037.0, 282509.0, 3395522.0, 448645.0, 26894.0, 5934.0, 1939.0, 792.0, 337.0, 196.0, 110.0, 43.0, 43.0, 26.0, 20.0, 15.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.941131591796875, -0.90570068359375, -0.870269775390625, -0.8348388671875, -0.799407958984375, -0.76397705078125, -0.728546142578125, -0.693115234375, -0.657684326171875, -0.62225341796875, -0.586822509765625, -0.5513916015625, -0.515960693359375, -0.48052978515625, -0.445098876953125, -0.40966796875, -0.374237060546875, -0.33880615234375, -0.303375244140625, -0.2679443359375, -0.232513427734375, -0.19708251953125, -0.161651611328125, -0.126220703125, -0.090789794921875, -0.05535888671875, -0.019927978515625, 0.0155029296875, 0.050933837890625, 0.08636474609375, 0.121795654296875, 0.1572265625, 0.192657470703125, 0.22808837890625, 0.263519287109375, 0.2989501953125, 0.334381103515625, 0.36981201171875, 0.405242919921875, 0.440673828125, 0.476104736328125, 0.51153564453125, 0.546966552734375, 0.5823974609375, 0.617828369140625, 0.65325927734375, 0.688690185546875, 0.72412109375, 0.759552001953125, 0.79498291015625, 0.830413818359375, 0.8658447265625, 0.901275634765625, 0.93670654296875, 0.972137451171875, 1.007568359375, 1.042999267578125, 1.07843017578125, 1.113861083984375, 1.1492919921875, 1.184722900390625, 1.22015380859375, 1.255584716796875, 1.291015625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 22.0, 19.0, 33.0, 32.0, 70.0, 39.0, 60.0, 53.0, 74.0, 84.0, 70.0, 77.0, 42.0, 53.0, 39.0, 38.0, 34.0, 25.0, 25.0, 17.0, 13.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4363441467285156, -0.41931915283203125, -0.4022941589355469, -0.3852691650390625, -0.3682441711425781, -0.35121917724609375, -0.3341941833496094, -0.317169189453125, -0.3001441955566406, -0.28311920166015625, -0.2660942077636719, -0.2490692138671875, -0.23204421997070312, -0.21501922607421875, -0.19799423217773438, -0.18096923828125, -0.16394424438476562, -0.14691925048828125, -0.12989425659179688, -0.1128692626953125, -0.09584426879882812, -0.07881927490234375, -0.061794281005859375, -0.044769287109375, -0.027744293212890625, -0.01071929931640625, 0.006305694580078125, 0.0233306884765625, 0.040355682373046875, 0.05738067626953125, 0.07440567016601562, 0.0914306640625, 0.10845565795898438, 0.12548065185546875, 0.14250564575195312, 0.1595306396484375, 0.17655563354492188, 0.19358062744140625, 0.21060562133789062, 0.227630615234375, 0.24465560913085938, 0.26168060302734375, 0.2787055969238281, 0.2957305908203125, 0.3127555847167969, 0.32978057861328125, 0.3468055725097656, 0.36383056640625, 0.3808555603027344, 0.39788055419921875, 0.4149055480957031, 0.4319305419921875, 0.4489555358886719, 0.46598052978515625, 0.4830055236816406, 0.500030517578125, 0.5170555114746094, 0.5340805053710938, 0.5511054992675781, 0.5681304931640625, 0.5851554870605469, 0.6021804809570312, 0.6192054748535156, 0.63623046875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 13.0, 18.0, 18.0, 20.0, 44.0, 61.0, 127.0, 252.0, 805.0, 3524.0, 39032.0, 3913388.0, 226365.0, 8401.0, 1383.0, 427.0, 166.0, 87.0, 49.0, 26.0, 17.0, 12.0, 9.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.79412841796875, -1.7357177734375, -1.67730712890625, -1.618896484375, -1.56048583984375, -1.5020751953125, -1.44366455078125, -1.38525390625, -1.32684326171875, -1.2684326171875, -1.21002197265625, -1.151611328125, -1.09320068359375, -1.0347900390625, -0.97637939453125, -0.91796875, -0.85955810546875, -0.8011474609375, -0.74273681640625, -0.684326171875, -0.62591552734375, -0.5675048828125, -0.50909423828125, -0.45068359375, -0.39227294921875, -0.3338623046875, -0.27545166015625, -0.217041015625, -0.15863037109375, -0.1002197265625, -0.04180908203125, 0.0166015625, 0.07501220703125, 0.1334228515625, 0.19183349609375, 0.250244140625, 0.30865478515625, 0.3670654296875, 0.42547607421875, 0.48388671875, 0.54229736328125, 0.6007080078125, 0.65911865234375, 0.717529296875, 0.77593994140625, 0.8343505859375, 0.89276123046875, 0.951171875, 1.00958251953125, 1.0679931640625, 1.12640380859375, 1.184814453125, 1.24322509765625, 1.3016357421875, 1.36004638671875, 1.41845703125, 1.47686767578125, 1.5352783203125, 1.59368896484375, 1.652099609375, 1.71051025390625, 1.7689208984375, 1.82733154296875, 1.8857421875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 12.0, 14.0, 32.0, 40.0, 55.0, 82.0, 163.0, 226.0, 403.0, 759.0, 813.0, 606.0, 298.0, 163.0, 124.0, 70.0, 36.0, 42.0, 23.0, 24.0, 17.0, 13.0, 4.0, 7.0, 10.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235595703125, -0.2275390625, -0.219482421875, -0.21142578125, -0.203369140625, -0.1953125, -0.187255859375, -0.17919921875, -0.171142578125, -0.1630859375, -0.155029296875, -0.14697265625, -0.138916015625, -0.130859375, -0.122802734375, -0.11474609375, -0.106689453125, -0.0986328125, -0.090576171875, -0.08251953125, -0.074462890625, -0.06640625, -0.058349609375, -0.05029296875, -0.042236328125, -0.0341796875, -0.026123046875, -0.01806640625, -0.010009765625, -0.001953125, 0.006103515625, 0.01416015625, 0.022216796875, 0.0302734375, 0.038330078125, 0.04638671875, 0.054443359375, 0.0625, 0.070556640625, 0.07861328125, 0.086669921875, 0.0947265625, 0.102783203125, 0.11083984375, 0.118896484375, 0.126953125, 0.135009765625, 0.14306640625, 0.151123046875, 0.1591796875, 0.167236328125, 0.17529296875, 0.183349609375, 0.19140625, 0.199462890625, 0.20751953125, 0.215576171875, 0.2236328125, 0.231689453125, 0.23974609375, 0.247802734375, 0.255859375, 0.263916015625, 0.27197265625, 0.280029296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 15.0, 28.0, 38.0, 42.0, 61.0, 70.0, 93.0, 106.0, 99.0, 96.0, 71.0, 69.0, 44.0, 43.0, 25.0, 15.0, 13.0, 10.0, 12.0, 8.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021980285644531, -0.6773347854614258, -0.6524714827537537, -0.6276082396507263, -0.6027449369430542, -0.5778816938400269, -0.5530184507369995, -0.5281551480293274, -0.5032918453216553, -0.47842857241630554, -0.4535652995109558, -0.42870205640792847, -0.40383875370025635, -0.378975510597229, -0.3541122376918793, -0.32924896478652954, -0.3043857216835022, -0.27952244877815247, -0.25465917587280273, -0.2297959178686142, -0.20493264496326447, -0.18006937205791473, -0.1552061140537262, -0.13034284114837646, -0.10547956824302673, -0.080616295337677, -0.05575302988290787, -0.030889764428138733, -0.0060264915227890015, 0.01883678138256073, 0.04370003938674927, 0.068563312292099, 0.09342652559280396, 0.11828979849815369, 0.14315307140350342, 0.16801632940769196, 0.1928796023130417, 0.21774287521839142, 0.24260613322257996, 0.2674694061279297, 0.2923326790332794, 0.31719595193862915, 0.3420592248439789, 0.3669224977493286, 0.39178574085235596, 0.4166490435600281, 0.4415122866630554, 0.46637555956840515, 0.4912388324737549, 0.5161020755767822, 0.5409653782844543, 0.5658286213874817, 0.5906919240951538, 0.6155551671981812, 0.6404184103012085, 0.6652817130088806, 0.6901450157165527, 0.7150082588195801, 0.7398715615272522, 0.7647348046302795, 0.7895981073379517, 0.814461350440979, 0.8393245935440063, 0.8641878962516785, 0.8890511393547058]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 12.0, 9.0, 15.0, 18.0, 14.0, 17.0, 19.0, 37.0, 21.0, 38.0, 23.0, 29.0, 40.0, 38.0, 56.0, 50.0, 38.0, 57.0, 46.0, 51.0, 49.0, 32.0, 47.0, 36.0, 24.0, 34.0, 30.0, 25.0, 17.0, 17.0, 10.0, 16.0, 10.0, 5.0, 6.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4636613726615906, -0.44915205240249634, -0.4346427321434021, -0.42013341188430786, -0.4056240916252136, -0.3911147713661194, -0.37660548090934753, -0.3620961606502533, -0.34758684039115906, -0.3330775201320648, -0.3185681998729706, -0.30405887961387634, -0.2895495891571045, -0.27504026889801025, -0.260530948638916, -0.24602162837982178, -0.23151230812072754, -0.2170029878616333, -0.20249366760253906, -0.18798436224460602, -0.17347504198551178, -0.15896572172641754, -0.1444564163684845, -0.12994709610939026, -0.11543777585029602, -0.10092845559120178, -0.08641914278268814, -0.0719098299741745, -0.05740050971508026, -0.04289118945598602, -0.02838187664747238, -0.01387256383895874, 0.0006367862224578857, 0.015146102756261826, 0.029655419290065765, 0.044164735823869705, 0.058674052357673645, 0.07318337261676788, 0.08769268542528152, 0.10220199823379517, 0.1167113184928894, 0.13122063875198364, 0.14572995901107788, 0.16023926436901093, 0.17474858462810516, 0.1892579048871994, 0.20376721024513245, 0.21827653050422668, 0.23278585076332092, 0.24729517102241516, 0.2618044912815094, 0.27631381154060364, 0.2908231019973755, 0.3053324222564697, 0.31984174251556396, 0.3343510627746582, 0.34886038303375244, 0.3633697032928467, 0.3778790235519409, 0.39238834381103516, 0.4068976640701294, 0.42140698432922363, 0.4359162747859955, 0.4504255950450897, 0.46493491530418396]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 1.0, 2.0, 3.0, 7.0, 11.0, 13.0, 12.0, 17.0, 23.0, 47.0, 81.0, 127.0, 269.0, 505.0, 1013.0, 2067.0, 4761.0, 11396.0, 31371.0, 162695.0, 670164.0, 119628.0, 26590.0, 9917.0, 4123.0, 1808.0, 901.0, 431.0, 229.0, 129.0, 70.0, 29.0, 34.0, 15.0, 13.0, 7.0, 12.0, 7.0, 3.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.30810546875, -0.29915618896484375, -0.2902069091796875, -0.28125762939453125, -0.272308349609375, -0.26335906982421875, -0.2544097900390625, -0.24546051025390625, -0.23651123046875, -0.22756195068359375, -0.2186126708984375, -0.20966339111328125, -0.200714111328125, -0.19176483154296875, -0.1828155517578125, -0.17386627197265625, -0.1649169921875, -0.15596771240234375, -0.1470184326171875, -0.13806915283203125, -0.129119873046875, -0.12017059326171875, -0.1112213134765625, -0.10227203369140625, -0.09332275390625, -0.08437347412109375, -0.0754241943359375, -0.06647491455078125, -0.057525634765625, -0.04857635498046875, -0.0396270751953125, -0.03067779541015625, -0.021728515625, -0.01277923583984375, -0.0038299560546875, 0.00511932373046875, 0.014068603515625, 0.02301788330078125, 0.0319671630859375, 0.04091644287109375, 0.04986572265625, 0.05881500244140625, 0.0677642822265625, 0.07671356201171875, 0.085662841796875, 0.09461212158203125, 0.1035614013671875, 0.11251068115234375, 0.1214599609375, 0.13040924072265625, 0.1393585205078125, 0.14830780029296875, 0.157257080078125, 0.16620635986328125, 0.1751556396484375, 0.18410491943359375, 0.19305419921875, 0.20200347900390625, 0.2109527587890625, 0.21990203857421875, 0.228851318359375, 0.23780059814453125, 0.2467498779296875, 0.25569915771484375, 0.2646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 14.0, 7.0, 19.0, 16.0, 15.0, 36.0, 33.0, 33.0, 37.0, 40.0, 59.0, 49.0, 69.0, 66.0, 66.0, 59.0, 61.0, 59.0, 40.0, 46.0, 37.0, 39.0, 27.0, 23.0, 10.0, 11.0, 11.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577537536621094, -0.34661102294921875, -0.3354682922363281, -0.3243255615234375, -0.3131828308105469, -0.30204010009765625, -0.2908973693847656, -0.279754638671875, -0.2686119079589844, -0.25746917724609375, -0.24632644653320312, -0.2351837158203125, -0.22404098510742188, -0.21289825439453125, -0.20175552368164062, -0.19061279296875, -0.17947006225585938, -0.16832733154296875, -0.15718460083007812, -0.1460418701171875, -0.13489913940429688, -0.12375640869140625, -0.11261367797851562, -0.101470947265625, -0.09032821655273438, -0.07918548583984375, -0.06804275512695312, -0.0569000244140625, -0.045757293701171875, -0.03461456298828125, -0.023471832275390625, -0.0123291015625, -0.001186370849609375, 0.00995635986328125, 0.021099090576171875, 0.0322418212890625, 0.043384552001953125, 0.05452728271484375, 0.06567001342773438, 0.076812744140625, 0.08795547485351562, 0.09909820556640625, 0.11024093627929688, 0.1213836669921875, 0.13252639770507812, 0.14366912841796875, 0.15481185913085938, 0.16595458984375, 0.17709732055664062, 0.18824005126953125, 0.19938278198242188, 0.2105255126953125, 0.22166824340820312, 0.23281097412109375, 0.24395370483398438, 0.255096435546875, 0.2662391662597656, 0.27738189697265625, 0.2885246276855469, 0.2996673583984375, 0.3108100891113281, 0.32195281982421875, 0.3330955505371094, 0.34423828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 35.0, 56.0, 68.0, 85.0, 151.0, 248.0, 367.0, 592.0, 1033.0, 1991.0, 3567.0, 7106.0, 15071.0, 34547.0, 96643.0, 310295.0, 373612.0, 124822.0, 42724.0, 17895.0, 8261.0, 4129.0, 2102.0, 1219.0, 677.0, 399.0, 291.0, 151.0, 109.0, 78.0, 52.0, 37.0, 27.0, 15.0, 14.0, 12.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.135986328125, -0.1323223114013672, -0.12865829467773438, -0.12499427795410156, -0.12133026123046875, -0.11766624450683594, -0.11400222778320312, -0.11033821105957031, -0.1066741943359375, -0.10301017761230469, -0.09934616088867188, -0.09568214416503906, -0.09201812744140625, -0.08835411071777344, -0.08469009399414062, -0.08102607727050781, -0.077362060546875, -0.07369804382324219, -0.07003402709960938, -0.06637001037597656, -0.06270599365234375, -0.05904197692871094, -0.055377960205078125, -0.05171394348144531, -0.0480499267578125, -0.04438591003417969, -0.040721893310546875, -0.03705787658691406, -0.03339385986328125, -0.029729843139648438, -0.026065826416015625, -0.022401809692382812, -0.01873779296875, -0.015073776245117188, -0.011409759521484375, -0.0077457427978515625, -0.00408172607421875, -0.0004177093505859375, 0.003246307373046875, 0.0069103240966796875, 0.0105743408203125, 0.014238357543945312, 0.017902374267578125, 0.021566390991210938, 0.02523040771484375, 0.028894424438476562, 0.032558441162109375, 0.03622245788574219, 0.039886474609375, 0.04355049133300781, 0.047214508056640625, 0.05087852478027344, 0.05454254150390625, 0.05820655822753906, 0.061870574951171875, 0.06553459167480469, 0.0691986083984375, 0.07286262512207031, 0.07652664184570312, 0.08019065856933594, 0.08385467529296875, 0.08751869201660156, 0.09118270874023438, 0.09484672546386719, 0.0985107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 13.0, 7.0, 8.0, 9.0, 14.0, 17.0, 16.0, 26.0, 23.0, 24.0, 30.0, 24.0, 20.0, 40.0, 34.0, 39.0, 45.0, 41.0, 33.0, 42.0, 50.0, 67.0, 34.0, 41.0, 36.0, 37.0, 35.0, 23.0, 31.0, 18.0, 26.0, 24.0, 12.0, 10.0, 9.0, 13.0, 5.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.52294921875, -0.50732421875, -0.49169921875, -0.47607421875, -0.46044921875, -0.44482421875, -0.42919921875, -0.41357421875, -0.39794921875, -0.38232421875, -0.36669921875, -0.35107421875, -0.33544921875, -0.31982421875, -0.30419921875, -0.28857421875, -0.27294921875, -0.25732421875, -0.24169921875, -0.22607421875, -0.21044921875, -0.19482421875, -0.17919921875, -0.16357421875, -0.14794921875, -0.13232421875, -0.11669921875, -0.10107421875, -0.08544921875, -0.06982421875, -0.05419921875, -0.03857421875, -0.02294921875, -0.00732421875, 0.00830078125, 0.02392578125, 0.03955078125, 0.05517578125, 0.07080078125, 0.08642578125, 0.10205078125, 0.11767578125, 0.13330078125, 0.14892578125, 0.16455078125, 0.18017578125, 0.19580078125, 0.21142578125, 0.22705078125, 0.24267578125, 0.25830078125, 0.27392578125, 0.28955078125, 0.30517578125, 0.32080078125, 0.33642578125, 0.35205078125, 0.36767578125, 0.38330078125, 0.39892578125, 0.41455078125, 0.43017578125, 0.44580078125, 0.46142578125, 0.47705078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 7.0, 7.0, 16.0, 21.0, 29.0, 53.0, 89.0, 121.0, 210.0, 327.0, 618.0, 1163.0, 2157.0, 4606.0, 10656.0, 27263.0, 83628.0, 306648.0, 417874.0, 128443.0, 38732.0, 13961.0, 6059.0, 2718.0, 1364.0, 733.0, 400.0, 239.0, 142.0, 93.0, 62.0, 34.0, 28.0, 14.0, 8.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.035186767578125, -0.03409290313720703, -0.03299903869628906, -0.031905174255371094, -0.030811309814453125, -0.029717445373535156, -0.028623580932617188, -0.02752971649169922, -0.02643585205078125, -0.02534198760986328, -0.024248123168945312, -0.023154258728027344, -0.022060394287109375, -0.020966529846191406, -0.019872665405273438, -0.01877880096435547, -0.0176849365234375, -0.01659107208251953, -0.015497207641601562, -0.014403343200683594, -0.013309478759765625, -0.012215614318847656, -0.011121749877929688, -0.010027885437011719, -0.00893402099609375, -0.007840156555175781, -0.0067462921142578125, -0.005652427673339844, -0.004558563232421875, -0.0034646987915039062, -0.0023708343505859375, -0.0012769699096679688, -0.00018310546875, 0.0009107589721679688, 0.0020046234130859375, 0.0030984878540039062, 0.004192352294921875, 0.005286216735839844, 0.0063800811767578125, 0.007473945617675781, 0.00856781005859375, 0.009661674499511719, 0.010755538940429688, 0.011849403381347656, 0.012943267822265625, 0.014037132263183594, 0.015130996704101562, 0.01622486114501953, 0.0173187255859375, 0.01841259002685547, 0.019506454467773438, 0.020600318908691406, 0.021694183349609375, 0.022788047790527344, 0.023881912231445312, 0.02497577667236328, 0.02606964111328125, 0.02716350555419922, 0.028257369995117188, 0.029351234436035156, 0.030445098876953125, 0.031538963317871094, 0.03263282775878906, 0.03372669219970703, 0.034820556640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 5.0, 11.0, 11.0, 20.0, 16.0, 30.0, 32.0, 43.0, 51.0, 55.0, 63.0, 93.0, 76.0, 84.0, 72.0, 72.0, 37.0, 47.0, 31.0, 26.0, 29.0, 12.0, 13.0, 11.0, 6.0, 7.0, 7.0, 3.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6702880859375e-05, -2.595502883195877e-05, -2.520717680454254e-05, -2.4459324777126312e-05, -2.3711472749710083e-05, -2.2963620722293854e-05, -2.2215768694877625e-05, -2.1467916667461395e-05, -2.0720064640045166e-05, -1.9972212612628937e-05, -1.9224360585212708e-05, -1.8476508557796478e-05, -1.772865653038025e-05, -1.698080450296402e-05, -1.623295247554779e-05, -1.548510044813156e-05, -1.4737248420715332e-05, -1.3989396393299103e-05, -1.3241544365882874e-05, -1.2493692338466644e-05, -1.1745840311050415e-05, -1.0997988283634186e-05, -1.0250136256217957e-05, -9.502284228801727e-06, -8.754432201385498e-06, -8.006580173969269e-06, -7.2587281465530396e-06, -6.51087611913681e-06, -5.763024091720581e-06, -5.015172064304352e-06, -4.2673200368881226e-06, -3.5194680094718933e-06, -2.771615982055664e-06, -2.023763954639435e-06, -1.2759119272232056e-06, -5.280598998069763e-07, 2.1979212760925293e-07, 9.676441550254822e-07, 1.7154961824417114e-06, 2.4633482098579407e-06, 3.21120023727417e-06, 3.959052264690399e-06, 4.706904292106628e-06, 5.454756319522858e-06, 6.202608346939087e-06, 6.950460374355316e-06, 7.698312401771545e-06, 8.446164429187775e-06, 9.194016456604004e-06, 9.941868484020233e-06, 1.0689720511436462e-05, 1.1437572538852692e-05, 1.2185424566268921e-05, 1.293327659368515e-05, 1.368112862110138e-05, 1.4428980648517609e-05, 1.5176832675933838e-05, 1.5924684703350067e-05, 1.6672536730766296e-05, 1.7420388758182526e-05, 1.8168240785598755e-05, 1.8916092813014984e-05, 1.9663944840431213e-05, 2.0411796867847443e-05, 2.1159648895263672e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 7.0, 19.0, 22.0, 50.0, 77.0, 128.0, 226.0, 413.0, 715.0, 1425.0, 3098.0, 7231.0, 19488.0, 65466.0, 298628.0, 479200.0, 121680.0, 31588.0, 10561.0, 4399.0, 1980.0, 921.0, 555.0, 283.0, 128.0, 76.0, 60.0, 36.0, 18.0, 18.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04656982421875, -0.045124053955078125, -0.04367828369140625, -0.042232513427734375, -0.0407867431640625, -0.039340972900390625, -0.03789520263671875, -0.036449432373046875, -0.035003662109375, -0.033557891845703125, -0.03211212158203125, -0.030666351318359375, -0.0292205810546875, -0.027774810791015625, -0.02632904052734375, -0.024883270263671875, -0.0234375, -0.021991729736328125, -0.02054595947265625, -0.019100189208984375, -0.0176544189453125, -0.016208648681640625, -0.01476287841796875, -0.013317108154296875, -0.011871337890625, -0.010425567626953125, -0.00897979736328125, -0.007534027099609375, -0.0060882568359375, -0.004642486572265625, -0.00319671630859375, -0.001750946044921875, -0.00030517578125, 0.001140594482421875, 0.00258636474609375, 0.004032135009765625, 0.0054779052734375, 0.006923675537109375, 0.00836944580078125, 0.009815216064453125, 0.011260986328125, 0.012706756591796875, 0.01415252685546875, 0.015598297119140625, 0.0170440673828125, 0.018489837646484375, 0.01993560791015625, 0.021381378173828125, 0.0228271484375, 0.024272918701171875, 0.02571868896484375, 0.027164459228515625, 0.0286102294921875, 0.030055999755859375, 0.03150177001953125, 0.032947540283203125, 0.034393310546875, 0.035839080810546875, 0.03728485107421875, 0.038730621337890625, 0.0401763916015625, 0.041622161865234375, 0.04306793212890625, 0.044513702392578125, 0.04595947265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 10.0, 9.0, 10.0, 10.0, 15.0, 24.0, 29.0, 31.0, 49.0, 80.0, 75.0, 79.0, 69.0, 85.0, 82.0, 65.0, 65.0, 51.0, 29.0, 30.0, 26.0, 15.0, 8.0, 14.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01165008544921875, -0.01130533218383789, -0.010960578918457031, -0.010615825653076172, -0.010271072387695312, -0.009926319122314453, -0.009581565856933594, -0.009236812591552734, -0.008892059326171875, -0.008547306060791016, -0.008202552795410156, -0.007857799530029297, -0.0075130462646484375, -0.007168292999267578, -0.006823539733886719, -0.006478786468505859, -0.006134033203125, -0.005789279937744141, -0.005444526672363281, -0.005099773406982422, -0.0047550201416015625, -0.004410266876220703, -0.004065513610839844, -0.0037207603454589844, -0.003376007080078125, -0.0030312538146972656, -0.0026865005493164062, -0.002341747283935547, -0.0019969940185546875, -0.0016522407531738281, -0.0013074874877929688, -0.0009627342224121094, -0.00061798095703125, -0.0002732276916503906, 7.152557373046875e-05, 0.0004162788391113281, 0.0007610321044921875, 0.0011057853698730469, 0.0014505386352539062, 0.0017952919006347656, 0.002140045166015625, 0.0024847984313964844, 0.0028295516967773438, 0.003174304962158203, 0.0035190582275390625, 0.003863811492919922, 0.004208564758300781, 0.004553318023681641, 0.0048980712890625, 0.005242824554443359, 0.005587577819824219, 0.005932331085205078, 0.0062770843505859375, 0.006621837615966797, 0.006966590881347656, 0.007311344146728516, 0.007656097412109375, 0.008000850677490234, 0.008345603942871094, 0.008690357208251953, 0.009035110473632812, 0.009379863739013672, 0.009724617004394531, 0.01006937026977539, 0.01041412353515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 15.0, 25.0, 35.0, 50.0, 89.0, 107.0, 155.0, 142.0, 133.0, 83.0, 54.0, 34.0, 18.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47072476148605347, -0.451171338558197, -0.43161794543266296, -0.4120645225048065, -0.39251112937927246, -0.372957706451416, -0.35340428352355957, -0.3338508605957031, -0.31429746747016907, -0.2947440445423126, -0.27519065141677856, -0.2556372284889221, -0.23608382046222687, -0.21653041243553162, -0.19697698950767517, -0.17742358148097992, -0.15787017345428467, -0.13831676542758942, -0.11876334995031357, -0.09920993447303772, -0.07965652644634247, -0.06010311841964722, -0.04054970294237137, -0.02099628746509552, -0.0014428794384002686, 0.01811053231358528, 0.03766394406557083, 0.05721735581755638, 0.07677076756954193, 0.09632417559623718, 0.11587759107351303, 0.13543100655078888, 0.15498441457748413, 0.17453782260417938, 0.19409123063087463, 0.21364465355873108, 0.23319806158542633, 0.2527514696121216, 0.272304892539978, 0.2918583154678345, 0.31141170859336853, 0.330965131521225, 0.35051852464675903, 0.3700719475746155, 0.3896253705024719, 0.409178763628006, 0.4287321865558624, 0.4482855796813965, 0.46783900260925293, 0.4873924255371094, 0.5069458484649658, 0.5264992117881775, 0.5460526347160339, 0.5656060576438904, 0.5851594805717468, 0.6047129034996033, 0.6242662668228149, 0.6438196897506714, 0.6633731126785278, 0.6829264760017395, 0.702479898929596, 0.7220333218574524, 0.7415867447853088, 0.7611401677131653, 0.7806935906410217]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 1.0, 8.0, 15.0, 15.0, 14.0, 12.0, 22.0, 28.0, 44.0, 33.0, 34.0, 39.0, 44.0, 56.0, 59.0, 60.0, 53.0, 68.0, 58.0, 55.0, 43.0, 43.0, 36.0, 31.0, 21.0, 26.0, 25.0, 18.0, 11.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3167051374912262, -0.30682605504989624, -0.2969469428062439, -0.28706786036491394, -0.2771887481212616, -0.26730966567993164, -0.2574305534362793, -0.24755147099494934, -0.2376723736524582, -0.22779327630996704, -0.2179141789674759, -0.20803508162498474, -0.19815599918365479, -0.18827688694000244, -0.17839780449867249, -0.16851870715618134, -0.15863960981369019, -0.14876051247119904, -0.13888141512870789, -0.12900231778621674, -0.11912322789430618, -0.10924413055181503, -0.09936504065990448, -0.08948594331741333, -0.07960684597492218, -0.06972774863243103, -0.05984865501523018, -0.04996956139802933, -0.04009046405553818, -0.030211366713047028, -0.020332273095846176, -0.010453179478645325, -0.0005740523338317871, 0.009305043146014214, 0.019184138625860214, 0.029063234105706215, 0.038942329585552216, 0.048821426928043365, 0.05870052054524422, 0.06857961416244507, 0.07845871150493622, 0.08833780884742737, 0.09821690618991852, 0.10809599608182907, 0.11797509342432022, 0.12785419821739197, 0.13773328065872192, 0.14761237800121307, 0.15749147534370422, 0.16737057268619537, 0.17724967002868652, 0.18712876737117767, 0.19700786471366882, 0.20688694715499878, 0.21676604449748993, 0.22664514183998108, 0.23652423918247223, 0.24640333652496338, 0.25628241896629333, 0.2661615312099457, 0.27604061365127563, 0.285919725894928, 0.29579880833625793, 0.3056778907775879, 0.31555700302124023]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 16.0, 29.0, 44.0, 64.0, 153.0, 303.0, 589.0, 1120.0, 2428.0, 5775.0, 15069.0, 50161.0, 292596.0, 553929.0, 89504.0, 22276.0, 8082.0, 3431.0, 1477.0, 748.0, 313.0, 185.0, 111.0, 47.0, 29.0, 15.0, 5.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5763320922851562, -0.5584259033203125, -0.5405197143554688, -0.522613525390625, -0.5047073364257812, -0.4868011474609375, -0.46889495849609375, -0.45098876953125, -0.43308258056640625, -0.4151763916015625, -0.39727020263671875, -0.379364013671875, -0.36145782470703125, -0.3435516357421875, -0.32564544677734375, -0.3077392578125, -0.28983306884765625, -0.2719268798828125, -0.25402069091796875, -0.236114501953125, -0.21820831298828125, -0.2003021240234375, -0.18239593505859375, -0.16448974609375, -0.14658355712890625, -0.1286773681640625, -0.11077117919921875, -0.092864990234375, -0.07495880126953125, -0.0570526123046875, -0.03914642333984375, -0.021240234375, -0.00333404541015625, 0.0145721435546875, 0.03247833251953125, 0.050384521484375, 0.06829071044921875, 0.0861968994140625, 0.10410308837890625, 0.12200927734375, 0.13991546630859375, 0.1578216552734375, 0.17572784423828125, 0.193634033203125, 0.21154022216796875, 0.2294464111328125, 0.24735260009765625, 0.2652587890625, 0.28316497802734375, 0.3010711669921875, 0.31897735595703125, 0.336883544921875, 0.35478973388671875, 0.3726959228515625, 0.39060211181640625, 0.40850830078125, 0.42641448974609375, 0.4443206787109375, 0.46222686767578125, 0.480133056640625, 0.49803924560546875, 0.5159454345703125, 0.5338516235351562, 0.5517578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 9.0, 10.0, 13.0, 18.0, 29.0, 20.0, 34.0, 24.0, 40.0, 40.0, 35.0, 54.0, 57.0, 46.0, 54.0, 52.0, 62.0, 58.0, 63.0, 40.0, 45.0, 33.0, 34.0, 20.0, 16.0, 26.0, 11.0, 11.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4165840148925781, -0.39884185791015625, -0.3810997009277344, -0.3633575439453125, -0.3456153869628906, -0.32787322998046875, -0.3101310729980469, -0.292388916015625, -0.2746467590332031, -0.25690460205078125, -0.23916244506835938, -0.2214202880859375, -0.20367813110351562, -0.18593597412109375, -0.16819381713867188, -0.15045166015625, -0.13270950317382812, -0.11496734619140625, -0.09722518920898438, -0.0794830322265625, -0.061740875244140625, -0.04399871826171875, -0.026256561279296875, -0.008514404296875, 0.009227752685546875, 0.02696990966796875, 0.044712066650390625, 0.0624542236328125, 0.08019638061523438, 0.09793853759765625, 0.11568069458007812, 0.1334228515625, 0.15116500854492188, 0.16890716552734375, 0.18664932250976562, 0.2043914794921875, 0.22213363647460938, 0.23987579345703125, 0.2576179504394531, 0.275360107421875, 0.2931022644042969, 0.31084442138671875, 0.3285865783691406, 0.3463287353515625, 0.3640708923339844, 0.38181304931640625, 0.3995552062988281, 0.41729736328125, 0.4350395202636719, 0.45278167724609375, 0.4705238342285156, 0.4882659912109375, 0.5060081481933594, 0.5237503051757812, 0.5414924621582031, 0.559234619140625, 0.5769767761230469, 0.5947189331054688, 0.6124610900878906, 0.6302032470703125, 0.6479454040527344, 0.6656875610351562, 0.6834297180175781, 0.701171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 7.0, 3.0, 4.0, 11.0, 8.0, 12.0, 7.0, 16.0, 16.0, 22.0, 25.0, 25.0, 34.0, 28.0, 50.0, 81.0, 160.0, 286.0, 796.0, 5247.0, 113610.0, 903148.0, 21905.0, 1961.0, 438.0, 172.0, 102.0, 67.0, 55.0, 50.0, 35.0, 21.0, 23.0, 17.0, 22.0, 12.0, 17.0, 17.0, 10.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.3650665283203125, -1.319976806640625, -1.2748870849609375, -1.22979736328125, -1.1847076416015625, -1.139617919921875, -1.0945281982421875, -1.0494384765625, -1.0043487548828125, -0.959259033203125, -0.9141693115234375, -0.86907958984375, -0.8239898681640625, -0.778900146484375, -0.7338104248046875, -0.688720703125, -0.6436309814453125, -0.598541259765625, -0.5534515380859375, -0.50836181640625, -0.4632720947265625, -0.418182373046875, -0.3730926513671875, -0.3280029296875, -0.2829132080078125, -0.237823486328125, -0.1927337646484375, -0.14764404296875, -0.1025543212890625, -0.057464599609375, -0.0123748779296875, 0.03271484375, 0.0778045654296875, 0.122894287109375, 0.1679840087890625, 0.21307373046875, 0.2581634521484375, 0.303253173828125, 0.3483428955078125, 0.3934326171875, 0.4385223388671875, 0.483612060546875, 0.5287017822265625, 0.57379150390625, 0.6188812255859375, 0.663970947265625, 0.7090606689453125, 0.754150390625, 0.7992401123046875, 0.844329833984375, 0.8894195556640625, 0.93450927734375, 0.9795989990234375, 1.024688720703125, 1.0697784423828125, 1.1148681640625, 1.1599578857421875, 1.205047607421875, 1.2501373291015625, 1.29522705078125, 1.3403167724609375, 1.385406494140625, 1.4304962158203125, 1.4755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 7.0, 4.0, 9.0, 6.0, 13.0, 13.0, 9.0, 12.0, 20.0, 18.0, 21.0, 25.0, 22.0, 29.0, 28.0, 22.0, 41.0, 42.0, 38.0, 36.0, 43.0, 34.0, 28.0, 40.0, 52.0, 37.0, 35.0, 41.0, 31.0, 38.0, 24.0, 21.0, 21.0, 17.0, 21.0, 23.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 7.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.474609375, -0.4599800109863281, -0.44535064697265625, -0.4307212829589844, -0.4160919189453125, -0.4014625549316406, -0.38683319091796875, -0.3722038269042969, -0.357574462890625, -0.3429450988769531, -0.32831573486328125, -0.3136863708496094, -0.2990570068359375, -0.2844276428222656, -0.26979827880859375, -0.2551689147949219, -0.24053955078125, -0.22591018676757812, -0.21128082275390625, -0.19665145874023438, -0.1820220947265625, -0.16739273071289062, -0.15276336669921875, -0.13813400268554688, -0.123504638671875, -0.10887527465820312, -0.09424591064453125, -0.07961654663085938, -0.0649871826171875, -0.050357818603515625, -0.03572845458984375, -0.021099090576171875, -0.0064697265625, 0.008159637451171875, 0.02278900146484375, 0.037418365478515625, 0.0520477294921875, 0.06667709350585938, 0.08130645751953125, 0.09593582153320312, 0.110565185546875, 0.12519454956054688, 0.13982391357421875, 0.15445327758789062, 0.1690826416015625, 0.18371200561523438, 0.19834136962890625, 0.21297073364257812, 0.22760009765625, 0.24222946166992188, 0.25685882568359375, 0.2714881896972656, 0.2861175537109375, 0.3007469177246094, 0.31537628173828125, 0.3300056457519531, 0.344635009765625, 0.3592643737792969, 0.37389373779296875, 0.3885231018066406, 0.4031524658203125, 0.4177818298339844, 0.43241119384765625, 0.4470405578613281, 0.461669921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 12.0, 19.0, 23.0, 41.0, 76.0, 127.0, 240.0, 468.0, 1194.0, 3635.0, 16828.0, 145155.0, 772177.0, 91491.0, 12305.0, 2811.0, 988.0, 416.0, 215.0, 103.0, 67.0, 49.0, 26.0, 14.0, 10.0, 16.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2436084747314453, -0.23672866821289062, -0.22984886169433594, -0.22296905517578125, -0.21608924865722656, -0.20920944213867188, -0.2023296356201172, -0.1954498291015625, -0.1885700225830078, -0.18169021606445312, -0.17481040954589844, -0.16793060302734375, -0.16105079650878906, -0.15417098999023438, -0.1472911834716797, -0.140411376953125, -0.1335315704345703, -0.12665176391601562, -0.11977195739746094, -0.11289215087890625, -0.10601234436035156, -0.09913253784179688, -0.09225273132324219, -0.0853729248046875, -0.07849311828613281, -0.07161331176757812, -0.06473350524902344, -0.05785369873046875, -0.05097389221191406, -0.044094085693359375, -0.03721427917480469, -0.03033447265625, -0.023454666137695312, -0.016574859619140625, -0.009695053100585938, -0.00281524658203125, 0.0040645599365234375, 0.010944366455078125, 0.017824172973632812, 0.0247039794921875, 0.03158378601074219, 0.038463592529296875, 0.04534339904785156, 0.05222320556640625, 0.05910301208496094, 0.06598281860351562, 0.07286262512207031, 0.079742431640625, 0.08662223815917969, 0.09350204467773438, 0.10038185119628906, 0.10726165771484375, 0.11414146423339844, 0.12102127075195312, 0.1279010772705078, 0.1347808837890625, 0.1416606903076172, 0.14854049682617188, 0.15542030334472656, 0.16230010986328125, 0.16917991638183594, 0.17605972290039062, 0.1829395294189453, 0.1898193359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 5.0, 2.0, 8.0, 10.0, 15.0, 22.0, 17.0, 25.0, 36.0, 46.0, 71.0, 95.0, 147.0, 139.0, 94.0, 73.0, 47.0, 53.0, 20.0, 17.0, 13.0, 13.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.8806738555431366e-05, -2.781115472316742e-05, -2.6815570890903473e-05, -2.5819987058639526e-05, -2.482440322637558e-05, -2.3828819394111633e-05, -2.2833235561847687e-05, -2.183765172958374e-05, -2.0842067897319794e-05, -1.9846484065055847e-05, -1.88509002327919e-05, -1.7855316400527954e-05, -1.6859732568264008e-05, -1.586414873600006e-05, -1.4868564903736115e-05, -1.3872981071472168e-05, -1.2877397239208221e-05, -1.1881813406944275e-05, -1.0886229574680328e-05, -9.890645742416382e-06, -8.895061910152435e-06, -7.899478077888489e-06, -6.903894245624542e-06, -5.908310413360596e-06, -4.912726581096649e-06, -3.917142748832703e-06, -2.921558916568756e-06, -1.9259750843048096e-06, -9.30391252040863e-07, 6.51925802230835e-08, 1.06077641248703e-06, 2.0563602447509766e-06, 3.051944077014923e-06, 4.04752790927887e-06, 5.043111741542816e-06, 6.038695573806763e-06, 7.034279406070709e-06, 8.029863238334656e-06, 9.025447070598602e-06, 1.0021030902862549e-05, 1.1016614735126495e-05, 1.2012198567390442e-05, 1.3007782399654388e-05, 1.4003366231918335e-05, 1.4998950064182281e-05, 1.5994533896446228e-05, 1.6990117728710175e-05, 1.798570156097412e-05, 1.8981285393238068e-05, 1.9976869225502014e-05, 2.097245305776596e-05, 2.1968036890029907e-05, 2.2963620722293854e-05, 2.39592045545578e-05, 2.4954788386821747e-05, 2.5950372219085693e-05, 2.694595605134964e-05, 2.7941539883613586e-05, 2.8937123715877533e-05, 2.993270754814148e-05, 3.0928291380405426e-05, 3.192387521266937e-05, 3.291945904493332e-05, 3.3915042877197266e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 9.0, 18.0, 20.0, 31.0, 65.0, 120.0, 228.0, 480.0, 1172.0, 3874.0, 20944.0, 248157.0, 709534.0, 53431.0, 7336.0, 1801.0, 641.0, 282.0, 156.0, 67.0, 64.0, 34.0, 27.0, 16.0, 10.0, 8.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3037109375, -0.2961578369140625, -0.288604736328125, -0.2810516357421875, -0.27349853515625, -0.2659454345703125, -0.258392333984375, -0.2508392333984375, -0.2432861328125, -0.2357330322265625, -0.228179931640625, -0.2206268310546875, -0.21307373046875, -0.2055206298828125, -0.197967529296875, -0.1904144287109375, -0.182861328125, -0.1753082275390625, -0.167755126953125, -0.1602020263671875, -0.15264892578125, -0.1450958251953125, -0.137542724609375, -0.1299896240234375, -0.1224365234375, -0.1148834228515625, -0.107330322265625, -0.0997772216796875, -0.09222412109375, -0.0846710205078125, -0.077117919921875, -0.0695648193359375, -0.06201171875, -0.0544586181640625, -0.046905517578125, -0.0393524169921875, -0.03179931640625, -0.0242462158203125, -0.016693115234375, -0.0091400146484375, -0.0015869140625, 0.0059661865234375, 0.013519287109375, 0.0210723876953125, 0.02862548828125, 0.0361785888671875, 0.043731689453125, 0.0512847900390625, 0.058837890625, 0.0663909912109375, 0.073944091796875, 0.0814971923828125, 0.08905029296875, 0.0966033935546875, 0.104156494140625, 0.1117095947265625, 0.1192626953125, 0.1268157958984375, 0.134368896484375, 0.1419219970703125, 0.14947509765625, 0.1570281982421875, 0.164581298828125, 0.1721343994140625, 0.1796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 13.0, 12.0, 21.0, 18.0, 37.0, 44.0, 41.0, 61.0, 87.0, 96.0, 108.0, 85.0, 63.0, 61.0, 56.0, 49.0, 37.0, 20.0, 19.0, 15.0, 8.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05999755859375, -0.05782318115234375, -0.0556488037109375, -0.05347442626953125, -0.051300048828125, -0.04912567138671875, -0.0469512939453125, -0.04477691650390625, -0.0426025390625, -0.04042816162109375, -0.0382537841796875, -0.03607940673828125, -0.033905029296875, -0.03173065185546875, -0.0295562744140625, -0.02738189697265625, -0.02520751953125, -0.02303314208984375, -0.0208587646484375, -0.01868438720703125, -0.016510009765625, -0.01433563232421875, -0.0121612548828125, -0.00998687744140625, -0.0078125, -0.00563812255859375, -0.0034637451171875, -0.00128936767578125, 0.000885009765625, 0.00305938720703125, 0.0052337646484375, 0.00740814208984375, 0.00958251953125, 0.01175689697265625, 0.0139312744140625, 0.01610565185546875, 0.018280029296875, 0.02045440673828125, 0.0226287841796875, 0.02480316162109375, 0.0269775390625, 0.02915191650390625, 0.0313262939453125, 0.03350067138671875, 0.035675048828125, 0.03784942626953125, 0.0400238037109375, 0.04219818115234375, 0.04437255859375, 0.04654693603515625, 0.0487213134765625, 0.05089569091796875, 0.053070068359375, 0.05524444580078125, 0.0574188232421875, 0.05959320068359375, 0.061767578125, 0.06394195556640625, 0.0661163330078125, 0.06829071044921875, 0.070465087890625, 0.07263946533203125, 0.0748138427734375, 0.07698822021484375, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 62.0, 648.0, 275.0, 26.0, 3.0], "bins": [-15.009307861328125, -14.762321472167969, -14.515335083007812, -14.26834774017334, -14.021361351013184, -13.774374961853027, -13.527387619018555, -13.280401229858398, -13.033414840698242, -12.786428451538086, -12.53944206237793, -12.292454719543457, -12.0454683303833, -11.798481941223145, -11.551494598388672, -11.304508209228516, -11.05752182006836, -10.810535430908203, -10.563549041748047, -10.316561698913574, -10.069575309753418, -9.822588920593262, -9.575601577758789, -9.328615188598633, -9.081628799438477, -8.83464241027832, -8.587656021118164, -8.340668678283691, -8.093682289123535, -7.846695899963379, -7.5997090339660645, -7.35272216796875, -7.1057353019714355, -6.858748435974121, -6.611762046813965, -6.364775657653809, -6.117788791656494, -5.87080192565918, -5.623815536499023, -5.376829147338867, -5.129842281341553, -4.882855415344238, -4.635869026184082, -4.388882637023926, -4.141895771026611, -3.894909143447876, -3.6479225158691406, -3.4009358882904053, -3.15394926071167, -2.9069626331329346, -2.659976005554199, -2.412989377975464, -2.1660027503967285, -1.9190161228179932, -1.6720294952392578, -1.4250428676605225, -1.1780563592910767, -0.9310697317123413, -0.684083104133606, -0.4370964765548706, -0.19010984897613525, 0.0568767786026001, 0.30386340618133545, 0.5508500337600708, 0.7978366613388062]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 12.0, 15.0, 11.0, 20.0, 12.0, 26.0, 25.0, 26.0, 30.0, 28.0, 38.0, 34.0, 34.0, 50.0, 44.0, 38.0, 36.0, 47.0, 46.0, 41.0, 36.0, 46.0, 39.0, 38.0, 31.0, 30.0, 24.0, 26.0, 14.0, 15.0, 13.0, 10.0, 9.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316761255264282, -0.8047030568122864, -0.7777299880981445, -0.7507569193840027, -0.7237838506698608, -0.6968108415603638, -0.6698377132415771, -0.6428647041320801, -0.6158916354179382, -0.5889185667037964, -0.5619454979896545, -0.5349724292755127, -0.5079993605613708, -0.4810263216495514, -0.45405325293540955, -0.4270802140235901, -0.40010711550712585, -0.373134046792984, -0.34616097807884216, -0.3191879391670227, -0.29221487045288086, -0.265241801738739, -0.23826873302459717, -0.21129567921161652, -0.18432261049747467, -0.15734954178333282, -0.13037648797035217, -0.10340341925621033, -0.07643035799264908, -0.04945729672908783, -0.022484228014945984, 0.004488825798034668, 0.031461894512176514, 0.05843495577573776, 0.08540801703929901, 0.11238108575344086, 0.1393541395664215, 0.16632720828056335, 0.1933002769947052, 0.22027333080768585, 0.2472463995218277, 0.27421945333480835, 0.3011925220489502, 0.32816559076309204, 0.3551386594772339, 0.38211172819137573, 0.4090847969055176, 0.43605783581733704, 0.4630309045314789, 0.4900039732456207, 0.5169770121574402, 0.543950080871582, 0.5709231495857239, 0.5978962182998657, 0.6248692870140076, 0.6518423557281494, 0.6788154244422913, 0.7057884931564331, 0.732761561870575, 0.7597346305847168, 0.7867076992988586, 0.8136807680130005, 0.8406537771224976, 0.8676268458366394, 0.8945999145507812]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 17.0, 14.0, 21.0, 44.0, 41.0, 89.0, 141.0, 228.0, 408.0, 809.0, 1823.0, 5311.0, 23220.0, 345800.0, 3379263.0, 403344.0, 24337.0, 5541.0, 1904.0, 863.0, 405.0, 268.0, 149.0, 88.0, 45.0, 30.0, 21.0, 20.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.894989013671875, -0.86566162109375, -0.836334228515625, -0.8070068359375, -0.777679443359375, -0.74835205078125, -0.719024658203125, -0.689697265625, -0.660369873046875, -0.63104248046875, -0.601715087890625, -0.5723876953125, -0.543060302734375, -0.51373291015625, -0.484405517578125, -0.455078125, -0.425750732421875, -0.39642333984375, -0.367095947265625, -0.3377685546875, -0.308441162109375, -0.27911376953125, -0.249786376953125, -0.220458984375, -0.191131591796875, -0.16180419921875, -0.132476806640625, -0.1031494140625, -0.073822021484375, -0.04449462890625, -0.015167236328125, 0.01416015625, 0.043487548828125, 0.07281494140625, 0.102142333984375, 0.1314697265625, 0.160797119140625, 0.19012451171875, 0.219451904296875, 0.248779296875, 0.278106689453125, 0.30743408203125, 0.336761474609375, 0.3660888671875, 0.395416259765625, 0.42474365234375, 0.454071044921875, 0.4833984375, 0.512725830078125, 0.54205322265625, 0.571380615234375, 0.6007080078125, 0.630035400390625, 0.65936279296875, 0.688690185546875, 0.718017578125, 0.747344970703125, 0.77667236328125, 0.805999755859375, 0.8353271484375, 0.864654541015625, 0.89398193359375, 0.923309326171875, 0.95263671875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 9.0, 7.0, 21.0, 7.0, 23.0, 9.0, 18.0, 27.0, 25.0, 44.0, 19.0, 25.0, 25.0, 29.0, 26.0, 46.0, 25.0, 44.0, 34.0, 39.0, 47.0, 29.0, 28.0, 32.0, 38.0, 43.0, 39.0, 23.0, 28.0, 19.0, 21.0, 21.0, 16.0, 16.0, 15.0, 12.0, 8.0, 6.0, 2.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.281982421875, -0.2727813720703125, -0.263580322265625, -0.2543792724609375, -0.24517822265625, -0.2359771728515625, -0.226776123046875, -0.2175750732421875, -0.2083740234375, -0.1991729736328125, -0.189971923828125, -0.1807708740234375, -0.17156982421875, -0.1623687744140625, -0.153167724609375, -0.1439666748046875, -0.134765625, -0.1255645751953125, -0.116363525390625, -0.1071624755859375, -0.09796142578125, -0.0887603759765625, -0.079559326171875, -0.0703582763671875, -0.0611572265625, -0.0519561767578125, -0.042755126953125, -0.0335540771484375, -0.02435302734375, -0.0151519775390625, -0.005950927734375, 0.0032501220703125, 0.012451171875, 0.0216522216796875, 0.030853271484375, 0.0400543212890625, 0.04925537109375, 0.0584564208984375, 0.067657470703125, 0.0768585205078125, 0.0860595703125, 0.0952606201171875, 0.104461669921875, 0.1136627197265625, 0.12286376953125, 0.1320648193359375, 0.141265869140625, 0.1504669189453125, 0.15966796875, 0.1688690185546875, 0.178070068359375, 0.1872711181640625, 0.19647216796875, 0.2056732177734375, 0.214874267578125, 0.2240753173828125, 0.2332763671875, 0.2424774169921875, 0.251678466796875, 0.2608795166015625, 0.27008056640625, 0.2792816162109375, 0.288482666015625, 0.2976837158203125, 0.306884765625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 13.0, 6.0, 15.0, 18.0, 19.0, 32.0, 38.0, 53.0, 90.0, 135.0, 306.0, 820.0, 3401.0, 43035.0, 4021819.0, 117151.0, 5327.0, 1080.0, 361.0, 173.0, 105.0, 72.0, 42.0, 37.0, 22.0, 19.0, 7.0, 12.0, 11.0, 10.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.501251220703125, -1.44879150390625, -1.396331787109375, -1.3438720703125, -1.291412353515625, -1.23895263671875, -1.186492919921875, -1.134033203125, -1.081573486328125, -1.02911376953125, -0.976654052734375, -0.9241943359375, -0.871734619140625, -0.81927490234375, -0.766815185546875, -0.71435546875, -0.661895751953125, -0.60943603515625, -0.556976318359375, -0.5045166015625, -0.452056884765625, -0.39959716796875, -0.347137451171875, -0.294677734375, -0.242218017578125, -0.18975830078125, -0.137298583984375, -0.0848388671875, -0.032379150390625, 0.02008056640625, 0.072540283203125, 0.125, 0.177459716796875, 0.22991943359375, 0.282379150390625, 0.3348388671875, 0.387298583984375, 0.43975830078125, 0.492218017578125, 0.544677734375, 0.597137451171875, 0.64959716796875, 0.702056884765625, 0.7545166015625, 0.806976318359375, 0.85943603515625, 0.911895751953125, 0.96435546875, 1.016815185546875, 1.06927490234375, 1.121734619140625, 1.1741943359375, 1.226654052734375, 1.27911376953125, 1.331573486328125, 1.384033203125, 1.436492919921875, 1.48895263671875, 1.541412353515625, 1.5938720703125, 1.646331787109375, 1.69879150390625, 1.751251220703125, 1.8037109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 6.0, 8.0, 17.0, 43.0, 49.0, 80.0, 138.0, 287.0, 494.0, 932.0, 930.0, 501.0, 231.0, 139.0, 82.0, 30.0, 29.0, 16.0, 15.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3156585693359375, -0.307342529296875, -0.2990264892578125, -0.29071044921875, -0.2823944091796875, -0.274078369140625, -0.2657623291015625, -0.2574462890625, -0.2491302490234375, -0.240814208984375, -0.2324981689453125, -0.22418212890625, -0.2158660888671875, -0.207550048828125, -0.1992340087890625, -0.19091796875, -0.1826019287109375, -0.174285888671875, -0.1659698486328125, -0.15765380859375, -0.1493377685546875, -0.141021728515625, -0.1327056884765625, -0.1243896484375, -0.1160736083984375, -0.107757568359375, -0.0994415283203125, -0.09112548828125, -0.0828094482421875, -0.074493408203125, -0.0661773681640625, -0.057861328125, -0.0495452880859375, -0.041229248046875, -0.0329132080078125, -0.02459716796875, -0.0162811279296875, -0.007965087890625, 0.0003509521484375, 0.0086669921875, 0.0169830322265625, 0.025299072265625, 0.0336151123046875, 0.04193115234375, 0.0502471923828125, 0.058563232421875, 0.0668792724609375, 0.0751953125, 0.0835113525390625, 0.091827392578125, 0.1001434326171875, 0.10845947265625, 0.1167755126953125, 0.125091552734375, 0.1334075927734375, 0.1417236328125, 0.1500396728515625, 0.158355712890625, 0.1666717529296875, 0.17498779296875, 0.1833038330078125, 0.191619873046875, 0.1999359130859375, 0.208251953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 2.0, 6.0, 12.0, 17.0, 16.0, 23.0, 35.0, 46.0, 54.0, 76.0, 81.0, 100.0, 89.0, 85.0, 84.0, 65.0, 57.0, 35.0, 36.0, 19.0, 20.0, 11.0, 13.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.571103572845459, -0.5502992272377014, -0.5294948816299438, -0.5086905360221863, -0.4878861606121063, -0.46708181500434875, -0.4462774693965912, -0.42547309398651123, -0.40466874837875366, -0.3838644027709961, -0.3630600571632385, -0.34225571155548096, -0.321451336145401, -0.30064699053764343, -0.27984264492988586, -0.2590382695198059, -0.23823395371437073, -0.21742960810661316, -0.1966252475976944, -0.17582090198993683, -0.15501654148101807, -0.1342121958732605, -0.11340785026550293, -0.09260348975658417, -0.0717991441488266, -0.050994791090488434, -0.030190441757440567, -0.0093860924243927, 0.011418260633945465, 0.03222261369228363, 0.0530269593000412, 0.07383131980895996, 0.09463566541671753, 0.1154400184750557, 0.13624437153339386, 0.15704871714115143, 0.1778530776500702, 0.19865742325782776, 0.21946176886558533, 0.2402661293745041, 0.26107048988342285, 0.2818748354911804, 0.302679181098938, 0.32348352670669556, 0.3442879021167755, 0.3650922477245331, 0.38589659333229065, 0.4067009687423706, 0.4275052845478058, 0.44830963015556335, 0.4691139757633209, 0.4899183511734009, 0.5107226967811584, 0.531527042388916, 0.5523313879966736, 0.5731357336044312, 0.5939400792121887, 0.6147444248199463, 0.6355487704277039, 0.6563531160354614, 0.677157461643219, 0.6979618072509766, 0.7187662124633789, 0.7395705580711365, 0.760374903678894]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 3.0, 2.0, 7.0, 7.0, 11.0, 8.0, 6.0, 12.0, 20.0, 23.0, 21.0, 21.0, 35.0, 28.0, 30.0, 35.0, 46.0, 35.0, 33.0, 39.0, 45.0, 48.0, 42.0, 45.0, 27.0, 33.0, 30.0, 36.0, 33.0, 29.0, 38.0, 19.0, 32.0, 25.0, 18.0, 15.0, 12.0, 7.0, 14.0, 6.0, 3.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32858216762542725, -0.31640568375587463, -0.304229199886322, -0.2920527458190918, -0.2798762619495392, -0.2676997780799866, -0.25552329421043396, -0.24334681034088135, -0.23117034137248993, -0.21899385750293732, -0.2068173885345459, -0.1946409046649933, -0.18246442079544067, -0.17028795182704926, -0.15811146795749664, -0.14593499898910522, -0.1337585151195526, -0.1215820387005806, -0.10940556228160858, -0.09722907841205597, -0.08505260199308395, -0.07287612557411194, -0.060699641704559326, -0.04852316528558731, -0.036346688866615295, -0.02417021058499813, -0.011993732303380966, 0.00018274784088134766, 0.012359224259853363, 0.02453570067882538, 0.03671218454837799, 0.048888660967350006, 0.061065107583999634, 0.07324158400297165, 0.08541806042194366, 0.09759454429149628, 0.10977102071046829, 0.12194749712944031, 0.13412398099899292, 0.14630046486854553, 0.15847693383693695, 0.17065341770648956, 0.18282988667488098, 0.1950063705444336, 0.2071828544139862, 0.21935932338237762, 0.23153580725193024, 0.24371227622032166, 0.25588876008987427, 0.2680652439594269, 0.2802417278289795, 0.2924181818962097, 0.30459466576576233, 0.31677114963531494, 0.32894763350486755, 0.34112411737442017, 0.3533005714416504, 0.365477055311203, 0.3776535391807556, 0.38982999324798584, 0.40200647711753845, 0.41418296098709106, 0.4263594448566437, 0.4385359287261963, 0.4507124125957489]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 17.0, 21.0, 29.0, 45.0, 79.0, 88.0, 158.0, 283.0, 467.0, 834.0, 1704.0, 3653.0, 8698.0, 23171.0, 70863.0, 229989.0, 417614.0, 195996.0, 60235.0, 20295.0, 7792.0, 3141.0, 1513.0, 791.0, 396.0, 253.0, 131.0, 92.0, 59.0, 44.0, 25.0, 22.0, 17.0, 10.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07629585266113281, -0.07361221313476562, -0.07092857360839844, -0.06824493408203125, -0.06556129455566406, -0.06287765502929688, -0.06019401550292969, -0.0575103759765625, -0.05482673645019531, -0.052143096923828125, -0.04945945739746094, -0.04677581787109375, -0.04409217834472656, -0.041408538818359375, -0.03872489929199219, -0.036041259765625, -0.03335762023925781, -0.030673980712890625, -0.027990341186523438, -0.02530670166015625, -0.022623062133789062, -0.019939422607421875, -0.017255783081054688, -0.0145721435546875, -0.011888504028320312, -0.009204864501953125, -0.0065212249755859375, -0.00383758544921875, -0.0011539459228515625, 0.001529693603515625, 0.0042133331298828125, 0.00689697265625, 0.009580612182617188, 0.012264251708984375, 0.014947891235351562, 0.01763153076171875, 0.020315170288085938, 0.022998809814453125, 0.025682449340820312, 0.0283660888671875, 0.031049728393554688, 0.033733367919921875, 0.03641700744628906, 0.03910064697265625, 0.04178428649902344, 0.044467926025390625, 0.04715156555175781, 0.049835205078125, 0.05251884460449219, 0.055202484130859375, 0.05788612365722656, 0.06056976318359375, 0.06325340270996094, 0.06593704223632812, 0.06862068176269531, 0.0713043212890625, 0.07398796081542969, 0.07667160034179688, 0.07935523986816406, 0.08203887939453125, 0.08472251892089844, 0.08740615844726562, 0.09008979797363281, 0.0927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 14.0, 10.0, 10.0, 16.0, 9.0, 34.0, 32.0, 33.0, 28.0, 42.0, 49.0, 54.0, 43.0, 51.0, 58.0, 55.0, 61.0, 33.0, 43.0, 36.0, 41.0, 38.0, 27.0, 36.0, 28.0, 23.0, 18.0, 16.0, 11.0, 9.0, 10.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.253692626953125, -0.24395751953125, -0.234222412109375, -0.2244873046875, -0.214752197265625, -0.20501708984375, -0.195281982421875, -0.185546875, -0.175811767578125, -0.16607666015625, -0.156341552734375, -0.1466064453125, -0.136871337890625, -0.12713623046875, -0.117401123046875, -0.107666015625, -0.097930908203125, -0.08819580078125, -0.078460693359375, -0.0687255859375, -0.058990478515625, -0.04925537109375, -0.039520263671875, -0.02978515625, -0.020050048828125, -0.01031494140625, -0.000579833984375, 0.0091552734375, 0.018890380859375, 0.02862548828125, 0.038360595703125, 0.048095703125, 0.057830810546875, 0.06756591796875, 0.077301025390625, 0.0870361328125, 0.096771240234375, 0.10650634765625, 0.116241455078125, 0.1259765625, 0.135711669921875, 0.14544677734375, 0.155181884765625, 0.1649169921875, 0.174652099609375, 0.18438720703125, 0.194122314453125, 0.203857421875, 0.213592529296875, 0.22332763671875, 0.233062744140625, 0.2427978515625, 0.252532958984375, 0.26226806640625, 0.272003173828125, 0.28173828125, 0.291473388671875, 0.30120849609375, 0.310943603515625, 0.3206787109375, 0.330413818359375, 0.34014892578125, 0.349884033203125, 0.359619140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 17.0, 14.0, 36.0, 38.0, 56.0, 82.0, 142.0, 199.0, 343.0, 616.0, 1133.0, 2317.0, 5167.0, 12620.0, 35839.0, 113749.0, 325108.0, 352513.0, 131236.0, 41650.0, 14397.0, 5711.0, 2622.0, 1250.0, 651.0, 354.0, 239.0, 143.0, 107.0, 50.0, 41.0, 29.0, 22.0, 10.0, 14.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.058951377868652344, -0.05650138854980469, -0.05405139923095703, -0.051601409912109375, -0.04915142059326172, -0.04670143127441406, -0.044251441955566406, -0.04180145263671875, -0.039351463317871094, -0.03690147399902344, -0.03445148468017578, -0.032001495361328125, -0.02955150604248047, -0.027101516723632812, -0.024651527404785156, -0.0222015380859375, -0.019751548767089844, -0.017301559448242188, -0.014851570129394531, -0.012401580810546875, -0.009951591491699219, -0.0075016021728515625, -0.005051612854003906, -0.00260162353515625, -0.00015163421630859375, 0.0022983551025390625, 0.004748344421386719, 0.007198333740234375, 0.009648323059082031, 0.012098312377929688, 0.014548301696777344, 0.016998291015625, 0.019448280334472656, 0.021898269653320312, 0.02434825897216797, 0.026798248291015625, 0.02924823760986328, 0.03169822692871094, 0.034148216247558594, 0.03659820556640625, 0.039048194885253906, 0.04149818420410156, 0.04394817352294922, 0.046398162841796875, 0.04884815216064453, 0.05129814147949219, 0.053748130798339844, 0.0561981201171875, 0.058648109436035156, 0.06109809875488281, 0.06354808807373047, 0.06599807739257812, 0.06844806671142578, 0.07089805603027344, 0.0733480453491211, 0.07579803466796875, 0.0782480239868164, 0.08069801330566406, 0.08314800262451172, 0.08559799194335938, 0.08804798126220703, 0.09049797058105469, 0.09294795989990234, 0.09539794921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 9.0, 8.0, 20.0, 18.0, 23.0, 18.0, 21.0, 35.0, 33.0, 33.0, 55.0, 39.0, 56.0, 63.0, 47.0, 56.0, 41.0, 36.0, 50.0, 43.0, 35.0, 38.0, 32.0, 29.0, 27.0, 30.0, 16.0, 12.0, 11.0, 13.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.583526611328125, -0.56549072265625, -0.547454833984375, -0.5294189453125, -0.511383056640625, -0.49334716796875, -0.475311279296875, -0.457275390625, -0.439239501953125, -0.42120361328125, -0.403167724609375, -0.3851318359375, -0.367095947265625, -0.34906005859375, -0.331024169921875, -0.31298828125, -0.294952392578125, -0.27691650390625, -0.258880615234375, -0.2408447265625, -0.222808837890625, -0.20477294921875, -0.186737060546875, -0.168701171875, -0.150665283203125, -0.13262939453125, -0.114593505859375, -0.0965576171875, -0.078521728515625, -0.06048583984375, -0.042449951171875, -0.0244140625, -0.006378173828125, 0.01165771484375, 0.029693603515625, 0.0477294921875, 0.065765380859375, 0.08380126953125, 0.101837158203125, 0.119873046875, 0.137908935546875, 0.15594482421875, 0.173980712890625, 0.1920166015625, 0.210052490234375, 0.22808837890625, 0.246124267578125, 0.26416015625, 0.282196044921875, 0.30023193359375, 0.318267822265625, 0.3363037109375, 0.354339599609375, 0.37237548828125, 0.390411376953125, 0.408447265625, 0.426483154296875, 0.44451904296875, 0.462554931640625, 0.4805908203125, 0.498626708984375, 0.51666259765625, 0.534698486328125, 0.552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 22.0, 38.0, 53.0, 105.0, 167.0, 326.0, 544.0, 1195.0, 2619.0, 6243.0, 18732.0, 77187.0, 395437.0, 427598.0, 86024.0, 20185.0, 6732.0, 2677.0, 1178.0, 628.0, 336.0, 186.0, 107.0, 66.0, 39.0, 33.0, 15.0, 17.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040771484375, -0.039726972579956055, -0.03868246078491211, -0.037637948989868164, -0.03659343719482422, -0.03554892539978027, -0.03450441360473633, -0.03345990180969238, -0.03241539001464844, -0.03137087821960449, -0.030326366424560547, -0.0292818546295166, -0.028237342834472656, -0.02719283103942871, -0.026148319244384766, -0.02510380744934082, -0.024059295654296875, -0.02301478385925293, -0.021970272064208984, -0.02092576026916504, -0.019881248474121094, -0.01883673667907715, -0.017792224884033203, -0.016747713088989258, -0.015703201293945312, -0.014658689498901367, -0.013614177703857422, -0.012569665908813477, -0.011525154113769531, -0.010480642318725586, -0.00943613052368164, -0.008391618728637695, -0.00734710693359375, -0.006302595138549805, -0.005258083343505859, -0.004213571548461914, -0.0031690597534179688, -0.0021245479583740234, -0.0010800361633300781, -3.552436828613281e-05, 0.0010089874267578125, 0.002053499221801758, 0.003098011016845703, 0.0041425228118896484, 0.005187034606933594, 0.006231546401977539, 0.007276058197021484, 0.00832056999206543, 0.009365081787109375, 0.01040959358215332, 0.011454105377197266, 0.012498617172241211, 0.013543128967285156, 0.014587640762329102, 0.015632152557373047, 0.016676664352416992, 0.017721176147460938, 0.018765687942504883, 0.019810199737548828, 0.020854711532592773, 0.02189922332763672, 0.022943735122680664, 0.02398824691772461, 0.025032758712768555, 0.0260772705078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 8.0, 4.0, 6.0, 6.0, 4.0, 13.0, 12.0, 19.0, 32.0, 32.0, 58.0, 56.0, 78.0, 81.0, 104.0, 93.0, 101.0, 82.0, 54.0, 45.0, 36.0, 34.0, 13.0, 4.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7437152564525604e-05, -1.681409776210785e-05, -1.6191042959690094e-05, -1.556798815727234e-05, -1.4944933354854584e-05, -1.4321878552436829e-05, -1.3698823750019073e-05, -1.3075768947601318e-05, -1.2452714145183563e-05, -1.1829659342765808e-05, -1.1206604540348053e-05, -1.0583549737930298e-05, -9.960494935512543e-06, -9.337440133094788e-06, -8.714385330677032e-06, -8.091330528259277e-06, -7.468275725841522e-06, -6.845220923423767e-06, -6.222166121006012e-06, -5.599111318588257e-06, -4.976056516170502e-06, -4.353001713752747e-06, -3.7299469113349915e-06, -3.1068921089172363e-06, -2.483837306499481e-06, -1.860782504081726e-06, -1.237727701663971e-06, -6.146728992462158e-07, 8.381903171539307e-09, 6.314367055892944e-07, 1.2544915080070496e-06, 1.8775463104248047e-06, 2.50060111284256e-06, 3.123655915260315e-06, 3.74671071767807e-06, 4.369765520095825e-06, 4.99282032251358e-06, 5.6158751249313354e-06, 6.2389299273490906e-06, 6.861984729766846e-06, 7.485039532184601e-06, 8.108094334602356e-06, 8.731149137020111e-06, 9.354203939437866e-06, 9.977258741855621e-06, 1.0600313544273376e-05, 1.1223368346691132e-05, 1.1846423149108887e-05, 1.2469477951526642e-05, 1.3092532753944397e-05, 1.3715587556362152e-05, 1.4338642358779907e-05, 1.4961697161197662e-05, 1.5584751963615417e-05, 1.6207806766033173e-05, 1.6830861568450928e-05, 1.7453916370868683e-05, 1.8076971173286438e-05, 1.8700025975704193e-05, 1.9323080778121948e-05, 1.9946135580539703e-05, 2.056919038295746e-05, 2.1192245185375214e-05, 2.181529998779297e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 11.0, 12.0, 17.0, 32.0, 61.0, 102.0, 142.0, 234.0, 462.0, 829.0, 1798.0, 4314.0, 11887.0, 38347.0, 161437.0, 489571.0, 254919.0, 57533.0, 16368.0, 5694.0, 2386.0, 1096.0, 596.0, 273.0, 164.0, 95.0, 50.0, 31.0, 16.0, 21.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297088623046875, -0.02877020835876465, -0.027831554412841797, -0.026892900466918945, -0.025954246520996094, -0.025015592575073242, -0.02407693862915039, -0.02313828468322754, -0.022199630737304688, -0.021260976791381836, -0.020322322845458984, -0.019383668899536133, -0.01844501495361328, -0.01750636100769043, -0.016567707061767578, -0.015629053115844727, -0.014690399169921875, -0.013751745223999023, -0.012813091278076172, -0.01187443733215332, -0.010935783386230469, -0.009997129440307617, -0.009058475494384766, -0.008119821548461914, -0.0071811676025390625, -0.006242513656616211, -0.005303859710693359, -0.004365205764770508, -0.0034265518188476562, -0.0024878978729248047, -0.0015492439270019531, -0.0006105899810791016, 0.00032806396484375, 0.0012667179107666016, 0.002205371856689453, 0.0031440258026123047, 0.004082679748535156, 0.005021333694458008, 0.005959987640380859, 0.006898641586303711, 0.007837295532226562, 0.008775949478149414, 0.009714603424072266, 0.010653257369995117, 0.011591911315917969, 0.01253056526184082, 0.013469219207763672, 0.014407873153686523, 0.015346527099609375, 0.016285181045532227, 0.017223834991455078, 0.01816248893737793, 0.01910114288330078, 0.020039796829223633, 0.020978450775146484, 0.021917104721069336, 0.022855758666992188, 0.02379441261291504, 0.02473306655883789, 0.025671720504760742, 0.026610374450683594, 0.027549028396606445, 0.028487682342529297, 0.02942633628845215, 0.030364990234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 4.0, 5.0, 9.0, 13.0, 14.0, 16.0, 27.0, 44.0, 44.0, 47.0, 72.0, 93.0, 85.0, 84.0, 91.0, 59.0, 67.0, 54.0, 38.0, 33.0, 18.0, 23.0, 12.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0082244873046875, -0.007966399192810059, -0.007708311080932617, -0.007450222969055176, -0.007192134857177734, -0.006934046745300293, -0.0066759586334228516, -0.00641787052154541, -0.006159782409667969, -0.005901694297790527, -0.005643606185913086, -0.0053855180740356445, -0.005127429962158203, -0.004869341850280762, -0.00461125373840332, -0.004353165626525879, -0.0040950775146484375, -0.003836989402770996, -0.0035789012908935547, -0.0033208131790161133, -0.003062725067138672, -0.0028046369552612305, -0.002546548843383789, -0.0022884607315063477, -0.0020303726196289062, -0.0017722845077514648, -0.0015141963958740234, -0.001256108283996582, -0.0009980201721191406, -0.0007399320602416992, -0.0004818439483642578, -0.0002237558364868164, 3.4332275390625e-05, 0.0002924203872680664, 0.0005505084991455078, 0.0008085966110229492, 0.0010666847229003906, 0.001324772834777832, 0.0015828609466552734, 0.0018409490585327148, 0.0020990371704101562, 0.0023571252822875977, 0.002615213394165039, 0.0028733015060424805, 0.003131389617919922, 0.0033894777297973633, 0.0036475658416748047, 0.003905653953552246, 0.0041637420654296875, 0.004421830177307129, 0.00467991828918457, 0.004938006401062012, 0.005196094512939453, 0.0054541826248168945, 0.005712270736694336, 0.005970358848571777, 0.006228446960449219, 0.00648653507232666, 0.0067446231842041016, 0.007002711296081543, 0.007260799407958984, 0.007518887519836426, 0.007776975631713867, 0.008035063743591309, 0.00829315185546875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 18.0, 25.0, 58.0, 84.0, 154.0, 203.0, 165.0, 129.0, 62.0, 52.0, 17.0, 11.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5143777132034302, -0.489646315574646, -0.4649149477481842, -0.4401835501194, -0.41545215249061584, -0.39072078466415405, -0.3659893870353699, -0.3412579894065857, -0.3165265917778015, -0.29179519414901733, -0.26706382632255554, -0.24233242869377136, -0.21760103106498718, -0.1928696483373642, -0.1681382656097412, -0.14340686798095703, -0.11867550015449524, -0.09394410997629166, -0.06921271979808807, -0.04448133707046509, -0.019749946892261505, 0.004981443285942078, 0.029712826013565063, 0.05444422364234924, 0.07917560636997223, 0.10390699654817581, 0.1286383867263794, 0.15336976945400238, 0.17810115218162537, 0.20283254981040955, 0.22756393253803253, 0.2522953152656555, 0.2770267128944397, 0.3017581105232239, 0.32648947834968567, 0.35122087597846985, 0.37595227360725403, 0.4006836414337158, 0.4254150390625, 0.4501464366912842, 0.47487783432006836, 0.49960923194885254, 0.5243406295776367, 0.5490720272064209, 0.5738033652305603, 0.5985347628593445, 0.6232661604881287, 0.6479975581169128, 0.6727288961410522, 0.6974602937698364, 0.7221916913986206, 0.7469230890274048, 0.7716544270515442, 0.7963858246803284, 0.8211172223091125, 0.8458486199378967, 0.8705800175666809, 0.8953114151954651, 0.9200428128242493, 0.9447741508483887, 0.9695055484771729, 0.994236946105957, 1.0189683437347412, 1.0436997413635254, 1.0684311389923096]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 12.0, 10.0, 14.0, 19.0, 25.0, 25.0, 30.0, 33.0, 41.0, 32.0, 47.0, 46.0, 38.0, 54.0, 57.0, 53.0, 46.0, 39.0, 27.0, 33.0, 37.0, 51.0, 35.0, 32.0, 22.0, 23.0, 24.0, 16.0, 10.0, 8.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23610919713974, -0.22735466063022614, -0.21860012412071228, -0.20984557271003723, -0.20109103620052338, -0.19233649969100952, -0.18358194828033447, -0.17482741177082062, -0.16607287526130676, -0.1573183387517929, -0.14856380224227905, -0.139809250831604, -0.13105471432209015, -0.1223001778125763, -0.11354563385248184, -0.10479108989238739, -0.09603655338287354, -0.08728201687335968, -0.07852747291326523, -0.06977292895317078, -0.06101839244365692, -0.05226385220885277, -0.043509311974048615, -0.03475477173924446, -0.026000231504440308, -0.017245691269636154, -0.008491151034832, 0.0002633891999721527, 0.009017929434776306, 0.01777246966958046, 0.026527009904384613, 0.035281550139188766, 0.04403609037399292, 0.05279063060879707, 0.06154517084360123, 0.07029971480369568, 0.07905425131320953, 0.08780878782272339, 0.09656333178281784, 0.10531787574291229, 0.11407241225242615, 0.12282694876194, 0.13158148527145386, 0.1403360366821289, 0.14909057319164276, 0.15784510970115662, 0.16659966111183167, 0.17535419762134552, 0.18410873413085938, 0.19286327064037323, 0.20161780714988708, 0.21037235856056213, 0.219126895070076, 0.22788143157958984, 0.2366359829902649, 0.24539051949977875, 0.2541450560092926, 0.26289960741996765, 0.2716541290283203, 0.28040868043899536, 0.2891632318496704, 0.29791775345802307, 0.3066723048686981, 0.3154268264770508, 0.32418137788772583]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 12.0, 7.0, 18.0, 53.0, 110.0, 412.0, 1786.0, 11144.0, 132611.0, 821456.0, 71883.0, 7301.0, 1256.0, 321.0, 87.0, 39.0, 18.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.94769287109375, -0.9193115234375, -0.89093017578125, -0.862548828125, -0.83416748046875, -0.8057861328125, -0.77740478515625, -0.7490234375, -0.72064208984375, -0.6922607421875, -0.66387939453125, -0.635498046875, -0.60711669921875, -0.5787353515625, -0.55035400390625, -0.52197265625, -0.49359130859375, -0.4652099609375, -0.43682861328125, -0.408447265625, -0.38006591796875, -0.3516845703125, -0.32330322265625, -0.294921875, -0.26654052734375, -0.2381591796875, -0.20977783203125, -0.181396484375, -0.15301513671875, -0.1246337890625, -0.09625244140625, -0.06787109375, -0.03948974609375, -0.0111083984375, 0.01727294921875, 0.045654296875, 0.07403564453125, 0.1024169921875, 0.13079833984375, 0.1591796875, 0.18756103515625, 0.2159423828125, 0.24432373046875, 0.272705078125, 0.30108642578125, 0.3294677734375, 0.35784912109375, 0.38623046875, 0.41461181640625, 0.4429931640625, 0.47137451171875, 0.499755859375, 0.52813720703125, 0.5565185546875, 0.58489990234375, 0.61328125, 0.64166259765625, 0.6700439453125, 0.69842529296875, 0.726806640625, 0.75518798828125, 0.7835693359375, 0.81195068359375, 0.84033203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 20.0, 27.0, 33.0, 29.0, 43.0, 48.0, 50.0, 53.0, 58.0, 62.0, 90.0, 58.0, 58.0, 45.0, 52.0, 47.0, 41.0, 39.0, 22.0, 23.0, 15.0, 15.0, 10.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484130859375, -0.4623908996582031, -0.44065093994140625, -0.4189109802246094, -0.3971710205078125, -0.3754310607910156, -0.35369110107421875, -0.3319511413574219, -0.310211181640625, -0.2884712219238281, -0.26673126220703125, -0.24499130249023438, -0.2232513427734375, -0.20151138305664062, -0.17977142333984375, -0.15803146362304688, -0.13629150390625, -0.11455154418945312, -0.09281158447265625, -0.07107162475585938, -0.0493316650390625, -0.027591705322265625, -0.00585174560546875, 0.015888214111328125, 0.037628173828125, 0.059368133544921875, 0.08110809326171875, 0.10284805297851562, 0.1245880126953125, 0.14632797241210938, 0.16806793212890625, 0.18980789184570312, 0.2115478515625, 0.23328781127929688, 0.25502777099609375, 0.2767677307128906, 0.2985076904296875, 0.3202476501464844, 0.34198760986328125, 0.3637275695800781, 0.385467529296875, 0.4072074890136719, 0.42894744873046875, 0.4506874084472656, 0.4724273681640625, 0.4941673278808594, 0.5159072875976562, 0.5376472473144531, 0.55938720703125, 0.5811271667480469, 0.6028671264648438, 0.6246070861816406, 0.6463470458984375, 0.6680870056152344, 0.6898269653320312, 0.7115669250488281, 0.733306884765625, 0.7550468444824219, 0.7767868041992188, 0.7985267639160156, 0.8202667236328125, 0.8420066833496094, 0.8637466430664062, 0.8854866027832031, 0.9072265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 9.0, 4.0, 11.0, 20.0, 22.0, 22.0, 37.0, 38.0, 38.0, 37.0, 70.0, 72.0, 110.0, 133.0, 183.0, 337.0, 794.0, 3641.0, 31193.0, 648320.0, 339592.0, 19575.0, 2576.0, 593.0, 290.0, 198.0, 133.0, 106.0, 80.0, 55.0, 46.0, 51.0, 35.0, 24.0, 22.0, 17.0, 12.0, 11.0, 5.0, 4.0, 11.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.8916015625, -0.866058349609375, -0.84051513671875, -0.814971923828125, -0.7894287109375, -0.763885498046875, -0.73834228515625, -0.712799072265625, -0.687255859375, -0.661712646484375, -0.63616943359375, -0.610626220703125, -0.5850830078125, -0.559539794921875, -0.53399658203125, -0.508453369140625, -0.48291015625, -0.457366943359375, -0.43182373046875, -0.406280517578125, -0.3807373046875, -0.355194091796875, -0.32965087890625, -0.304107666015625, -0.278564453125, -0.253021240234375, -0.22747802734375, -0.201934814453125, -0.1763916015625, -0.150848388671875, -0.12530517578125, -0.099761962890625, -0.07421875, -0.048675537109375, -0.02313232421875, 0.002410888671875, 0.0279541015625, 0.053497314453125, 0.07904052734375, 0.104583740234375, 0.130126953125, 0.155670166015625, 0.18121337890625, 0.206756591796875, 0.2322998046875, 0.257843017578125, 0.28338623046875, 0.308929443359375, 0.33447265625, 0.360015869140625, 0.38555908203125, 0.411102294921875, 0.4366455078125, 0.462188720703125, 0.48773193359375, 0.513275146484375, 0.538818359375, 0.564361572265625, 0.58990478515625, 0.615447998046875, 0.6409912109375, 0.666534423828125, 0.69207763671875, 0.717620849609375, 0.7431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 8.0, 13.0, 12.0, 9.0, 14.0, 15.0, 22.0, 28.0, 18.0, 26.0, 26.0, 37.0, 33.0, 30.0, 30.0, 40.0, 44.0, 45.0, 40.0, 42.0, 54.0, 46.0, 42.0, 37.0, 36.0, 34.0, 40.0, 30.0, 16.0, 20.0, 19.0, 9.0, 10.0, 17.0, 11.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5217132568359375, -0.504852294921875, -0.4879913330078125, -0.47113037109375, -0.4542694091796875, -0.437408447265625, -0.4205474853515625, -0.4036865234375, -0.3868255615234375, -0.369964599609375, -0.3531036376953125, -0.33624267578125, -0.3193817138671875, -0.302520751953125, -0.2856597900390625, -0.268798828125, -0.2519378662109375, -0.235076904296875, -0.2182159423828125, -0.20135498046875, -0.1844940185546875, -0.167633056640625, -0.1507720947265625, -0.1339111328125, -0.1170501708984375, -0.100189208984375, -0.0833282470703125, -0.06646728515625, -0.0496063232421875, -0.032745361328125, -0.0158843994140625, 0.0009765625, 0.0178375244140625, 0.034698486328125, 0.0515594482421875, 0.06842041015625, 0.0852813720703125, 0.102142333984375, 0.1190032958984375, 0.1358642578125, 0.1527252197265625, 0.169586181640625, 0.1864471435546875, 0.20330810546875, 0.2201690673828125, 0.237030029296875, 0.2538909912109375, 0.270751953125, 0.2876129150390625, 0.304473876953125, 0.3213348388671875, 0.33819580078125, 0.3550567626953125, 0.371917724609375, 0.3887786865234375, 0.4056396484375, 0.4225006103515625, 0.439361572265625, 0.4562225341796875, 0.47308349609375, 0.4899444580078125, 0.506805419921875, 0.5236663818359375, 0.54052734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 4.0, 6.0, 7.0, 18.0, 22.0, 40.0, 73.0, 162.0, 485.0, 1612.0, 8321.0, 120923.0, 860966.0, 49255.0, 4874.0, 1142.0, 342.0, 136.0, 59.0, 31.0, 20.0, 14.0, 6.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2579078674316406, -0.24848175048828125, -0.23905563354492188, -0.2296295166015625, -0.22020339965820312, -0.21077728271484375, -0.20135116577148438, -0.191925048828125, -0.18249893188476562, -0.17307281494140625, -0.16364669799804688, -0.1542205810546875, -0.14479446411132812, -0.13536834716796875, -0.12594223022460938, -0.11651611328125, -0.10708999633789062, -0.09766387939453125, -0.08823776245117188, -0.0788116455078125, -0.06938552856445312, -0.05995941162109375, -0.050533294677734375, -0.041107177734375, -0.031681060791015625, -0.02225494384765625, -0.012828826904296875, -0.0034027099609375, 0.006023406982421875, 0.01544952392578125, 0.024875640869140625, 0.0343017578125, 0.043727874755859375, 0.05315399169921875, 0.06258010864257812, 0.0720062255859375, 0.08143234252929688, 0.09085845947265625, 0.10028457641601562, 0.109710693359375, 0.11913681030273438, 0.12856292724609375, 0.13798904418945312, 0.1474151611328125, 0.15684127807617188, 0.16626739501953125, 0.17569351196289062, 0.18511962890625, 0.19454574584960938, 0.20397186279296875, 0.21339797973632812, 0.2228240966796875, 0.23225021362304688, 0.24167633056640625, 0.2511024475097656, 0.260528564453125, 0.2699546813964844, 0.27938079833984375, 0.2888069152832031, 0.2982330322265625, 0.3076591491699219, 0.31708526611328125, 0.3265113830566406, 0.3359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 12.0, 20.0, 30.0, 51.0, 65.0, 116.0, 182.0, 191.0, 112.0, 71.0, 43.0, 29.0, 21.0, 17.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7206878662109375e-05, -4.590023308992386e-05, -4.459358751773834e-05, -4.3286941945552826e-05, -4.198029637336731e-05, -4.067365080118179e-05, -3.936700522899628e-05, -3.806035965681076e-05, -3.6753714084625244e-05, -3.544706851243973e-05, -3.414042294025421e-05, -3.2833777368068695e-05, -3.152713179588318e-05, -3.0220486223697662e-05, -2.8913840651512146e-05, -2.760719507932663e-05, -2.6300549507141113e-05, -2.4993903934955597e-05, -2.368725836277008e-05, -2.2380612790584564e-05, -2.1073967218399048e-05, -1.976732164621353e-05, -1.8460676074028015e-05, -1.71540305018425e-05, -1.5847384929656982e-05, -1.4540739357471466e-05, -1.323409378528595e-05, -1.1927448213100433e-05, -1.0620802640914917e-05, -9.3141570687294e-06, -8.007511496543884e-06, -6.700865924358368e-06, -5.3942203521728516e-06, -4.087574779987335e-06, -2.780929207801819e-06, -1.4742836356163025e-06, -1.6763806343078613e-07, 1.1390075087547302e-06, 2.4456530809402466e-06, 3.752298653125763e-06, 5.058944225311279e-06, 6.365589797496796e-06, 7.672235369682312e-06, 8.978880941867828e-06, 1.0285526514053345e-05, 1.1592172086238861e-05, 1.2898817658424377e-05, 1.4205463230609894e-05, 1.551210880279541e-05, 1.6818754374980927e-05, 1.8125399947166443e-05, 1.943204551935196e-05, 2.0738691091537476e-05, 2.2045336663722992e-05, 2.3351982235908508e-05, 2.4658627808094025e-05, 2.596527338027954e-05, 2.7271918952465057e-05, 2.8578564524650574e-05, 2.988521009683609e-05, 3.1191855669021606e-05, 3.249850124120712e-05, 3.380514681339264e-05, 3.5111792385578156e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 6.0, 1.0, 10.0, 9.0, 17.0, 17.0, 36.0, 80.0, 158.0, 493.0, 1764.0, 10846.0, 290272.0, 721933.0, 19331.0, 2544.0, 613.0, 204.0, 86.0, 47.0, 36.0, 11.0, 9.0, 13.0, 5.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.37548828125, -0.3637962341308594, -0.35210418701171875, -0.3404121398925781, -0.3287200927734375, -0.3170280456542969, -0.30533599853515625, -0.2936439514160156, -0.281951904296875, -0.2702598571777344, -0.25856781005859375, -0.24687576293945312, -0.2351837158203125, -0.22349166870117188, -0.21179962158203125, -0.20010757446289062, -0.18841552734375, -0.17672348022460938, -0.16503143310546875, -0.15333938598632812, -0.1416473388671875, -0.12995529174804688, -0.11826324462890625, -0.10657119750976562, -0.094879150390625, -0.08318710327148438, -0.07149505615234375, -0.059803009033203125, -0.0481109619140625, -0.036418914794921875, -0.02472686767578125, -0.013034820556640625, -0.0013427734375, 0.010349273681640625, 0.02204132080078125, 0.033733367919921875, 0.0454254150390625, 0.057117462158203125, 0.06880950927734375, 0.08050155639648438, 0.092193603515625, 0.10388565063476562, 0.11557769775390625, 0.12726974487304688, 0.1389617919921875, 0.15065383911132812, 0.16234588623046875, 0.17403793334960938, 0.18572998046875, 0.19742202758789062, 0.20911407470703125, 0.22080612182617188, 0.2324981689453125, 0.24419021606445312, 0.25588226318359375, 0.2675743103027344, 0.279266357421875, 0.2909584045410156, 0.30265045166015625, 0.3143424987792969, 0.3260345458984375, 0.3377265930175781, 0.34941864013671875, 0.3611106872558594, 0.372802734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 7.0, 23.0, 28.0, 39.0, 67.0, 113.0, 164.0, 156.0, 125.0, 90.0, 41.0, 37.0, 25.0, 17.0, 15.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.10021686553955078, -0.09728431701660156, -0.09435176849365234, -0.09141921997070312, -0.0884866714477539, -0.08555412292480469, -0.08262157440185547, -0.07968902587890625, -0.07675647735595703, -0.07382392883300781, -0.0708913803100586, -0.06795883178710938, -0.06502628326416016, -0.06209373474121094, -0.05916118621826172, -0.0562286376953125, -0.05329608917236328, -0.05036354064941406, -0.047430992126464844, -0.044498443603515625, -0.041565895080566406, -0.03863334655761719, -0.03570079803466797, -0.03276824951171875, -0.02983570098876953, -0.026903152465820312, -0.023970603942871094, -0.021038055419921875, -0.018105506896972656, -0.015172958374023438, -0.012240409851074219, -0.009307861328125, -0.006375312805175781, -0.0034427642822265625, -0.0005102157592773438, 0.002422332763671875, 0.005354881286621094, 0.008287429809570312, 0.011219978332519531, 0.01415252685546875, 0.01708507537841797, 0.020017623901367188, 0.022950172424316406, 0.025882720947265625, 0.028815269470214844, 0.03174781799316406, 0.03468036651611328, 0.0376129150390625, 0.04054546356201172, 0.04347801208496094, 0.046410560607910156, 0.049343109130859375, 0.052275657653808594, 0.05520820617675781, 0.05814075469970703, 0.06107330322265625, 0.06400585174560547, 0.06693840026855469, 0.0698709487915039, 0.07280349731445312, 0.07573604583740234, 0.07866859436035156, 0.08160114288330078, 0.08453369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 20.0, 25.0, 40.0, 65.0, 90.0, 108.0, 141.0, 133.0, 107.0, 91.0, 59.0, 31.0, 24.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8961554765701294, -0.8628050684928894, -0.8294546008110046, -0.7961041927337646, -0.7627537250518799, -0.7294033169746399, -0.6960529088973999, -0.6627024412155151, -0.6293519735336304, -0.5960015654563904, -0.5626510977745056, -0.5293006896972656, -0.49595022201538086, -0.46259981393814087, -0.4292493760585785, -0.3958989381790161, -0.3625485301017761, -0.32919809222221375, -0.29584765434265137, -0.2624972462654114, -0.2291467934846878, -0.19579635560512543, -0.16244593262672424, -0.12909549474716187, -0.09574505686759949, -0.06239462271332741, -0.02904418855905533, 0.004306241869926453, 0.03765667974948883, 0.07100711762905121, 0.10435754060745239, 0.13770797848701477, 0.17105841636657715, 0.20440885424613953, 0.2377592921257019, 0.2711097002029419, 0.30446016788482666, 0.33781057596206665, 0.37116101384162903, 0.4045114517211914, 0.4378618896007538, 0.47121232748031616, 0.5045627355575562, 0.5379132032394409, 0.5712636113166809, 0.6046140789985657, 0.6379644870758057, 0.6713149547576904, 0.7046653628349304, 0.7380157709121704, 0.7713662385940552, 0.8047166466712952, 0.8380671143531799, 0.8714175224304199, 0.9047679901123047, 0.9381183981895447, 0.9714688062667847, 1.0048192739486694, 1.0381696224212646, 1.0715200901031494, 1.1048705577850342, 1.138221025466919, 1.1715713739395142, 1.204921841621399, 1.2382723093032837]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 14.0, 8.0, 12.0, 9.0, 21.0, 15.0, 25.0, 31.0, 37.0, 49.0, 29.0, 45.0, 55.0, 52.0, 56.0, 54.0, 56.0, 56.0, 57.0, 48.0, 50.0, 42.0, 31.0, 40.0, 28.0, 22.0, 19.0, 20.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736251831054688, -0.9356900453567505, -0.8977549076080322, -0.8598197102546692, -0.8218845725059509, -0.7839494347572327, -0.7460142374038696, -0.7080790996551514, -0.6701439619064331, -0.6322088241577148, -0.5942736864089966, -0.5563384890556335, -0.5184033513069153, -0.480468213558197, -0.44253304600715637, -0.4045978784561157, -0.36666274070739746, -0.3287276029586792, -0.29079243540763855, -0.2528572678565979, -0.21492213010787964, -0.17698697745800018, -0.13905182480812073, -0.10111665725708008, -0.06318151950836182, -0.02524636685848236, 0.012688785791397095, 0.05062393844127655, 0.088559091091156, 0.12649424374103546, 0.16442939639091492, 0.20236456394195557, 0.24029982089996338, 0.27823495864868164, 0.3161701261997223, 0.35410529375076294, 0.3920404314994812, 0.42997556924819946, 0.4679107367992401, 0.5058459043502808, 0.543781042098999, 0.5817161798477173, 0.6196513175964355, 0.6575865149497986, 0.6955216526985168, 0.7334567904472351, 0.7713919878005981, 0.8093271255493164, 0.8472622632980347, 0.8851974010467529, 0.9231325387954712, 0.9610677361488342, 0.9990028738975525, 1.0369380712509155, 1.0748732089996338, 1.112808346748352, 1.1507434844970703, 1.1886786222457886, 1.2266137599945068, 1.264548897743225, 1.3024840354919434, 1.3404192924499512, 1.3783544301986694, 1.4162895679473877, 1.454224705696106]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 15.0, 20.0, 43.0, 57.0, 110.0, 269.0, 613.0, 1869.0, 7164.0, 52445.0, 1978350.0, 2083160.0, 59274.0, 7524.0, 2011.0, 680.0, 276.0, 130.0, 78.0, 39.0, 35.0, 15.0, 15.0, 11.0, 10.0, 4.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8552093505859375, -0.824676513671875, -0.7941436767578125, -0.76361083984375, -0.7330780029296875, -0.702545166015625, -0.6720123291015625, -0.6414794921875, -0.6109466552734375, -0.580413818359375, -0.5498809814453125, -0.51934814453125, -0.4888153076171875, -0.458282470703125, -0.4277496337890625, -0.397216796875, -0.3666839599609375, -0.336151123046875, -0.3056182861328125, -0.27508544921875, -0.2445526123046875, -0.214019775390625, -0.1834869384765625, -0.1529541015625, -0.1224212646484375, -0.091888427734375, -0.0613555908203125, -0.03082275390625, -0.0002899169921875, 0.030242919921875, 0.0607757568359375, 0.09130859375, 0.1218414306640625, 0.152374267578125, 0.1829071044921875, 0.21343994140625, 0.2439727783203125, 0.274505615234375, 0.3050384521484375, 0.3355712890625, 0.3661041259765625, 0.396636962890625, 0.4271697998046875, 0.45770263671875, 0.4882354736328125, 0.518768310546875, 0.5493011474609375, 0.579833984375, 0.6103668212890625, 0.640899658203125, 0.6714324951171875, 0.70196533203125, 0.7324981689453125, 0.763031005859375, 0.7935638427734375, 0.8240966796875, 0.8546295166015625, 0.885162353515625, 0.9156951904296875, 0.94622802734375, 0.9767608642578125, 1.007293701171875, 1.0378265380859375, 1.068359375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 12.0, 11.0, 20.0, 21.0, 18.0, 23.0, 39.0, 27.0, 48.0, 40.0, 45.0, 54.0, 40.0, 51.0, 58.0, 45.0, 46.0, 49.0, 41.0, 42.0, 48.0, 29.0, 28.0, 29.0, 28.0, 20.0, 13.0, 15.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3273773193359375, -0.314910888671875, -0.3024444580078125, -0.28997802734375, -0.2775115966796875, -0.265045166015625, -0.2525787353515625, -0.2401123046875, -0.2276458740234375, -0.215179443359375, -0.2027130126953125, -0.19024658203125, -0.1777801513671875, -0.165313720703125, -0.1528472900390625, -0.140380859375, -0.1279144287109375, -0.115447998046875, -0.1029815673828125, -0.09051513671875, -0.0780487060546875, -0.065582275390625, -0.0531158447265625, -0.0406494140625, -0.0281829833984375, -0.015716552734375, -0.0032501220703125, 0.00921630859375, 0.0216827392578125, 0.034149169921875, 0.0466156005859375, 0.05908203125, 0.0715484619140625, 0.084014892578125, 0.0964813232421875, 0.10894775390625, 0.1214141845703125, 0.133880615234375, 0.1463470458984375, 0.1588134765625, 0.1712799072265625, 0.183746337890625, 0.1962127685546875, 0.20867919921875, 0.2211456298828125, 0.233612060546875, 0.2460784912109375, 0.258544921875, 0.2710113525390625, 0.283477783203125, 0.2959442138671875, 0.30841064453125, 0.3208770751953125, 0.333343505859375, 0.3458099365234375, 0.3582763671875, 0.3707427978515625, 0.383209228515625, 0.3956756591796875, 0.40814208984375, 0.4206085205078125, 0.433074951171875, 0.4455413818359375, 0.4580078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 21.0, 38.0, 64.0, 82.0, 191.0, 452.0, 1500.0, 6838.0, 98440.0, 3946702.0, 129280.0, 8024.0, 1651.0, 511.0, 221.0, 81.0, 46.0, 31.0, 21.0, 23.0, 12.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3203125, -1.2831573486328125, -1.246002197265625, -1.2088470458984375, -1.17169189453125, -1.1345367431640625, -1.097381591796875, -1.0602264404296875, -1.0230712890625, -0.9859161376953125, -0.948760986328125, -0.9116058349609375, -0.87445068359375, -0.8372955322265625, -0.800140380859375, -0.7629852294921875, -0.725830078125, -0.6886749267578125, -0.651519775390625, -0.6143646240234375, -0.57720947265625, -0.5400543212890625, -0.502899169921875, -0.4657440185546875, -0.4285888671875, -0.3914337158203125, -0.354278564453125, -0.3171234130859375, -0.27996826171875, -0.2428131103515625, -0.205657958984375, -0.1685028076171875, -0.13134765625, -0.0941925048828125, -0.057037353515625, -0.0198822021484375, 0.01727294921875, 0.0544281005859375, 0.091583251953125, 0.1287384033203125, 0.1658935546875, 0.2030487060546875, 0.240203857421875, 0.2773590087890625, 0.31451416015625, 0.3516693115234375, 0.388824462890625, 0.4259796142578125, 0.463134765625, 0.5002899169921875, 0.537445068359375, 0.5746002197265625, 0.61175537109375, 0.6489105224609375, 0.686065673828125, 0.7232208251953125, 0.7603759765625, 0.7975311279296875, 0.834686279296875, 0.8718414306640625, 0.90899658203125, 0.9461517333984375, 0.983306884765625, 1.0204620361328125, 1.0576171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 15.0, 21.0, 25.0, 27.0, 41.0, 74.0, 101.0, 163.0, 280.0, 462.0, 671.0, 724.0, 527.0, 331.0, 192.0, 121.0, 82.0, 48.0, 46.0, 28.0, 21.0, 16.0, 13.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1548004150390625, -0.149322509765625, -0.1438446044921875, -0.13836669921875, -0.1328887939453125, -0.127410888671875, -0.1219329833984375, -0.116455078125, -0.1109771728515625, -0.105499267578125, -0.1000213623046875, -0.09454345703125, -0.0890655517578125, -0.083587646484375, -0.0781097412109375, -0.0726318359375, -0.0671539306640625, -0.061676025390625, -0.0561981201171875, -0.05072021484375, -0.0452423095703125, -0.039764404296875, -0.0342864990234375, -0.02880859375, -0.0233306884765625, -0.017852783203125, -0.0123748779296875, -0.00689697265625, -0.0014190673828125, 0.004058837890625, 0.0095367431640625, 0.0150146484375, 0.0204925537109375, 0.025970458984375, 0.0314483642578125, 0.03692626953125, 0.0424041748046875, 0.047882080078125, 0.0533599853515625, 0.058837890625, 0.0643157958984375, 0.069793701171875, 0.0752716064453125, 0.08074951171875, 0.0862274169921875, 0.091705322265625, 0.0971832275390625, 0.1026611328125, 0.1081390380859375, 0.113616943359375, 0.1190948486328125, 0.12457275390625, 0.1300506591796875, 0.135528564453125, 0.1410064697265625, 0.146484375, 0.1519622802734375, 0.157440185546875, 0.1629180908203125, 0.16839599609375, 0.1738739013671875, 0.179351806640625, 0.1848297119140625, 0.1903076171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 16.0, 27.0, 30.0, 44.0, 60.0, 90.0, 123.0, 149.0, 122.0, 96.0, 68.0, 65.0, 37.0, 15.0, 11.0, 9.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6566445231437683, -0.6300395727157593, -0.6034346222877502, -0.5768296718597412, -0.5502246618270874, -0.5236197113990784, -0.49701476097106934, -0.4704098105430603, -0.4438048303127289, -0.41719987988471985, -0.3905948996543884, -0.3639899492263794, -0.33738499879837036, -0.31078001856803894, -0.2841750681400299, -0.2575700879096985, -0.23096513748168945, -0.20436017215251923, -0.177755206823349, -0.15115025639533997, -0.12454529106616974, -0.09794032573699951, -0.07133537530899048, -0.04473040997982025, -0.018125444650650024, 0.008479516953229904, 0.03508447855710983, 0.06168943643569946, 0.08829440176486969, 0.11489936709403992, 0.14150431752204895, 0.16810928285121918, 0.19471430778503418, 0.2213192731142044, 0.24792423844337463, 0.27452918887138367, 0.3011341691017151, 0.3277391195297241, 0.35434406995773315, 0.3809490203857422, 0.4075540006160736, 0.43415895104408264, 0.46076393127441406, 0.4873688817024231, 0.5139738321304321, 0.5405788421630859, 0.5671837329864502, 0.593788743019104, 0.620393693447113, 0.6469986438751221, 0.6736035943031311, 0.7002085447311401, 0.726813554763794, 0.753418505191803, 0.780023455619812, 0.806628406047821, 0.8332333564758301, 0.8598383069038391, 0.8864432573318481, 0.913048267364502, 0.939653217792511, 0.96625816822052, 0.992863118648529, 1.019468069076538, 1.046073079109192]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 21.0, 18.0, 26.0, 18.0, 32.0, 41.0, 35.0, 50.0, 55.0, 44.0, 48.0, 52.0, 48.0, 52.0, 46.0, 49.0, 37.0, 47.0, 41.0, 32.0, 30.0, 14.0, 25.0, 17.0, 18.0, 9.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984873294830322, -0.38455063104629517, -0.3706139326095581, -0.35667726397514343, -0.34274056553840637, -0.3288038671016693, -0.31486716866493225, -0.3009305000305176, -0.2869938015937805, -0.27305710315704346, -0.2591204047203064, -0.24518372118473053, -0.23124703764915466, -0.2173103392124176, -0.20337364077568054, -0.18943695724010468, -0.17550025880336761, -0.16156356036663055, -0.1476268768310547, -0.13369017839431763, -0.11975349485874176, -0.1058167964220047, -0.09188010543584824, -0.07794341444969177, -0.06400672346353531, -0.050070032477378845, -0.03613334149122238, -0.02219664677977562, -0.008259955793619156, 0.005676738917827606, 0.01961342990398407, 0.03355012089014053, 0.047486811876297, 0.06142350286245346, 0.07536019384860992, 0.08929689228534698, 0.10323357582092285, 0.11717027425765991, 0.13110697269439697, 0.14504365622997284, 0.1589803397655487, 0.17291703820228577, 0.18685372173786163, 0.2007904201745987, 0.21472710371017456, 0.22866380214691162, 0.24260050058364868, 0.25653719902038574, 0.2704738974571228, 0.28441059589385986, 0.2983472943305969, 0.3122839629650116, 0.32622066140174866, 0.3401573598384857, 0.3540940582752228, 0.36803072690963745, 0.3819674253463745, 0.3959041237831116, 0.40984082221984863, 0.4237774908542633, 0.43771418929100037, 0.4516508877277374, 0.4655875861644745, 0.47952425479888916, 0.4934609532356262]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 24.0, 43.0, 59.0, 179.0, 483.0, 1293.0, 4013.0, 16190.0, 130349.0, 727663.0, 144451.0, 17293.0, 4378.0, 1327.0, 424.0, 185.0, 84.0, 29.0, 18.0, 14.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17403602600097656, -0.16814041137695312, -0.1622447967529297, -0.15634918212890625, -0.1504535675048828, -0.14455795288085938, -0.13866233825683594, -0.1327667236328125, -0.12687110900878906, -0.12097549438476562, -0.11507987976074219, -0.10918426513671875, -0.10328865051269531, -0.09739303588867188, -0.09149742126464844, -0.085601806640625, -0.07970619201660156, -0.07381057739257812, -0.06791496276855469, -0.06201934814453125, -0.05612373352050781, -0.050228118896484375, -0.04433250427246094, -0.0384368896484375, -0.03254127502441406, -0.026645660400390625, -0.020750045776367188, -0.01485443115234375, -0.008958816528320312, -0.003063201904296875, 0.0028324127197265625, 0.00872802734375, 0.014623641967773438, 0.020519256591796875, 0.026414871215820312, 0.03231048583984375, 0.03820610046386719, 0.044101715087890625, 0.04999732971191406, 0.0558929443359375, 0.06178855895996094, 0.06768417358398438, 0.07357978820800781, 0.07947540283203125, 0.08537101745605469, 0.09126663208007812, 0.09716224670410156, 0.103057861328125, 0.10895347595214844, 0.11484909057617188, 0.12074470520019531, 0.12664031982421875, 0.1325359344482422, 0.13843154907226562, 0.14432716369628906, 0.1502227783203125, 0.15611839294433594, 0.16201400756835938, 0.1679096221923828, 0.17380523681640625, 0.1797008514404297, 0.18559646606445312, 0.19149208068847656, 0.1973876953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 9.0, 18.0, 23.0, 19.0, 21.0, 34.0, 48.0, 47.0, 54.0, 65.0, 67.0, 62.0, 68.0, 61.0, 63.0, 65.0, 56.0, 44.0, 35.0, 30.0, 18.0, 27.0, 6.0, 15.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.35467529296875, -0.3424072265625, -0.33013916015625, -0.31787109375, -0.30560302734375, -0.2933349609375, -0.28106689453125, -0.268798828125, -0.25653076171875, -0.2442626953125, -0.23199462890625, -0.2197265625, -0.20745849609375, -0.1951904296875, -0.18292236328125, -0.170654296875, -0.15838623046875, -0.1461181640625, -0.13385009765625, -0.12158203125, -0.10931396484375, -0.0970458984375, -0.08477783203125, -0.072509765625, -0.06024169921875, -0.0479736328125, -0.03570556640625, -0.0234375, -0.01116943359375, 0.0010986328125, 0.01336669921875, 0.025634765625, 0.03790283203125, 0.0501708984375, 0.06243896484375, 0.07470703125, 0.08697509765625, 0.0992431640625, 0.11151123046875, 0.123779296875, 0.13604736328125, 0.1483154296875, 0.16058349609375, 0.1728515625, 0.18511962890625, 0.1973876953125, 0.20965576171875, 0.221923828125, 0.23419189453125, 0.2464599609375, 0.25872802734375, 0.27099609375, 0.28326416015625, 0.2955322265625, 0.30780029296875, 0.320068359375, 0.33233642578125, 0.3446044921875, 0.35687255859375, 0.369140625, 0.38140869140625, 0.3936767578125, 0.40594482421875, 0.418212890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 21.0, 32.0, 57.0, 71.0, 113.0, 194.0, 402.0, 699.0, 1436.0, 3401.0, 9050.0, 26981.0, 104612.0, 395855.0, 371244.0, 94409.0, 25174.0, 8455.0, 3240.0, 1415.0, 670.0, 382.0, 213.0, 127.0, 98.0, 51.0, 33.0, 27.0, 19.0, 6.0, 10.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09930419921875, -0.09629154205322266, -0.09327888488769531, -0.09026622772216797, -0.08725357055664062, -0.08424091339111328, -0.08122825622558594, -0.0782155990600586, -0.07520294189453125, -0.0721902847290039, -0.06917762756347656, -0.06616497039794922, -0.06315231323242188, -0.06013965606689453, -0.05712699890136719, -0.054114341735839844, -0.0511016845703125, -0.048089027404785156, -0.04507637023925781, -0.04206371307373047, -0.039051055908203125, -0.03603839874267578, -0.03302574157714844, -0.030013084411621094, -0.02700042724609375, -0.023987770080566406, -0.020975112915039062, -0.01796245574951172, -0.014949798583984375, -0.011937141418457031, -0.008924484252929688, -0.005911827087402344, -0.002899169921875, 0.00011348724365234375, 0.0031261444091796875, 0.006138801574707031, 0.009151458740234375, 0.012164115905761719, 0.015176773071289062, 0.018189430236816406, 0.02120208740234375, 0.024214744567871094, 0.027227401733398438, 0.03024005889892578, 0.033252716064453125, 0.03626537322998047, 0.03927803039550781, 0.042290687561035156, 0.0453033447265625, 0.048316001892089844, 0.05132865905761719, 0.05434131622314453, 0.057353973388671875, 0.06036663055419922, 0.06337928771972656, 0.0663919448852539, 0.06940460205078125, 0.0724172592163086, 0.07542991638183594, 0.07844257354736328, 0.08145523071289062, 0.08446788787841797, 0.08748054504394531, 0.09049320220947266, 0.093505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 19.0, 14.0, 30.0, 33.0, 45.0, 34.0, 48.0, 49.0, 53.0, 75.0, 52.0, 45.0, 61.0, 55.0, 42.0, 47.0, 47.0, 36.0, 32.0, 27.0, 20.0, 17.0, 17.0, 10.0, 2.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5912322998046875, -0.569671630859375, -0.5481109619140625, -0.52655029296875, -0.5049896240234375, -0.483428955078125, -0.4618682861328125, -0.4403076171875, -0.4187469482421875, -0.397186279296875, -0.3756256103515625, -0.35406494140625, -0.3325042724609375, -0.310943603515625, -0.2893829345703125, -0.267822265625, -0.2462615966796875, -0.224700927734375, -0.2031402587890625, -0.18157958984375, -0.1600189208984375, -0.138458251953125, -0.1168975830078125, -0.0953369140625, -0.0737762451171875, -0.052215576171875, -0.0306549072265625, -0.00909423828125, 0.0124664306640625, 0.034027099609375, 0.0555877685546875, 0.0771484375, 0.0987091064453125, 0.120269775390625, 0.1418304443359375, 0.16339111328125, 0.1849517822265625, 0.206512451171875, 0.2280731201171875, 0.2496337890625, 0.2711944580078125, 0.292755126953125, 0.3143157958984375, 0.33587646484375, 0.3574371337890625, 0.378997802734375, 0.4005584716796875, 0.422119140625, 0.4436798095703125, 0.465240478515625, 0.4868011474609375, 0.50836181640625, 0.5299224853515625, 0.551483154296875, 0.5730438232421875, 0.5946044921875, 0.6161651611328125, 0.637725830078125, 0.6592864990234375, 0.68084716796875, 0.7024078369140625, 0.723968505859375, 0.7455291748046875, 0.76708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 23.0, 22.0, 27.0, 28.0, 46.0, 86.0, 135.0, 241.0, 443.0, 823.0, 1642.0, 3768.0, 9746.0, 32138.0, 141307.0, 505474.0, 271021.0, 56006.0, 15437.0, 5525.0, 2236.0, 1051.0, 527.0, 317.0, 193.0, 89.0, 66.0, 36.0, 27.0, 23.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03829383850097656, -0.037250518798828125, -0.03620719909667969, -0.03516387939453125, -0.03412055969238281, -0.033077239990234375, -0.03203392028808594, -0.0309906005859375, -0.029947280883789062, -0.028903961181640625, -0.027860641479492188, -0.02681732177734375, -0.025774002075195312, -0.024730682373046875, -0.023687362670898438, -0.02264404296875, -0.021600723266601562, -0.020557403564453125, -0.019514083862304688, -0.01847076416015625, -0.017427444458007812, -0.016384124755859375, -0.015340805053710938, -0.0142974853515625, -0.013254165649414062, -0.012210845947265625, -0.011167526245117188, -0.01012420654296875, -0.009080886840820312, -0.008037567138671875, -0.0069942474365234375, -0.005950927734375, -0.0049076080322265625, -0.003864288330078125, -0.0028209686279296875, -0.00177764892578125, -0.0007343292236328125, 0.000308990478515625, 0.0013523101806640625, 0.0023956298828125, 0.0034389495849609375, 0.004482269287109375, 0.0055255889892578125, 0.00656890869140625, 0.0076122283935546875, 0.008655548095703125, 0.009698867797851562, 0.0107421875, 0.011785507202148438, 0.012828826904296875, 0.013872146606445312, 0.01491546630859375, 0.015958786010742188, 0.017002105712890625, 0.018045425415039062, 0.0190887451171875, 0.020132064819335938, 0.021175384521484375, 0.022218704223632812, 0.02326202392578125, 0.024305343627929688, 0.025348663330078125, 0.026391983032226562, 0.027435302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 6.0, 6.0, 15.0, 10.0, 20.0, 19.0, 22.0, 31.0, 55.0, 52.0, 59.0, 74.0, 105.0, 74.0, 70.0, 74.0, 56.0, 53.0, 32.0, 39.0, 26.0, 17.0, 24.0, 10.0, 5.0, 7.0, 8.0, 6.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6510486602783203e-05, -1.6016885638237e-05, -1.5523284673690796e-05, -1.5029683709144592e-05, -1.4536082744598389e-05, -1.4042481780052185e-05, -1.3548880815505981e-05, -1.3055279850959778e-05, -1.2561678886413574e-05, -1.206807792186737e-05, -1.1574476957321167e-05, -1.1080875992774963e-05, -1.058727502822876e-05, -1.0093674063682556e-05, -9.600073099136353e-06, -9.106472134590149e-06, -8.612871170043945e-06, -8.119270205497742e-06, -7.625669240951538e-06, -7.1320682764053345e-06, -6.638467311859131e-06, -6.144866347312927e-06, -5.651265382766724e-06, -5.15766441822052e-06, -4.664063453674316e-06, -4.170462489128113e-06, -3.676861524581909e-06, -3.1832605600357056e-06, -2.689659595489502e-06, -2.1960586309432983e-06, -1.7024576663970947e-06, -1.2088567018508911e-06, -7.152557373046875e-07, -2.2165477275848389e-07, 2.7194619178771973e-07, 7.655471563339233e-07, 1.259148120880127e-06, 1.7527490854263306e-06, 2.246350049972534e-06, 2.739951014518738e-06, 3.2335519790649414e-06, 3.727152943611145e-06, 4.220753908157349e-06, 4.714354872703552e-06, 5.207955837249756e-06, 5.7015568017959595e-06, 6.195157766342163e-06, 6.688758730888367e-06, 7.18235969543457e-06, 7.675960659980774e-06, 8.169561624526978e-06, 8.663162589073181e-06, 9.156763553619385e-06, 9.650364518165588e-06, 1.0143965482711792e-05, 1.0637566447257996e-05, 1.11311674118042e-05, 1.1624768376350403e-05, 1.2118369340896606e-05, 1.261197030544281e-05, 1.3105571269989014e-05, 1.3599172234535217e-05, 1.4092773199081421e-05, 1.4586374163627625e-05, 1.5079975128173828e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 10.0, 7.0, 11.0, 18.0, 26.0, 43.0, 66.0, 108.0, 175.0, 296.0, 474.0, 867.0, 1953.0, 4927.0, 14199.0, 53378.0, 254597.0, 505310.0, 159826.0, 35076.0, 10225.0, 3634.0, 1547.0, 708.0, 406.0, 240.0, 149.0, 97.0, 63.0, 40.0, 24.0, 15.0, 17.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032470703125, -0.03143501281738281, -0.030399322509765625, -0.029363632202148438, -0.02832794189453125, -0.027292251586914062, -0.026256561279296875, -0.025220870971679688, -0.0241851806640625, -0.023149490356445312, -0.022113800048828125, -0.021078109741210938, -0.02004241943359375, -0.019006729125976562, -0.017971038818359375, -0.016935348510742188, -0.015899658203125, -0.014863967895507812, -0.013828277587890625, -0.012792587280273438, -0.01175689697265625, -0.010721206665039062, -0.009685516357421875, -0.008649826049804688, -0.0076141357421875, -0.0065784454345703125, -0.005542755126953125, -0.0045070648193359375, -0.00347137451171875, -0.0024356842041015625, -0.001399993896484375, -0.0003643035888671875, 0.00067138671875, 0.0017070770263671875, 0.002742767333984375, 0.0037784576416015625, 0.00481414794921875, 0.0058498382568359375, 0.006885528564453125, 0.007921218872070312, 0.0089569091796875, 0.009992599487304688, 0.011028289794921875, 0.012063980102539062, 0.01309967041015625, 0.014135360717773438, 0.015171051025390625, 0.016206741333007812, 0.017242431640625, 0.018278121948242188, 0.019313812255859375, 0.020349502563476562, 0.02138519287109375, 0.022420883178710938, 0.023456573486328125, 0.024492263793945312, 0.0255279541015625, 0.026563644409179688, 0.027599334716796875, 0.028635025024414062, 0.02967071533203125, 0.030706405639648438, 0.031742095947265625, 0.03277778625488281, 0.0338134765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 4.0, 9.0, 19.0, 12.0, 19.0, 35.0, 28.0, 25.0, 26.0, 51.0, 58.0, 56.0, 72.0, 56.0, 64.0, 52.0, 65.0, 49.0, 45.0, 34.0, 31.0, 26.0, 29.0, 18.0, 17.0, 17.0, 8.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005687713623046875, -0.005492985248565674, -0.005298256874084473, -0.0051035284996032715, -0.00490880012512207, -0.004714071750640869, -0.004519343376159668, -0.004324615001678467, -0.004129886627197266, -0.0039351582527160645, -0.0037404298782348633, -0.003545701503753662, -0.003350973129272461, -0.0031562447547912598, -0.0029615163803100586, -0.0027667880058288574, -0.0025720596313476562, -0.002377331256866455, -0.002182602882385254, -0.0019878745079040527, -0.0017931461334228516, -0.0015984177589416504, -0.0014036893844604492, -0.001208961009979248, -0.0010142326354980469, -0.0008195042610168457, -0.0006247758865356445, -0.00043004751205444336, -0.0002353191375732422, -4.0590763092041016e-05, 0.00015413761138916016, 0.00034886598587036133, 0.0005435943603515625, 0.0007383227348327637, 0.0009330511093139648, 0.001127779483795166, 0.0013225078582763672, 0.0015172362327575684, 0.0017119646072387695, 0.0019066929817199707, 0.002101421356201172, 0.002296149730682373, 0.0024908781051635742, 0.0026856064796447754, 0.0028803348541259766, 0.0030750632286071777, 0.003269791603088379, 0.00346451997756958, 0.0036592483520507812, 0.0038539767265319824, 0.004048705101013184, 0.004243433475494385, 0.004438161849975586, 0.004632890224456787, 0.004827618598937988, 0.0050223469734191895, 0.005217075347900391, 0.005411803722381592, 0.005606532096862793, 0.005801260471343994, 0.005995988845825195, 0.0061907172203063965, 0.006385445594787598, 0.006580173969268799, 0.00677490234375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 20.0, 36.0, 61.0, 93.0, 209.0, 224.0, 156.0, 96.0, 45.0, 23.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888968706130981, -0.5613466501235962, -0.5337964296340942, -0.5062462091445923, -0.47869595885276794, -0.451145738363266, -0.42359548807144165, -0.3960452675819397, -0.36849504709243774, -0.3409448266029358, -0.31339460611343384, -0.2858443558216095, -0.25829413533210754, -0.2307439148426056, -0.20319367945194244, -0.1756434440612793, -0.14809322357177734, -0.1205429956316948, -0.09299276769161224, -0.0654425397515297, -0.037892311811447144, -0.01034209132194519, 0.017208144068717957, 0.044758379459381104, 0.07230859994888306, 0.0998588278889656, 0.12740905582904816, 0.1549592912197113, 0.18250951170921326, 0.2100597321987152, 0.23760996758937836, 0.2651602029800415, 0.29271042346954346, 0.3202606439590454, 0.34781086444854736, 0.3753611147403717, 0.40291133522987366, 0.4304615557193756, 0.45801180601119995, 0.4855620265007019, 0.5131122469902039, 0.5406624674797058, 0.5682126879692078, 0.5957629084587097, 0.6233131885528564, 0.6508634090423584, 0.6784136295318604, 0.7059638500213623, 0.7335140705108643, 0.7610642910003662, 0.7886145114898682, 0.8161647319793701, 0.8437149524688721, 0.871265172958374, 0.8988154530525208, 0.9263656735420227, 0.9539158940315247, 0.9814661145210266, 1.0090163946151733, 1.0365666151046753, 1.0641168355941772, 1.0916670560836792, 1.1192172765731812, 1.146767497062683, 1.174317717552185]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 9.0, 13.0, 9.0, 20.0, 16.0, 25.0, 25.0, 31.0, 47.0, 49.0, 47.0, 52.0, 62.0, 59.0, 58.0, 55.0, 62.0, 58.0, 51.0, 51.0, 40.0, 41.0, 18.0, 17.0, 25.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27519190311431885, -0.2643825113773346, -0.25357311964035034, -0.2427637279033661, -0.23195433616638184, -0.22114494442939758, -0.21033555269241333, -0.19952616095542908, -0.18871676921844482, -0.17790737748146057, -0.16709798574447632, -0.15628859400749207, -0.1454792022705078, -0.13466981053352356, -0.1238604187965393, -0.11305102705955505, -0.1022416353225708, -0.09143224358558655, -0.0806228518486023, -0.06981346011161804, -0.05900406837463379, -0.048194676637649536, -0.03738528490066528, -0.02657589316368103, -0.015766501426696777, -0.004957109689712524, 0.0058522820472717285, 0.01666167378425598, 0.027471065521240234, 0.03828045725822449, 0.04908984899520874, 0.05989924073219299, 0.07070866227149963, 0.08151805400848389, 0.09232744574546814, 0.10313683748245239, 0.11394622921943665, 0.1247556209564209, 0.13556501269340515, 0.1463744044303894, 0.15718379616737366, 0.1679931879043579, 0.17880257964134216, 0.18961197137832642, 0.20042136311531067, 0.21123075485229492, 0.22204014658927917, 0.23284953832626343, 0.24365893006324768, 0.25446832180023193, 0.2652777135372162, 0.27608710527420044, 0.2868964970111847, 0.29770588874816895, 0.3085152804851532, 0.31932467222213745, 0.3301340639591217, 0.34094345569610596, 0.3517528474330902, 0.36256223917007446, 0.3733716309070587, 0.38418102264404297, 0.3949904143810272, 0.4057998061180115, 0.4166091978549957]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 12.0, 18.0, 35.0, 111.0, 369.0, 2133.0, 22338.0, 864903.0, 151378.0, 6036.0, 849.0, 199.0, 65.0, 27.0, 11.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.223876953125, -1.18408203125, -1.144287109375, -1.1044921875, -1.064697265625, -1.02490234375, -0.985107421875, -0.9453125, -0.905517578125, -0.86572265625, -0.825927734375, -0.7861328125, -0.746337890625, -0.70654296875, -0.666748046875, -0.626953125, -0.587158203125, -0.54736328125, -0.507568359375, -0.4677734375, -0.427978515625, -0.38818359375, -0.348388671875, -0.30859375, -0.268798828125, -0.22900390625, -0.189208984375, -0.1494140625, -0.109619140625, -0.06982421875, -0.030029296875, 0.009765625, 0.049560546875, 0.08935546875, 0.129150390625, 0.1689453125, 0.208740234375, 0.24853515625, 0.288330078125, 0.328125, 0.367919921875, 0.40771484375, 0.447509765625, 0.4873046875, 0.527099609375, 0.56689453125, 0.606689453125, 0.646484375, 0.686279296875, 0.72607421875, 0.765869140625, 0.8056640625, 0.845458984375, 0.88525390625, 0.925048828125, 0.96484375, 1.004638671875, 1.04443359375, 1.084228515625, 1.1240234375, 1.163818359375, 1.20361328125, 1.243408203125, 1.283203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 15.0, 16.0, 29.0, 42.0, 71.0, 98.0, 112.0, 114.0, 114.0, 114.0, 103.0, 69.0, 42.0, 29.0, 20.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5399551391601562, -0.4983673095703125, -0.45677947998046875, -0.415191650390625, -0.37360382080078125, -0.3320159912109375, -0.29042816162109375, -0.24884033203125, -0.20725250244140625, -0.1656646728515625, -0.12407684326171875, -0.082489013671875, -0.04090118408203125, 0.0006866455078125, 0.04227447509765625, 0.0838623046875, 0.12545013427734375, 0.1670379638671875, 0.20862579345703125, 0.250213623046875, 0.29180145263671875, 0.3333892822265625, 0.37497711181640625, 0.41656494140625, 0.45815277099609375, 0.4997406005859375, 0.5413284301757812, 0.582916259765625, 0.6245040893554688, 0.6660919189453125, 0.7076797485351562, 0.749267578125, 0.7908554077148438, 0.8324432373046875, 0.8740310668945312, 0.915618896484375, 0.9572067260742188, 0.9987945556640625, 1.0403823852539062, 1.08197021484375, 1.1235580444335938, 1.1651458740234375, 1.2067337036132812, 1.248321533203125, 1.2899093627929688, 1.3314971923828125, 1.3730850219726562, 1.4146728515625, 1.4562606811523438, 1.4978485107421875, 1.5394363403320312, 1.581024169921875, 1.6226119995117188, 1.6641998291015625, 1.7057876586914062, 1.74737548828125, 1.7889633178710938, 1.8305511474609375, 1.8721389770507812, 1.913726806640625, 1.9553146362304688, 1.9969024658203125, 2.0384902954101562, 2.080078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 12.0, 10.0, 11.0, 14.0, 32.0, 25.0, 43.0, 96.0, 144.0, 269.0, 685.0, 2066.0, 11721.0, 199846.0, 796426.0, 31122.0, 4167.0, 964.0, 383.0, 193.0, 114.0, 74.0, 37.0, 27.0, 20.0, 19.0, 11.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.0732421875, -1.0465545654296875, -1.019866943359375, -0.9931793212890625, -0.96649169921875, -0.9398040771484375, -0.913116455078125, -0.8864288330078125, -0.8597412109375, -0.8330535888671875, -0.806365966796875, -0.7796783447265625, -0.75299072265625, -0.7263031005859375, -0.699615478515625, -0.6729278564453125, -0.646240234375, -0.6195526123046875, -0.592864990234375, -0.5661773681640625, -0.53948974609375, -0.5128021240234375, -0.486114501953125, -0.4594268798828125, -0.4327392578125, -0.4060516357421875, -0.379364013671875, -0.3526763916015625, -0.32598876953125, -0.2993011474609375, -0.272613525390625, -0.2459259033203125, -0.21923828125, -0.1925506591796875, -0.165863037109375, -0.1391754150390625, -0.11248779296875, -0.0858001708984375, -0.059112548828125, -0.0324249267578125, -0.0057373046875, 0.0209503173828125, 0.047637939453125, 0.0743255615234375, 0.10101318359375, 0.1277008056640625, 0.154388427734375, 0.1810760498046875, 0.207763671875, 0.2344512939453125, 0.261138916015625, 0.2878265380859375, 0.31451416015625, 0.3412017822265625, 0.367889404296875, 0.3945770263671875, 0.4212646484375, 0.4479522705078125, 0.474639892578125, 0.5013275146484375, 0.52801513671875, 0.5547027587890625, 0.581390380859375, 0.6080780029296875, 0.634765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 6.0, 5.0, 7.0, 14.0, 21.0, 22.0, 16.0, 28.0, 31.0, 26.0, 22.0, 34.0, 40.0, 31.0, 38.0, 27.0, 42.0, 36.0, 38.0, 43.0, 51.0, 43.0, 41.0, 34.0, 31.0, 31.0, 24.0, 23.0, 26.0, 22.0, 12.0, 15.0, 19.0, 8.0, 8.0, 15.0, 6.0, 7.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5078125, -0.4907989501953125, -0.473785400390625, -0.4567718505859375, -0.43975830078125, -0.4227447509765625, -0.405731201171875, -0.3887176513671875, -0.3717041015625, -0.3546905517578125, -0.337677001953125, -0.3206634521484375, -0.30364990234375, -0.2866363525390625, -0.269622802734375, -0.2526092529296875, -0.235595703125, -0.2185821533203125, -0.201568603515625, -0.1845550537109375, -0.16754150390625, -0.1505279541015625, -0.133514404296875, -0.1165008544921875, -0.0994873046875, -0.0824737548828125, -0.065460205078125, -0.0484466552734375, -0.03143310546875, -0.0144195556640625, 0.002593994140625, 0.0196075439453125, 0.03662109375, 0.0536346435546875, 0.070648193359375, 0.0876617431640625, 0.10467529296875, 0.1216888427734375, 0.138702392578125, 0.1557159423828125, 0.1727294921875, 0.1897430419921875, 0.206756591796875, 0.2237701416015625, 0.24078369140625, 0.2577972412109375, 0.274810791015625, 0.2918243408203125, 0.308837890625, 0.3258514404296875, 0.342864990234375, 0.3598785400390625, 0.37689208984375, 0.3939056396484375, 0.410919189453125, 0.4279327392578125, 0.4449462890625, 0.4619598388671875, 0.478973388671875, 0.4959869384765625, 0.51300048828125, 0.5300140380859375, 0.547027587890625, 0.5640411376953125, 0.5810546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 12.0, 8.0, 16.0, 13.0, 43.0, 87.0, 150.0, 328.0, 759.0, 2249.0, 8951.0, 77434.0, 840400.0, 103267.0, 10794.0, 2486.0, 866.0, 347.0, 155.0, 71.0, 49.0, 25.0, 11.0, 8.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2744140625, -0.26598358154296875, -0.2575531005859375, -0.24912261962890625, -0.240692138671875, -0.23226165771484375, -0.2238311767578125, -0.21540069580078125, -0.20697021484375, -0.19853973388671875, -0.1901092529296875, -0.18167877197265625, -0.173248291015625, -0.16481781005859375, -0.1563873291015625, -0.14795684814453125, -0.1395263671875, -0.13109588623046875, -0.1226654052734375, -0.11423492431640625, -0.105804443359375, -0.09737396240234375, -0.0889434814453125, -0.08051300048828125, -0.07208251953125, -0.06365203857421875, -0.0552215576171875, -0.04679107666015625, -0.038360595703125, -0.02993011474609375, -0.0214996337890625, -0.01306915283203125, -0.004638671875, 0.00379180908203125, 0.0122222900390625, 0.02065277099609375, 0.029083251953125, 0.03751373291015625, 0.0459442138671875, 0.05437469482421875, 0.06280517578125, 0.07123565673828125, 0.0796661376953125, 0.08809661865234375, 0.096527099609375, 0.10495758056640625, 0.1133880615234375, 0.12181854248046875, 0.1302490234375, 0.13867950439453125, 0.1471099853515625, 0.15554046630859375, 0.163970947265625, 0.17240142822265625, 0.1808319091796875, 0.18926239013671875, 0.19769287109375, 0.20612335205078125, 0.2145538330078125, 0.22298431396484375, 0.231414794921875, 0.23984527587890625, 0.2482757568359375, 0.25670623779296875, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 7.0, 3.0, 8.0, 14.0, 10.0, 13.0, 30.0, 29.0, 51.0, 66.0, 92.0, 142.0, 156.0, 99.0, 81.0, 48.0, 43.0, 28.0, 24.0, 16.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5787390768527985e-05, -2.493150532245636e-05, -2.4075619876384735e-05, -2.321973443031311e-05, -2.2363848984241486e-05, -2.150796353816986e-05, -2.0652078092098236e-05, -1.979619264602661e-05, -1.8940307199954987e-05, -1.8084421753883362e-05, -1.7228536307811737e-05, -1.6372650861740112e-05, -1.5516765415668488e-05, -1.4660879969596863e-05, -1.3804994523525238e-05, -1.2949109077453613e-05, -1.2093223631381989e-05, -1.1237338185310364e-05, -1.0381452739238739e-05, -9.525567293167114e-06, -8.66968184709549e-06, -7.813796401023865e-06, -6.95791095495224e-06, -6.102025508880615e-06, -5.2461400628089905e-06, -4.390254616737366e-06, -3.534369170665741e-06, -2.678483724594116e-06, -1.8225982785224915e-06, -9.667128324508667e-07, -1.1082738637924194e-07, 7.450580596923828e-07, 1.6009435057640076e-06, 2.4568289518356323e-06, 3.312714397907257e-06, 4.168599843978882e-06, 5.024485290050507e-06, 5.880370736122131e-06, 6.736256182193756e-06, 7.592141628265381e-06, 8.448027074337006e-06, 9.30391252040863e-06, 1.0159797966480255e-05, 1.101568341255188e-05, 1.1871568858623505e-05, 1.272745430469513e-05, 1.3583339750766754e-05, 1.4439225196838379e-05, 1.5295110642910004e-05, 1.615099608898163e-05, 1.7006881535053253e-05, 1.7862766981124878e-05, 1.8718652427196503e-05, 1.9574537873268127e-05, 2.0430423319339752e-05, 2.1286308765411377e-05, 2.2142194211483002e-05, 2.2998079657554626e-05, 2.385396510362625e-05, 2.4709850549697876e-05, 2.55657359957695e-05, 2.6421621441841125e-05, 2.727750688791275e-05, 2.8133392333984375e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 22.0, 24.0, 43.0, 66.0, 146.0, 270.0, 770.0, 3167.0, 27198.0, 807551.0, 197419.0, 9367.0, 1567.0, 467.0, 202.0, 86.0, 63.0, 28.0, 24.0, 21.0, 10.0, 1.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35302734375, -0.3428802490234375, -0.332733154296875, -0.3225860595703125, -0.31243896484375, -0.3022918701171875, -0.292144775390625, -0.2819976806640625, -0.2718505859375, -0.2617034912109375, -0.251556396484375, -0.2414093017578125, -0.23126220703125, -0.2211151123046875, -0.210968017578125, -0.2008209228515625, -0.190673828125, -0.1805267333984375, -0.170379638671875, -0.1602325439453125, -0.15008544921875, -0.1399383544921875, -0.129791259765625, -0.1196441650390625, -0.1094970703125, -0.0993499755859375, -0.089202880859375, -0.0790557861328125, -0.06890869140625, -0.0587615966796875, -0.048614501953125, -0.0384674072265625, -0.0283203125, -0.0181732177734375, -0.008026123046875, 0.0021209716796875, 0.01226806640625, 0.0224151611328125, 0.032562255859375, 0.0427093505859375, 0.0528564453125, 0.0630035400390625, 0.073150634765625, 0.0832977294921875, 0.09344482421875, 0.1035919189453125, 0.113739013671875, 0.1238861083984375, 0.134033203125, 0.1441802978515625, 0.154327392578125, 0.1644744873046875, 0.17462158203125, 0.1847686767578125, 0.194915771484375, 0.2050628662109375, 0.2152099609375, 0.2253570556640625, 0.235504150390625, 0.2456512451171875, 0.25579833984375, 0.2659454345703125, 0.276092529296875, 0.2862396240234375, 0.29638671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 2.0, 10.0, 8.0, 19.0, 23.0, 29.0, 29.0, 41.0, 64.0, 89.0, 113.0, 132.0, 120.0, 97.0, 65.0, 49.0, 38.0, 15.0, 20.0, 12.0, 12.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0772705078125, -0.07463932037353516, -0.07200813293457031, -0.06937694549560547, -0.06674575805664062, -0.06411457061767578, -0.06148338317871094, -0.058852195739746094, -0.05622100830078125, -0.053589820861816406, -0.05095863342285156, -0.04832744598388672, -0.045696258544921875, -0.04306507110595703, -0.04043388366699219, -0.037802696228027344, -0.0351715087890625, -0.032540321350097656, -0.029909133911132812, -0.02727794647216797, -0.024646759033203125, -0.02201557159423828, -0.019384384155273438, -0.016753196716308594, -0.01412200927734375, -0.011490821838378906, -0.008859634399414062, -0.006228446960449219, -0.003597259521484375, -0.0009660720825195312, 0.0016651153564453125, 0.004296302795410156, 0.006927490234375, 0.009558677673339844, 0.012189865112304688, 0.014821052551269531, 0.017452239990234375, 0.02008342742919922, 0.022714614868164062, 0.025345802307128906, 0.02797698974609375, 0.030608177185058594, 0.03323936462402344, 0.03587055206298828, 0.038501739501953125, 0.04113292694091797, 0.04376411437988281, 0.046395301818847656, 0.0490264892578125, 0.051657676696777344, 0.05428886413574219, 0.05692005157470703, 0.059551239013671875, 0.06218242645263672, 0.06481361389160156, 0.0674448013305664, 0.07007598876953125, 0.0727071762084961, 0.07533836364746094, 0.07796955108642578, 0.08060073852539062, 0.08323192596435547, 0.08586311340332031, 0.08849430084228516, 0.09112548828125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 10.0, 11.0, 22.0, 45.0, 74.0, 142.0, 240.0, 196.0, 156.0, 53.0, 24.0, 14.0, 12.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.669635534286499, -1.611814022064209, -1.5539923906326294, -1.4961708784103394, -1.4383493661880493, -1.3805277347564697, -1.3227062225341797, -1.2648847103118896, -1.20706307888031, -1.14924156665802, -1.0914199352264404, -1.0335984230041504, -0.9757768511772156, -0.9179552793502808, -0.8601337671279907, -0.8023121953010559, -0.7444906830787659, -0.686669111251831, -0.628847599029541, -0.5710260272026062, -0.5132044553756714, -0.45538291335105896, -0.39756137132644653, -0.3397397994995117, -0.2819182574748993, -0.22409670054912567, -0.16627514362335205, -0.10845360159873962, -0.050632044672966, 0.007189512252807617, 0.06501105427742004, 0.12283262610435486, 0.18065416812896729, 0.2384757250547409, 0.2962972819805145, 0.35411882400512695, 0.41194039583206177, 0.4697619378566742, 0.5275834798812866, 0.5854050517082214, 0.6432266235351562, 0.7010481953620911, 0.7588697075843811, 0.8166912794113159, 0.8745128512382507, 0.9323344230651855, 0.9901559352874756, 1.0479774475097656, 1.1057989597320557, 1.1636204719543457, 1.2214421033859253, 1.2792636156082153, 1.3370851278305054, 1.394906759262085, 1.452728271484375, 1.510549783706665, 1.5683714151382446, 1.6261929273605347, 1.6840145587921143, 1.7418360710144043, 1.7996575832366943, 1.857479214668274, 1.915300726890564, 1.9731223583221436, 2.0309438705444336]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 12.0, 13.0, 23.0, 14.0, 40.0, 39.0, 38.0, 46.0, 44.0, 58.0, 50.0, 71.0, 49.0, 58.0, 54.0, 65.0, 55.0, 50.0, 47.0, 38.0, 37.0, 32.0, 18.0, 11.0, 10.0, 2.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9879714846611023, -0.9422454833984375, -0.8965195417404175, -0.8507936000823975, -0.8050675988197327, -0.7593415975570679, -0.7136156558990479, -0.6678897142410278, -0.622163712978363, -0.5764377117156982, -0.5307117700576782, -0.4849857985973358, -0.4392598271369934, -0.393533855676651, -0.3478078842163086, -0.3020819127559662, -0.2563559412956238, -0.21062996983528137, -0.16490399837493896, -0.11917802691459656, -0.07345205545425415, -0.027726083993911743, 0.017999887466430664, 0.06372585892677307, 0.10945183038711548, 0.15517780184745789, 0.2009037733078003, 0.2466297447681427, 0.2923557162284851, 0.3380816876888275, 0.3838076591491699, 0.42953363060951233, 0.47525954246520996, 0.52098548412323, 0.5667114853858948, 0.6124374866485596, 0.6581634283065796, 0.7038893699645996, 0.7496153712272644, 0.7953413724899292, 0.8410673141479492, 0.8867932558059692, 0.932519257068634, 0.9782452583312988, 1.0239711999893188, 1.0696971416473389, 1.1154232025146484, 1.1611491441726685, 1.2068750858306885, 1.2526010274887085, 1.2983269691467285, 1.344053030014038, 1.389778971672058, 1.4355049133300781, 1.4812309741973877, 1.5269569158554077, 1.5726828575134277, 1.6184087991714478, 1.6641347408294678, 1.7098608016967773, 1.7555867433547974, 1.8013126850128174, 1.847038745880127, 1.892764687538147, 1.938490629196167]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 16.0, 19.0, 20.0, 22.0, 30.0, 39.0, 56.0, 117.0, 207.0, 457.0, 1264.0, 4583.0, 27887.0, 948619.0, 3136535.0, 63728.0, 7523.0, 1851.0, 641.0, 258.0, 122.0, 77.0, 47.0, 35.0, 24.0, 23.0, 16.0, 8.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2080078125, -1.1726531982421875, -1.137298583984375, -1.1019439697265625, -1.06658935546875, -1.0312347412109375, -0.995880126953125, -0.9605255126953125, -0.9251708984375, -0.8898162841796875, -0.854461669921875, -0.8191070556640625, -0.78375244140625, -0.7483978271484375, -0.713043212890625, -0.6776885986328125, -0.642333984375, -0.6069793701171875, -0.571624755859375, -0.5362701416015625, -0.50091552734375, -0.4655609130859375, -0.430206298828125, -0.3948516845703125, -0.3594970703125, -0.3241424560546875, -0.288787841796875, -0.2534332275390625, -0.21807861328125, -0.1827239990234375, -0.147369384765625, -0.1120147705078125, -0.07666015625, -0.0413055419921875, -0.005950927734375, 0.0294036865234375, 0.06475830078125, 0.1001129150390625, 0.135467529296875, 0.1708221435546875, 0.2061767578125, 0.2415313720703125, 0.276885986328125, 0.3122406005859375, 0.34759521484375, 0.3829498291015625, 0.418304443359375, 0.4536590576171875, 0.489013671875, 0.5243682861328125, 0.559722900390625, 0.5950775146484375, 0.63043212890625, 0.6657867431640625, 0.701141357421875, 0.7364959716796875, 0.7718505859375, 0.8072052001953125, 0.842559814453125, 0.8779144287109375, 0.91326904296875, 0.9486236572265625, 0.983978271484375, 1.0193328857421875, 1.0546875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 20.0, 17.0, 27.0, 26.0, 33.0, 40.0, 53.0, 43.0, 38.0, 60.0, 59.0, 51.0, 64.0, 72.0, 67.0, 52.0, 44.0, 37.0, 38.0, 39.0, 28.0, 19.0, 10.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4145774841308594, -0.40068817138671875, -0.3867988586425781, -0.3729095458984375, -0.3590202331542969, -0.34513092041015625, -0.3312416076660156, -0.317352294921875, -0.3034629821777344, -0.28957366943359375, -0.2756843566894531, -0.2617950439453125, -0.24790573120117188, -0.23401641845703125, -0.22012710571289062, -0.20623779296875, -0.19234848022460938, -0.17845916748046875, -0.16456985473632812, -0.1506805419921875, -0.13679122924804688, -0.12290191650390625, -0.10901260375976562, -0.095123291015625, -0.08123397827148438, -0.06734466552734375, -0.053455352783203125, -0.0395660400390625, -0.025676727294921875, -0.01178741455078125, 0.002101898193359375, 0.0159912109375, 0.029880523681640625, 0.04376983642578125, 0.057659149169921875, 0.0715484619140625, 0.08543777465820312, 0.09932708740234375, 0.11321640014648438, 0.127105712890625, 0.14099502563476562, 0.15488433837890625, 0.16877365112304688, 0.1826629638671875, 0.19655227661132812, 0.21044158935546875, 0.22433090209960938, 0.23822021484375, 0.2521095275878906, 0.26599884033203125, 0.2798881530761719, 0.2937774658203125, 0.3076667785644531, 0.32155609130859375, 0.3354454040527344, 0.349334716796875, 0.3632240295410156, 0.37711334228515625, 0.3910026550292969, 0.4048919677734375, 0.4187812805175781, 0.43267059326171875, 0.4465599060058594, 0.46044921875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 12.0, 11.0, 16.0, 27.0, 44.0, 78.0, 111.0, 186.0, 365.0, 810.0, 2258.0, 7527.0, 41306.0, 857948.0, 3181389.0, 85328.0, 11896.0, 2933.0, 1009.0, 441.0, 230.0, 144.0, 69.0, 41.0, 17.0, 22.0, 9.0, 13.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.9078521728515625, -0.884063720703125, -0.8602752685546875, -0.83648681640625, -0.8126983642578125, -0.788909912109375, -0.7651214599609375, -0.7413330078125, -0.7175445556640625, -0.693756103515625, -0.6699676513671875, -0.64617919921875, -0.6223907470703125, -0.598602294921875, -0.5748138427734375, -0.551025390625, -0.5272369384765625, -0.503448486328125, -0.4796600341796875, -0.45587158203125, -0.4320831298828125, -0.408294677734375, -0.3845062255859375, -0.3607177734375, -0.3369293212890625, -0.313140869140625, -0.2893524169921875, -0.26556396484375, -0.2417755126953125, -0.217987060546875, -0.1941986083984375, -0.17041015625, -0.1466217041015625, -0.122833251953125, -0.0990447998046875, -0.07525634765625, -0.0514678955078125, -0.027679443359375, -0.0038909912109375, 0.0198974609375, 0.0436859130859375, 0.067474365234375, 0.0912628173828125, 0.11505126953125, 0.1388397216796875, 0.162628173828125, 0.1864166259765625, 0.210205078125, 0.2339935302734375, 0.257781982421875, 0.2815704345703125, 0.30535888671875, 0.3291473388671875, 0.352935791015625, 0.3767242431640625, 0.4005126953125, 0.4243011474609375, 0.448089599609375, 0.4718780517578125, 0.49566650390625, 0.5194549560546875, 0.543243408203125, 0.5670318603515625, 0.5908203125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 10.0, 9.0, 18.0, 15.0, 40.0, 50.0, 73.0, 129.0, 227.0, 436.0, 743.0, 861.0, 603.0, 329.0, 178.0, 111.0, 70.0, 53.0, 33.0, 21.0, 25.0, 5.0, 5.0, 8.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13054275512695312, -0.12412261962890625, -0.11770248413085938, -0.1112823486328125, -0.10486221313476562, -0.09844207763671875, -0.09202194213867188, -0.085601806640625, -0.07918167114257812, -0.07276153564453125, -0.06634140014648438, -0.0599212646484375, -0.053501129150390625, -0.04708099365234375, -0.040660858154296875, -0.03424072265625, -0.027820587158203125, -0.02140045166015625, -0.014980316162109375, -0.0085601806640625, -0.002140045166015625, 0.00428009033203125, 0.010700225830078125, 0.017120361328125, 0.023540496826171875, 0.02996063232421875, 0.036380767822265625, 0.0428009033203125, 0.049221038818359375, 0.05564117431640625, 0.062061309814453125, 0.0684814453125, 0.07490158081054688, 0.08132171630859375, 0.08774185180664062, 0.0941619873046875, 0.10058212280273438, 0.10700225830078125, 0.11342239379882812, 0.119842529296875, 0.12626266479492188, 0.13268280029296875, 0.13910293579101562, 0.1455230712890625, 0.15194320678710938, 0.15836334228515625, 0.16478347778320312, 0.17120361328125, 0.17762374877929688, 0.18404388427734375, 0.19046401977539062, 0.1968841552734375, 0.20330429077148438, 0.20972442626953125, 0.21614456176757812, 0.222564697265625, 0.22898483276367188, 0.23540496826171875, 0.24182510375976562, 0.2482452392578125, 0.2546653747558594, 0.26108551025390625, 0.2675056457519531, 0.27392578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 47.0, 61.0, 83.0, 98.0, 99.0, 98.0, 94.0, 113.0, 77.0, 39.0, 31.0, 25.0, 21.0, 13.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42179274559020996, -0.39984646439552307, -0.3779001832008362, -0.3559538722038269, -0.3340076208114624, -0.3120613098144531, -0.29011502861976624, -0.26816874742507935, -0.24622246623039246, -0.22427618503570557, -0.20232990384101868, -0.1803836077451706, -0.1584373265504837, -0.13649104535579681, -0.11454474925994873, -0.09259846806526184, -0.07065218687057495, -0.04870590195059776, -0.026759617030620575, -0.004813328385353088, 0.0171329528093338, 0.03907923400402069, 0.061025530099868774, 0.08297181129455566, 0.10491809248924255, 0.12686437368392944, 0.14881065487861633, 0.17075695097446442, 0.1927032321691513, 0.2146495133638382, 0.23659580945968628, 0.25854209065437317, 0.2804883122444153, 0.3024345934391022, 0.32438087463378906, 0.34632718563079834, 0.36827343702316284, 0.3902197480201721, 0.412166029214859, 0.4341123104095459, 0.4560585916042328, 0.4780048727989197, 0.49995115399360657, 0.5218974351882935, 0.5438437461853027, 0.5657899975776672, 0.5877363085746765, 0.609682559967041, 0.6316288709640503, 0.6535751819610596, 0.6755214333534241, 0.6974677443504333, 0.7194139957427979, 0.7413603067398071, 0.7633066177368164, 0.7852528691291809, 0.8071991205215454, 0.8291454315185547, 0.8510916829109192, 0.8730379939079285, 0.894984245300293, 0.9169305562973022, 0.9388768672943115, 0.960823118686676, 0.9827694296836853]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 2.0, 4.0, 8.0, 13.0, 19.0, 18.0, 18.0, 22.0, 26.0, 33.0, 32.0, 39.0, 40.0, 44.0, 48.0, 36.0, 49.0, 51.0, 55.0, 48.0, 40.0, 49.0, 49.0, 40.0, 28.0, 22.0, 36.0, 23.0, 18.0, 18.0, 14.0, 12.0, 7.0, 5.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3696340024471283, -0.3574292063713074, -0.34522441029548645, -0.3330196142196655, -0.3208147883415222, -0.3086099922657013, -0.29640519618988037, -0.28420040011405945, -0.2719956040382385, -0.2597908079624176, -0.24758599698543549, -0.23538120090961456, -0.22317638993263245, -0.21097159385681152, -0.1987667977809906, -0.18656200170516968, -0.17435717582702637, -0.16215237975120544, -0.14994756877422333, -0.1377427726984024, -0.1255379617214203, -0.11333316564559937, -0.10112836956977844, -0.08892356604337692, -0.0767187625169754, -0.06451395899057388, -0.05230915918946266, -0.04010435938835144, -0.02789955586194992, -0.0156947523355484, -0.003489956259727478, 0.008714847266674042, 0.02091968059539795, 0.03312448412179947, 0.04532928392291069, 0.05753408372402191, 0.06973888725042343, 0.08194369077682495, 0.09414848685264587, 0.1063532903790474, 0.11855809390544891, 0.13076288998126984, 0.14296770095825195, 0.15517249703407288, 0.1673772931098938, 0.17958210408687592, 0.19178690016269684, 0.20399171113967896, 0.21619650721549988, 0.2284013032913208, 0.24060611426830292, 0.25281089544296265, 0.26501572132110596, 0.2772205173969269, 0.2894253134727478, 0.3016301095485687, 0.31383490562438965, 0.32603970170021057, 0.3382444977760315, 0.3504493236541748, 0.3626541197299957, 0.37485891580581665, 0.3870637118816376, 0.3992685079574585, 0.4114733338356018]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 11.0, 20.0, 16.0, 33.0, 37.0, 44.0, 54.0, 108.0, 138.0, 260.0, 492.0, 1051.0, 2191.0, 5351.0, 14086.0, 40213.0, 119922.0, 306115.0, 336956.0, 144418.0, 48865.0, 16713.0, 6328.0, 2607.0, 1160.0, 523.0, 279.0, 195.0, 104.0, 59.0, 46.0, 37.0, 33.0, 24.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06671142578125, -0.06486272811889648, -0.06301403045654297, -0.06116533279418945, -0.05931663513183594, -0.05746793746948242, -0.055619239807128906, -0.05377054214477539, -0.051921844482421875, -0.05007314682006836, -0.048224449157714844, -0.04637575149536133, -0.04452705383300781, -0.0426783561706543, -0.04082965850830078, -0.038980960845947266, -0.03713226318359375, -0.035283565521240234, -0.03343486785888672, -0.0315861701965332, -0.029737472534179688, -0.027888774871826172, -0.026040077209472656, -0.02419137954711914, -0.022342681884765625, -0.02049398422241211, -0.018645286560058594, -0.016796588897705078, -0.014947891235351562, -0.013099193572998047, -0.011250495910644531, -0.009401798248291016, -0.0075531005859375, -0.005704402923583984, -0.0038557052612304688, -0.002007007598876953, -0.0001583099365234375, 0.0016903877258300781, 0.0035390853881835938, 0.005387783050537109, 0.007236480712890625, 0.00908517837524414, 0.010933876037597656, 0.012782573699951172, 0.014631271362304688, 0.016479969024658203, 0.01832866668701172, 0.020177364349365234, 0.02202606201171875, 0.023874759674072266, 0.02572345733642578, 0.027572154998779297, 0.029420852661132812, 0.03126955032348633, 0.033118247985839844, 0.03496694564819336, 0.036815643310546875, 0.03866434097290039, 0.040513038635253906, 0.04236173629760742, 0.04421043395996094, 0.04605913162231445, 0.04790782928466797, 0.049756526947021484, 0.051605224609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 2.0, 14.0, 8.0, 4.0, 14.0, 24.0, 28.0, 31.0, 35.0, 39.0, 52.0, 65.0, 52.0, 55.0, 79.0, 67.0, 59.0, 76.0, 65.0, 41.0, 31.0, 36.0, 33.0, 19.0, 20.0, 20.0, 3.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.252227783203125, -0.24127197265625, -0.230316162109375, -0.2193603515625, -0.208404541015625, -0.19744873046875, -0.186492919921875, -0.175537109375, -0.164581298828125, -0.15362548828125, -0.142669677734375, -0.1317138671875, -0.120758056640625, -0.10980224609375, -0.098846435546875, -0.087890625, -0.076934814453125, -0.06597900390625, -0.055023193359375, -0.0440673828125, -0.033111572265625, -0.02215576171875, -0.011199951171875, -0.000244140625, 0.010711669921875, 0.02166748046875, 0.032623291015625, 0.0435791015625, 0.054534912109375, 0.06549072265625, 0.076446533203125, 0.08740234375, 0.098358154296875, 0.10931396484375, 0.120269775390625, 0.1312255859375, 0.142181396484375, 0.15313720703125, 0.164093017578125, 0.175048828125, 0.186004638671875, 0.19696044921875, 0.207916259765625, 0.2188720703125, 0.229827880859375, 0.24078369140625, 0.251739501953125, 0.2626953125, 0.273651123046875, 0.28460693359375, 0.295562744140625, 0.3065185546875, 0.317474365234375, 0.32843017578125, 0.339385986328125, 0.350341796875, 0.361297607421875, 0.37225341796875, 0.383209228515625, 0.3941650390625, 0.405120849609375, 0.41607666015625, 0.427032470703125, 0.43798828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 13.0, 8.0, 17.0, 19.0, 35.0, 48.0, 85.0, 121.0, 224.0, 314.0, 607.0, 1193.0, 2585.0, 6025.0, 15687.0, 47961.0, 158344.0, 389619.0, 287210.0, 92509.0, 28246.0, 9734.0, 3991.0, 1788.0, 887.0, 509.0, 307.0, 190.0, 104.0, 56.0, 29.0, 32.0, 21.0, 14.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.07427978515625, -0.07236433029174805, -0.0704488754272461, -0.06853342056274414, -0.06661796569824219, -0.06470251083374023, -0.06278705596923828, -0.06087160110473633, -0.058956146240234375, -0.05704069137573242, -0.05512523651123047, -0.053209781646728516, -0.05129432678222656, -0.04937887191772461, -0.047463417053222656, -0.0455479621887207, -0.04363250732421875, -0.0417170524597168, -0.039801597595214844, -0.03788614273071289, -0.03597068786621094, -0.034055233001708984, -0.03213977813720703, -0.030224323272705078, -0.028308868408203125, -0.026393413543701172, -0.02447795867919922, -0.022562503814697266, -0.020647048950195312, -0.01873159408569336, -0.016816139221191406, -0.014900684356689453, -0.0129852294921875, -0.011069774627685547, -0.009154319763183594, -0.007238864898681641, -0.0053234100341796875, -0.0034079551696777344, -0.0014925003051757812, 0.0004229545593261719, 0.002338409423828125, 0.004253864288330078, 0.006169319152832031, 0.008084774017333984, 0.010000228881835938, 0.01191568374633789, 0.013831138610839844, 0.015746593475341797, 0.01766204833984375, 0.019577503204345703, 0.021492958068847656, 0.02340841293334961, 0.025323867797851562, 0.027239322662353516, 0.02915477752685547, 0.031070232391357422, 0.032985687255859375, 0.03490114212036133, 0.03681659698486328, 0.038732051849365234, 0.04064750671386719, 0.04256296157836914, 0.044478416442871094, 0.04639387130737305, 0.048309326171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 10.0, 9.0, 15.0, 11.0, 12.0, 18.0, 19.0, 25.0, 20.0, 35.0, 34.0, 32.0, 39.0, 36.0, 46.0, 39.0, 55.0, 41.0, 55.0, 41.0, 35.0, 49.0, 44.0, 34.0, 35.0, 32.0, 31.0, 21.0, 19.0, 12.0, 16.0, 12.0, 8.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.55615234375, -0.5408363342285156, -0.5255203247070312, -0.5102043151855469, -0.4948883056640625, -0.4795722961425781, -0.46425628662109375, -0.4489402770996094, -0.433624267578125, -0.4183082580566406, -0.40299224853515625, -0.3876762390136719, -0.3723602294921875, -0.3570442199707031, -0.34172821044921875, -0.3264122009277344, -0.31109619140625, -0.2957801818847656, -0.28046417236328125, -0.2651481628417969, -0.2498321533203125, -0.23451614379882812, -0.21920013427734375, -0.20388412475585938, -0.188568115234375, -0.17325210571289062, -0.15793609619140625, -0.14262008666992188, -0.1273040771484375, -0.11198806762695312, -0.09667205810546875, -0.08135604858398438, -0.0660400390625, -0.050724029541015625, -0.03540802001953125, -0.020092010498046875, -0.0047760009765625, 0.010540008544921875, 0.02585601806640625, 0.041172027587890625, 0.056488037109375, 0.07180404663085938, 0.08712005615234375, 0.10243606567382812, 0.1177520751953125, 0.13306808471679688, 0.14838409423828125, 0.16370010375976562, 0.17901611328125, 0.19433212280273438, 0.20964813232421875, 0.22496414184570312, 0.2402801513671875, 0.2555961608886719, 0.27091217041015625, 0.2862281799316406, 0.301544189453125, 0.3168601989746094, 0.33217620849609375, 0.3474922180175781, 0.3628082275390625, 0.3781242370605469, 0.39344024658203125, 0.4087562561035156, 0.424072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 11.0, 21.0, 15.0, 26.0, 38.0, 53.0, 67.0, 103.0, 157.0, 246.0, 432.0, 764.0, 1341.0, 2692.0, 5752.0, 14690.0, 48505.0, 209496.0, 517549.0, 179473.0, 42993.0, 13226.0, 5206.0, 2491.0, 1322.0, 703.0, 417.0, 244.0, 175.0, 96.0, 77.0, 22.0, 42.0, 19.0, 10.0, 15.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020233154296875, -0.019568681716918945, -0.01890420913696289, -0.018239736557006836, -0.01757526397705078, -0.016910791397094727, -0.016246318817138672, -0.015581846237182617, -0.014917373657226562, -0.014252901077270508, -0.013588428497314453, -0.012923955917358398, -0.012259483337402344, -0.011595010757446289, -0.010930538177490234, -0.01026606559753418, -0.009601593017578125, -0.00893712043762207, -0.008272647857666016, -0.007608175277709961, -0.006943702697753906, -0.0062792301177978516, -0.005614757537841797, -0.004950284957885742, -0.0042858123779296875, -0.003621339797973633, -0.002956867218017578, -0.0022923946380615234, -0.0016279220581054688, -0.0009634494781494141, -0.0002989768981933594, 0.0003654956817626953, 0.00102996826171875, 0.0016944408416748047, 0.0023589134216308594, 0.003023386001586914, 0.0036878585815429688, 0.0043523311614990234, 0.005016803741455078, 0.005681276321411133, 0.0063457489013671875, 0.007010221481323242, 0.007674694061279297, 0.008339166641235352, 0.009003639221191406, 0.009668111801147461, 0.010332584381103516, 0.01099705696105957, 0.011661529541015625, 0.01232600212097168, 0.012990474700927734, 0.013654947280883789, 0.014319419860839844, 0.014983892440795898, 0.015648365020751953, 0.016312837600708008, 0.016977310180664062, 0.017641782760620117, 0.018306255340576172, 0.018970727920532227, 0.01963520050048828, 0.020299673080444336, 0.02096414566040039, 0.021628618240356445, 0.0222930908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 7.0, 24.0, 24.0, 30.0, 47.0, 51.0, 54.0, 87.0, 71.0, 110.0, 104.0, 77.0, 88.0, 63.0, 39.0, 30.0, 32.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4901161193847656e-05, -1.4456920325756073e-05, -1.401267945766449e-05, -1.3568438589572906e-05, -1.3124197721481323e-05, -1.267995685338974e-05, -1.2235715985298157e-05, -1.1791475117206573e-05, -1.134723424911499e-05, -1.0902993381023407e-05, -1.0458752512931824e-05, -1.001451164484024e-05, -9.570270776748657e-06, -9.126029908657074e-06, -8.68178904056549e-06, -8.237548172473907e-06, -7.793307304382324e-06, -7.349066436290741e-06, -6.904825568199158e-06, -6.4605847001075745e-06, -6.016343832015991e-06, -5.572102963924408e-06, -5.127862095832825e-06, -4.6836212277412415e-06, -4.239380359649658e-06, -3.795139491558075e-06, -3.3508986234664917e-06, -2.9066577553749084e-06, -2.462416887283325e-06, -2.018176019191742e-06, -1.5739351511001587e-06, -1.1296942830085754e-06, -6.854534149169922e-07, -2.4121254682540894e-07, 2.0302832126617432e-07, 6.472691893577576e-07, 1.0915100574493408e-06, 1.535750925540924e-06, 1.9799917936325073e-06, 2.4242326617240906e-06, 2.868473529815674e-06, 3.312714397907257e-06, 3.7569552659988403e-06, 4.201196134090424e-06, 4.645437002182007e-06, 5.08967787027359e-06, 5.533918738365173e-06, 5.978159606456757e-06, 6.42240047454834e-06, 6.866641342639923e-06, 7.310882210731506e-06, 7.75512307882309e-06, 8.199363946914673e-06, 8.643604815006256e-06, 9.08784568309784e-06, 9.532086551189423e-06, 9.976327419281006e-06, 1.0420568287372589e-05, 1.0864809155464172e-05, 1.1309050023555756e-05, 1.1753290891647339e-05, 1.2197531759738922e-05, 1.2641772627830505e-05, 1.3086013495922089e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 13.0, 17.0, 28.0, 35.0, 59.0, 74.0, 113.0, 124.0, 215.0, 379.0, 704.0, 1193.0, 2470.0, 5791.0, 14656.0, 41681.0, 126174.0, 318484.0, 330538.0, 134083.0, 44462.0, 15665.0, 6068.0, 2500.0, 1239.0, 610.0, 376.0, 236.0, 154.0, 109.0, 87.0, 49.0, 36.0, 34.0, 25.0, 13.0, 10.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0158538818359375, -0.015342950820922852, -0.014832019805908203, -0.014321088790893555, -0.013810157775878906, -0.013299226760864258, -0.01278829574584961, -0.012277364730834961, -0.011766433715820312, -0.011255502700805664, -0.010744571685791016, -0.010233640670776367, -0.009722709655761719, -0.00921177864074707, -0.008700847625732422, -0.008189916610717773, -0.007678985595703125, -0.0071680545806884766, -0.006657123565673828, -0.00614619255065918, -0.005635261535644531, -0.005124330520629883, -0.004613399505615234, -0.004102468490600586, -0.0035915374755859375, -0.003080606460571289, -0.0025696754455566406, -0.002058744430541992, -0.0015478134155273438, -0.0010368824005126953, -0.0005259513854980469, -1.5020370483398438e-05, 0.00049591064453125, 0.0010068416595458984, 0.0015177726745605469, 0.0020287036895751953, 0.0025396347045898438, 0.003050565719604492, 0.0035614967346191406, 0.004072427749633789, 0.0045833587646484375, 0.005094289779663086, 0.005605220794677734, 0.006116151809692383, 0.006627082824707031, 0.00713801383972168, 0.007648944854736328, 0.008159875869750977, 0.008670806884765625, 0.009181737899780273, 0.009692668914794922, 0.01020359992980957, 0.010714530944824219, 0.011225461959838867, 0.011736392974853516, 0.012247323989868164, 0.012758255004882812, 0.013269186019897461, 0.01378011703491211, 0.014291048049926758, 0.014801979064941406, 0.015312910079956055, 0.015823841094970703, 0.01633477210998535, 0.016845703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 11.0, 11.0, 10.0, 12.0, 8.0, 19.0, 30.0, 25.0, 31.0, 29.0, 38.0, 62.0, 52.0, 49.0, 67.0, 57.0, 44.0, 52.0, 46.0, 50.0, 37.0, 32.0, 39.0, 31.0, 22.0, 27.0, 19.0, 16.0, 11.0, 9.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0048065185546875, -0.004659771919250488, -0.0045130252838134766, -0.004366278648376465, -0.004219532012939453, -0.004072785377502441, -0.00392603874206543, -0.003779292106628418, -0.0036325454711914062, -0.0034857988357543945, -0.003339052200317383, -0.003192305564880371, -0.0030455589294433594, -0.0028988122940063477, -0.002752065658569336, -0.0026053190231323242, -0.0024585723876953125, -0.0023118257522583008, -0.002165079116821289, -0.0020183324813842773, -0.0018715858459472656, -0.001724839210510254, -0.0015780925750732422, -0.0014313459396362305, -0.0012845993041992188, -0.001137852668762207, -0.0009911060333251953, -0.0008443593978881836, -0.0006976127624511719, -0.0005508661270141602, -0.00040411949157714844, -0.0002573728561401367, -0.000110626220703125, 3.612041473388672e-05, 0.00018286705017089844, 0.00032961368560791016, 0.0004763603210449219, 0.0006231069564819336, 0.0007698535919189453, 0.000916600227355957, 0.0010633468627929688, 0.0012100934982299805, 0.0013568401336669922, 0.001503586769104004, 0.0016503334045410156, 0.0017970800399780273, 0.001943826675415039, 0.0020905733108520508, 0.0022373199462890625, 0.0023840665817260742, 0.002530813217163086, 0.0026775598526000977, 0.0028243064880371094, 0.002971053123474121, 0.003117799758911133, 0.0032645463943481445, 0.0034112930297851562, 0.003558039665222168, 0.0037047863006591797, 0.0038515329360961914, 0.003998279571533203, 0.004145026206970215, 0.0042917728424072266, 0.004438519477844238, 0.00458526611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 17.0, 25.0, 52.0, 150.0, 210.0, 250.0, 166.0, 75.0, 28.0, 14.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1758981943130493, -1.1465601921081543, -1.1172221899032593, -1.0878841876983643, -1.0585461854934692, -1.0292081832885742, -0.9998701810836792, -0.9705321788787842, -0.9411941766738892, -0.9118561744689941, -0.8825181722640991, -0.8531801700592041, -0.8238421678543091, -0.7945041656494141, -0.765166163444519, -0.735828161239624, -0.706490159034729, -0.677152156829834, -0.647814154624939, -0.618476152420044, -0.5891381502151489, -0.5598001480102539, -0.5304621458053589, -0.5011241436004639, -0.47178614139556885, -0.44244813919067383, -0.4131101369857788, -0.3837721347808838, -0.35443413257598877, -0.32509613037109375, -0.29575812816619873, -0.2664201259613037, -0.23708206415176392, -0.2077440619468689, -0.17840605974197388, -0.14906805753707886, -0.11973005533218384, -0.09039205312728882, -0.0610540509223938, -0.03171604871749878, -0.0023780465126037598, 0.02695995569229126, 0.05629795789718628, 0.0856359601020813, 0.11497396230697632, 0.14431196451187134, 0.17364996671676636, 0.20298796892166138, 0.2323259711265564, 0.2616639733314514, 0.29100197553634644, 0.32033997774124146, 0.3496779799461365, 0.3790159821510315, 0.4083539843559265, 0.43769198656082153, 0.46702998876571655, 0.4963679909706116, 0.5257059931755066, 0.5550439953804016, 0.5843819975852966, 0.6137199997901917, 0.6430580019950867, 0.6723960041999817, 0.7017340064048767]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 9.0, 17.0, 19.0, 22.0, 25.0, 39.0, 38.0, 33.0, 59.0, 54.0, 62.0, 50.0, 60.0, 70.0, 61.0, 58.0, 52.0, 45.0, 36.0, 35.0, 31.0, 21.0, 23.0, 14.0, 7.0, 11.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2743450701236725, -0.26477813720703125, -0.2552111744880676, -0.2456442266702652, -0.23607727885246277, -0.22651033103466034, -0.2169433832168579, -0.20737643539905548, -0.19780948758125305, -0.18824253976345062, -0.1786755919456482, -0.16910864412784576, -0.15954169631004333, -0.1499747484922409, -0.14040780067443848, -0.13084085285663605, -0.12127390503883362, -0.11170695722103119, -0.10214000940322876, -0.09257306158542633, -0.0830061137676239, -0.07343916594982147, -0.06387221813201904, -0.054305270314216614, -0.044738322496414185, -0.035171374678611755, -0.025604426860809326, -0.016037479043006897, -0.006470531225204468, 0.0030964165925979614, 0.01266336441040039, 0.02223031222820282, 0.03179726004600525, 0.04136420786380768, 0.05093115568161011, 0.06049810349941254, 0.07006505131721497, 0.0796319991350174, 0.08919894695281982, 0.09876589477062225, 0.10833284258842468, 0.11789979040622711, 0.12746673822402954, 0.13703368604183197, 0.1466006338596344, 0.15616758167743683, 0.16573452949523926, 0.1753014773130417, 0.18486842513084412, 0.19443537294864655, 0.20400232076644897, 0.2135692685842514, 0.22313621640205383, 0.23270316421985626, 0.2422701120376587, 0.2518370747566223, 0.26140400767326355, 0.2709709405899048, 0.2805379033088684, 0.29010486602783203, 0.29967179894447327, 0.3092387318611145, 0.3188056945800781, 0.32837265729904175, 0.337939590215683]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 15.0, 11.0, 24.0, 38.0, 51.0, 81.0, 124.0, 193.0, 291.0, 556.0, 933.0, 1680.0, 3223.0, 6451.0, 13813.0, 32101.0, 91108.0, 333532.0, 387404.0, 109035.0, 37242.0, 15515.0, 7074.0, 3539.0, 1894.0, 1030.0, 597.0, 366.0, 230.0, 132.0, 88.0, 48.0, 36.0, 30.0, 19.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.290771484375, -0.2822380065917969, -0.27370452880859375, -0.2651710510253906, -0.2566375732421875, -0.24810409545898438, -0.23957061767578125, -0.23103713989257812, -0.222503662109375, -0.21397018432617188, -0.20543670654296875, -0.19690322875976562, -0.1883697509765625, -0.17983627319335938, -0.17130279541015625, -0.16276931762695312, -0.15423583984375, -0.14570236206054688, -0.13716888427734375, -0.12863540649414062, -0.1201019287109375, -0.11156845092773438, -0.10303497314453125, -0.09450149536132812, -0.085968017578125, -0.07743453979492188, -0.06890106201171875, -0.060367584228515625, -0.0518341064453125, -0.043300628662109375, -0.03476715087890625, -0.026233673095703125, -0.0177001953125, -0.009166717529296875, -0.00063323974609375, 0.007900238037109375, 0.0164337158203125, 0.024967193603515625, 0.03350067138671875, 0.042034149169921875, 0.050567626953125, 0.059101104736328125, 0.06763458251953125, 0.07616806030273438, 0.0847015380859375, 0.09323501586914062, 0.10176849365234375, 0.11030197143554688, 0.11883544921875, 0.12736892700195312, 0.13590240478515625, 0.14443588256835938, 0.1529693603515625, 0.16150283813476562, 0.17003631591796875, 0.17856979370117188, 0.187103271484375, 0.19563674926757812, 0.20417022705078125, 0.21270370483398438, 0.2212371826171875, 0.22977066040039062, 0.23830413818359375, 0.24683761596679688, 0.25537109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 14.0, 12.0, 15.0, 30.0, 30.0, 36.0, 47.0, 45.0, 59.0, 42.0, 45.0, 67.0, 59.0, 71.0, 52.0, 58.0, 50.0, 44.0, 43.0, 29.0, 28.0, 16.0, 13.0, 15.0, 13.0, 6.0, 8.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4587249755859375, -0.440399169921875, -0.4220733642578125, -0.40374755859375, -0.3854217529296875, -0.367095947265625, -0.3487701416015625, -0.3304443359375, -0.3121185302734375, -0.293792724609375, -0.2754669189453125, -0.25714111328125, -0.2388153076171875, -0.220489501953125, -0.2021636962890625, -0.183837890625, -0.1655120849609375, -0.147186279296875, -0.1288604736328125, -0.11053466796875, -0.0922088623046875, -0.073883056640625, -0.0555572509765625, -0.0372314453125, -0.0189056396484375, -0.000579833984375, 0.0177459716796875, 0.03607177734375, 0.0543975830078125, 0.072723388671875, 0.0910491943359375, 0.109375, 0.1277008056640625, 0.146026611328125, 0.1643524169921875, 0.18267822265625, 0.2010040283203125, 0.219329833984375, 0.2376556396484375, 0.2559814453125, 0.2743072509765625, 0.292633056640625, 0.3109588623046875, 0.32928466796875, 0.3476104736328125, 0.365936279296875, 0.3842620849609375, 0.402587890625, 0.4209136962890625, 0.439239501953125, 0.4575653076171875, 0.47589111328125, 0.4942169189453125, 0.512542724609375, 0.5308685302734375, 0.5491943359375, 0.5675201416015625, 0.585845947265625, 0.6041717529296875, 0.62249755859375, 0.6408233642578125, 0.659149169921875, 0.6774749755859375, 0.69580078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 5.0, 9.0, 7.0, 9.0, 19.0, 27.0, 36.0, 53.0, 76.0, 125.0, 252.0, 655.0, 2635.0, 14666.0, 194610.0, 781092.0, 46200.0, 5882.0, 1252.0, 425.0, 162.0, 101.0, 71.0, 32.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 7.0, 6.0, 7.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56201171875, -0.5421218872070312, -0.5222320556640625, -0.5023422241210938, -0.482452392578125, -0.46256256103515625, -0.4426727294921875, -0.42278289794921875, -0.40289306640625, -0.38300323486328125, -0.3631134033203125, -0.34322357177734375, -0.323333740234375, -0.30344390869140625, -0.2835540771484375, -0.26366424560546875, -0.2437744140625, -0.22388458251953125, -0.2039947509765625, -0.18410491943359375, -0.164215087890625, -0.14432525634765625, -0.1244354248046875, -0.10454559326171875, -0.08465576171875, -0.06476593017578125, -0.0448760986328125, -0.02498626708984375, -0.005096435546875, 0.01479339599609375, 0.0346832275390625, 0.05457305908203125, 0.074462890625, 0.09435272216796875, 0.1142425537109375, 0.13413238525390625, 0.154022216796875, 0.17391204833984375, 0.1938018798828125, 0.21369171142578125, 0.23358154296875, 0.25347137451171875, 0.2733612060546875, 0.29325103759765625, 0.313140869140625, 0.33303070068359375, 0.3529205322265625, 0.37281036376953125, 0.3927001953125, 0.41259002685546875, 0.4324798583984375, 0.45236968994140625, 0.472259521484375, 0.49214935302734375, 0.5120391845703125, 0.5319290161132812, 0.55181884765625, 0.5717086791992188, 0.5915985107421875, 0.6114883422851562, 0.631378173828125, 0.6512680053710938, 0.6711578369140625, 0.6910476684570312, 0.7109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 4.0, 10.0, 11.0, 13.0, 16.0, 7.0, 22.0, 35.0, 26.0, 28.0, 27.0, 36.0, 30.0, 42.0, 48.0, 57.0, 61.0, 52.0, 30.0, 39.0, 44.0, 48.0, 37.0, 28.0, 46.0, 36.0, 31.0, 28.0, 22.0, 9.0, 16.0, 13.0, 13.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49755859375, -0.480010986328125, -0.46246337890625, -0.444915771484375, -0.4273681640625, -0.409820556640625, -0.39227294921875, -0.374725341796875, -0.357177734375, -0.339630126953125, -0.32208251953125, -0.304534912109375, -0.2869873046875, -0.269439697265625, -0.25189208984375, -0.234344482421875, -0.216796875, -0.199249267578125, -0.18170166015625, -0.164154052734375, -0.1466064453125, -0.129058837890625, -0.11151123046875, -0.093963623046875, -0.076416015625, -0.058868408203125, -0.04132080078125, -0.023773193359375, -0.0062255859375, 0.011322021484375, 0.02886962890625, 0.046417236328125, 0.06396484375, 0.081512451171875, 0.09906005859375, 0.116607666015625, 0.1341552734375, 0.151702880859375, 0.16925048828125, 0.186798095703125, 0.204345703125, 0.221893310546875, 0.23944091796875, 0.256988525390625, 0.2745361328125, 0.292083740234375, 0.30963134765625, 0.327178955078125, 0.3447265625, 0.362274169921875, 0.37982177734375, 0.397369384765625, 0.4149169921875, 0.432464599609375, 0.45001220703125, 0.467559814453125, 0.485107421875, 0.502655029296875, 0.52020263671875, 0.537750244140625, 0.5552978515625, 0.572845458984375, 0.59039306640625, 0.607940673828125, 0.62548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 14.0, 30.0, 40.0, 67.0, 124.0, 227.0, 408.0, 841.0, 1775.0, 4500.0, 18337.0, 298281.0, 681067.0, 32402.0, 5999.0, 2313.0, 1038.0, 476.0, 255.0, 129.0, 81.0, 57.0, 28.0, 12.0, 16.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24354171752929688, -0.23488616943359375, -0.22623062133789062, -0.2175750732421875, -0.20891952514648438, -0.20026397705078125, -0.19160842895507812, -0.182952880859375, -0.17429733276367188, -0.16564178466796875, -0.15698623657226562, -0.1483306884765625, -0.13967514038085938, -0.13101959228515625, -0.12236404418945312, -0.11370849609375, -0.10505294799804688, -0.09639739990234375, -0.08774185180664062, -0.0790863037109375, -0.07043075561523438, -0.06177520751953125, -0.053119659423828125, -0.044464111328125, -0.035808563232421875, -0.02715301513671875, -0.018497467041015625, -0.0098419189453125, -0.001186370849609375, 0.00746917724609375, 0.016124725341796875, 0.0247802734375, 0.033435821533203125, 0.04209136962890625, 0.050746917724609375, 0.0594024658203125, 0.06805801391601562, 0.07671356201171875, 0.08536911010742188, 0.094024658203125, 0.10268020629882812, 0.11133575439453125, 0.11999130249023438, 0.1286468505859375, 0.13730239868164062, 0.14595794677734375, 0.15461349487304688, 0.16326904296875, 0.17192459106445312, 0.18058013916015625, 0.18923568725585938, 0.1978912353515625, 0.20654678344726562, 0.21520233154296875, 0.22385787963867188, 0.232513427734375, 0.24116897583007812, 0.24982452392578125, 0.2584800720214844, 0.2671356201171875, 0.2757911682128906, 0.28444671630859375, 0.2931022644042969, 0.3017578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 16.0, 22.0, 49.0, 70.0, 132.0, 196.0, 206.0, 140.0, 59.0, 34.0, 24.0, 22.0, 5.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.725290298461914e-05, -3.576651215553284e-05, -3.428012132644653e-05, -3.279373049736023e-05, -3.1307339668273926e-05, -2.9820948839187622e-05, -2.833455801010132e-05, -2.6848167181015015e-05, -2.536177635192871e-05, -2.3875385522842407e-05, -2.2388994693756104e-05, -2.09026038646698e-05, -1.9416213035583496e-05, -1.7929822206497192e-05, -1.644343137741089e-05, -1.4957040548324585e-05, -1.3470649719238281e-05, -1.1984258890151978e-05, -1.0497868061065674e-05, -9.01147723197937e-06, -7.525086402893066e-06, -6.038695573806763e-06, -4.552304744720459e-06, -3.0659139156341553e-06, -1.5795230865478516e-06, -9.313225746154785e-08, 1.3932585716247559e-06, 2.8796494007110596e-06, 4.366040229797363e-06, 5.852431058883667e-06, 7.338821887969971e-06, 8.825212717056274e-06, 1.0311603546142578e-05, 1.1797994375228882e-05, 1.3284385204315186e-05, 1.477077603340149e-05, 1.6257166862487793e-05, 1.7743557691574097e-05, 1.92299485206604e-05, 2.0716339349746704e-05, 2.2202730178833008e-05, 2.368912100791931e-05, 2.5175511837005615e-05, 2.666190266609192e-05, 2.8148293495178223e-05, 2.9634684324264526e-05, 3.112107515335083e-05, 3.2607465982437134e-05, 3.409385681152344e-05, 3.558024764060974e-05, 3.7066638469696045e-05, 3.855302929878235e-05, 4.003942012786865e-05, 4.1525810956954956e-05, 4.301220178604126e-05, 4.4498592615127563e-05, 4.598498344421387e-05, 4.747137427330017e-05, 4.8957765102386475e-05, 5.044415593147278e-05, 5.193054676055908e-05, 5.3416937589645386e-05, 5.490332841873169e-05, 5.638971924781799e-05, 5.78761100769043e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 20.0, 30.0, 41.0, 64.0, 167.0, 456.0, 1443.0, 5423.0, 50558.0, 927910.0, 54436.0, 5712.0, 1406.0, 460.0, 185.0, 81.0, 43.0, 30.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388427734375, -0.3764801025390625, -0.364532470703125, -0.3525848388671875, -0.34063720703125, -0.3286895751953125, -0.316741943359375, -0.3047943115234375, -0.2928466796875, -0.2808990478515625, -0.268951416015625, -0.2570037841796875, -0.24505615234375, -0.2331085205078125, -0.221160888671875, -0.2092132568359375, -0.197265625, -0.1853179931640625, -0.173370361328125, -0.1614227294921875, -0.14947509765625, -0.1375274658203125, -0.125579833984375, -0.1136322021484375, -0.1016845703125, -0.0897369384765625, -0.077789306640625, -0.0658416748046875, -0.05389404296875, -0.0419464111328125, -0.029998779296875, -0.0180511474609375, -0.006103515625, 0.0058441162109375, 0.017791748046875, 0.0297393798828125, 0.04168701171875, 0.0536346435546875, 0.065582275390625, 0.0775299072265625, 0.0894775390625, 0.1014251708984375, 0.113372802734375, 0.1253204345703125, 0.13726806640625, 0.1492156982421875, 0.161163330078125, 0.1731109619140625, 0.18505859375, 0.1970062255859375, 0.208953857421875, 0.2209014892578125, 0.23284912109375, 0.2447967529296875, 0.256744384765625, 0.2686920166015625, 0.2806396484375, 0.2925872802734375, 0.304534912109375, 0.3164825439453125, 0.32843017578125, 0.3403778076171875, 0.352325439453125, 0.3642730712890625, 0.376220703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 12.0, 6.0, 16.0, 24.0, 28.0, 45.0, 51.0, 104.0, 130.0, 161.0, 113.0, 107.0, 68.0, 30.0, 33.0, 16.0, 16.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0799560546875, -0.0770425796508789, -0.07412910461425781, -0.07121562957763672, -0.06830215454101562, -0.06538867950439453, -0.06247520446777344, -0.059561729431152344, -0.05664825439453125, -0.053734779357910156, -0.05082130432128906, -0.04790782928466797, -0.044994354248046875, -0.04208087921142578, -0.03916740417480469, -0.036253929138183594, -0.0333404541015625, -0.030426979064941406, -0.027513504028320312, -0.02460002899169922, -0.021686553955078125, -0.01877307891845703, -0.015859603881835938, -0.012946128845214844, -0.01003265380859375, -0.007119178771972656, -0.0042057037353515625, -0.0012922286987304688, 0.001621246337890625, 0.004534721374511719, 0.0074481964111328125, 0.010361671447753906, 0.013275146484375, 0.016188621520996094, 0.019102096557617188, 0.02201557159423828, 0.024929046630859375, 0.02784252166748047, 0.030755996704101562, 0.033669471740722656, 0.03658294677734375, 0.039496421813964844, 0.04240989685058594, 0.04532337188720703, 0.048236846923828125, 0.05115032196044922, 0.05406379699707031, 0.056977272033691406, 0.0598907470703125, 0.0628042221069336, 0.06571769714355469, 0.06863117218017578, 0.07154464721679688, 0.07445812225341797, 0.07737159729003906, 0.08028507232666016, 0.08319854736328125, 0.08611202239990234, 0.08902549743652344, 0.09193897247314453, 0.09485244750976562, 0.09776592254638672, 0.10067939758300781, 0.1035928726196289, 0.10650634765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 5.0, 19.0, 29.0, 46.0, 113.0, 148.0, 223.0, 180.0, 116.0, 56.0, 35.0, 18.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302221775054932, -0.48031696677207947, -0.43041178584098816, -0.38050657510757446, -0.33060139417648315, -0.28069618344306946, -0.23079097270965576, -0.18088579177856445, -0.13098058104515076, -0.08107538521289825, -0.031170181930065155, 0.018735021352767944, 0.06864021718502045, 0.11854541301727295, 0.16845062375068665, 0.21835580468177795, 0.26826101541519165, 0.31816622614860535, 0.36807140707969666, 0.41797661781311035, 0.46788179874420166, 0.517786979675293, 0.567692220211029, 0.6175974011421204, 0.6675026416778564, 0.7174078226089478, 0.7673130631446838, 0.8172182440757751, 0.8671234250068665, 0.9170286655426025, 0.9669338464736938, 1.0168390274047852, 1.0667442083358765, 1.1166493892669678, 1.166554570198059, 1.2164597511291504, 1.2663650512695312, 1.3162702322006226, 1.3661754131317139, 1.4160805940628052, 1.4659857749938965, 1.5158909559249878, 1.565796136856079, 1.61570143699646, 1.6656066179275513, 1.7155117988586426, 1.7654169797897339, 1.8153221607208252, 1.865227460861206, 1.9151326417922974, 1.9650378227233887, 2.0149431228637695, 2.0648481845855713, 2.114753484725952, 2.164658546447754, 2.2145638465881348, 2.2644689083099365, 2.3143742084503174, 2.364279270172119, 2.4141845703125, 2.4640896320343018, 2.5139949321746826, 2.5638999938964844, 2.6138052940368652, 2.663710594177246]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 5.0, 6.0, 11.0, 10.0, 14.0, 9.0, 9.0, 23.0, 18.0, 19.0, 21.0, 19.0, 20.0, 24.0, 24.0, 28.0, 23.0, 34.0, 28.0, 36.0, 35.0, 33.0, 43.0, 35.0, 34.0, 44.0, 34.0, 24.0, 32.0, 41.0, 29.0, 30.0, 21.0, 20.0, 22.0, 24.0, 14.0, 19.0, 9.0, 14.0, 10.0, 2.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0], "bins": [-0.7506343722343445, -0.7271214127540588, -0.7036084532737732, -0.6800954937934875, -0.6565825939178467, -0.633069634437561, -0.6095566749572754, -0.5860437154769897, -0.5625307559967041, -0.5390177965164185, -0.5155048370361328, -0.49199190735816956, -0.4684789478778839, -0.44496598839759827, -0.421453058719635, -0.39794009923934937, -0.3744271397590637, -0.3509141802787781, -0.32740122079849243, -0.3038882911205292, -0.28037533164024353, -0.2568623721599579, -0.23334942758083344, -0.20983648300170898, -0.18632352352142334, -0.1628105640411377, -0.13929761946201324, -0.1157846674323082, -0.09227171540260315, -0.0687587633728981, -0.045245811343193054, -0.021732866764068604, 0.001780092716217041, 0.02529304474592209, 0.048805996775627136, 0.07231894880533218, 0.09583190083503723, 0.11934485286474228, 0.14285780489444733, 0.16637074947357178, 0.18988370895385742, 0.21339666843414307, 0.23690961301326752, 0.26042255759239197, 0.2839355170726776, 0.30744847655296326, 0.3309614062309265, 0.35447436571121216, 0.3779873251914978, 0.40150028467178345, 0.4250132441520691, 0.44852617383003235, 0.472039133310318, 0.49555209279060364, 0.5190650224685669, 0.5425779819488525, 0.5660909414291382, 0.5896039009094238, 0.6131168603897095, 0.6366298198699951, 0.6601427793502808, 0.6836556792259216, 0.7071686387062073, 0.7306815981864929, 0.7541945576667786]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 10.0, 24.0, 46.0, 99.0, 217.0, 536.0, 1611.0, 7012.0, 98068.0, 3906889.0, 169328.0, 7977.0, 1532.0, 487.0, 174.0, 92.0, 53.0, 24.0, 19.0, 16.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.887542724609375, -0.84637451171875, -0.805206298828125, -0.7640380859375, -0.722869873046875, -0.68170166015625, -0.640533447265625, -0.599365234375, -0.558197021484375, -0.51702880859375, -0.475860595703125, -0.4346923828125, -0.393524169921875, -0.35235595703125, -0.311187744140625, -0.27001953125, -0.228851318359375, -0.18768310546875, -0.146514892578125, -0.1053466796875, -0.064178466796875, -0.02301025390625, 0.018157958984375, 0.059326171875, 0.100494384765625, 0.14166259765625, 0.182830810546875, 0.2239990234375, 0.265167236328125, 0.30633544921875, 0.347503662109375, 0.388671875, 0.429840087890625, 0.47100830078125, 0.512176513671875, 0.5533447265625, 0.594512939453125, 0.63568115234375, 0.676849365234375, 0.718017578125, 0.759185791015625, 0.80035400390625, 0.841522216796875, 0.8826904296875, 0.923858642578125, 0.96502685546875, 1.006195068359375, 1.04736328125, 1.088531494140625, 1.12969970703125, 1.170867919921875, 1.2120361328125, 1.253204345703125, 1.29437255859375, 1.335540771484375, 1.376708984375, 1.417877197265625, 1.45904541015625, 1.500213623046875, 1.5413818359375, 1.582550048828125, 1.62371826171875, 1.664886474609375, 1.7060546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 18.0, 16.0, 25.0, 44.0, 30.0, 61.0, 58.0, 76.0, 77.0, 83.0, 105.0, 81.0, 72.0, 65.0, 43.0, 40.0, 27.0, 16.0, 18.0, 12.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.3507843017578125, -0.333892822265625, -0.3170013427734375, -0.30010986328125, -0.2832183837890625, -0.266326904296875, -0.2494354248046875, -0.2325439453125, -0.2156524658203125, -0.198760986328125, -0.1818695068359375, -0.16497802734375, -0.1480865478515625, -0.131195068359375, -0.1143035888671875, -0.097412109375, -0.0805206298828125, -0.063629150390625, -0.0467376708984375, -0.02984619140625, -0.0129547119140625, 0.003936767578125, 0.0208282470703125, 0.0377197265625, 0.0546112060546875, 0.071502685546875, 0.0883941650390625, 0.10528564453125, 0.1221771240234375, 0.139068603515625, 0.1559600830078125, 0.1728515625, 0.1897430419921875, 0.206634521484375, 0.2235260009765625, 0.24041748046875, 0.2573089599609375, 0.274200439453125, 0.2910919189453125, 0.3079833984375, 0.3248748779296875, 0.341766357421875, 0.3586578369140625, 0.37554931640625, 0.3924407958984375, 0.409332275390625, 0.4262237548828125, 0.443115234375, 0.4600067138671875, 0.476898193359375, 0.4937896728515625, 0.51068115234375, 0.5275726318359375, 0.544464111328125, 0.5613555908203125, 0.5782470703125, 0.5951385498046875, 0.612030029296875, 0.6289215087890625, 0.64581298828125, 0.6627044677734375, 0.679595947265625, 0.6964874267578125, 0.71337890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 13.0, 20.0, 35.0, 43.0, 68.0, 150.0, 305.0, 745.0, 2057.0, 7603.0, 58638.0, 3135952.0, 949897.0, 30979.0, 4959.0, 1526.0, 655.0, 290.0, 134.0, 76.0, 45.0, 28.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7245025634765625, -0.697540283203125, -0.6705780029296875, -0.64361572265625, -0.6166534423828125, -0.589691162109375, -0.5627288818359375, -0.5357666015625, -0.5088043212890625, -0.481842041015625, -0.4548797607421875, -0.42791748046875, -0.4009552001953125, -0.373992919921875, -0.3470306396484375, -0.320068359375, -0.2931060791015625, -0.266143798828125, -0.2391815185546875, -0.21221923828125, -0.1852569580078125, -0.158294677734375, -0.1313323974609375, -0.1043701171875, -0.0774078369140625, -0.050445556640625, -0.0234832763671875, 0.00347900390625, 0.0304412841796875, 0.057403564453125, 0.0843658447265625, 0.111328125, 0.1382904052734375, 0.165252685546875, 0.1922149658203125, 0.21917724609375, 0.2461395263671875, 0.273101806640625, 0.3000640869140625, 0.3270263671875, 0.3539886474609375, 0.380950927734375, 0.4079132080078125, 0.43487548828125, 0.4618377685546875, 0.488800048828125, 0.5157623291015625, 0.542724609375, 0.5696868896484375, 0.596649169921875, 0.6236114501953125, 0.65057373046875, 0.6775360107421875, 0.704498291015625, 0.7314605712890625, 0.7584228515625, 0.7853851318359375, 0.812347412109375, 0.8393096923828125, 0.86627197265625, 0.8932342529296875, 0.920196533203125, 0.9471588134765625, 0.97412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 11.0, 15.0, 21.0, 33.0, 42.0, 67.0, 107.0, 174.0, 274.0, 458.0, 679.0, 791.0, 499.0, 334.0, 182.0, 107.0, 72.0, 60.0, 36.0, 30.0, 15.0, 7.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18670654296875, -0.181396484375, -0.17608642578125, -0.1707763671875, -0.16546630859375, -0.16015625, -0.15484619140625, -0.1495361328125, -0.14422607421875, -0.138916015625, -0.13360595703125, -0.1282958984375, -0.12298583984375, -0.11767578125, -0.11236572265625, -0.1070556640625, -0.10174560546875, -0.096435546875, -0.09112548828125, -0.0858154296875, -0.08050537109375, -0.0751953125, -0.06988525390625, -0.0645751953125, -0.05926513671875, -0.053955078125, -0.04864501953125, -0.0433349609375, -0.03802490234375, -0.03271484375, -0.02740478515625, -0.0220947265625, -0.01678466796875, -0.011474609375, -0.00616455078125, -0.0008544921875, 0.00445556640625, 0.009765625, 0.01507568359375, 0.0203857421875, 0.02569580078125, 0.031005859375, 0.03631591796875, 0.0416259765625, 0.04693603515625, 0.05224609375, 0.05755615234375, 0.0628662109375, 0.06817626953125, 0.073486328125, 0.07879638671875, 0.0841064453125, 0.08941650390625, 0.0947265625, 0.10003662109375, 0.1053466796875, 0.11065673828125, 0.115966796875, 0.12127685546875, 0.1265869140625, 0.13189697265625, 0.13720703125, 0.14251708984375, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 6.0, 4.0, 12.0, 15.0, 17.0, 17.0, 48.0, 94.0, 87.0, 120.0, 116.0, 123.0, 96.0, 88.0, 62.0, 38.0, 23.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6215534806251526, -0.5973003506660461, -0.5730472207069397, -0.548794150352478, -0.5245410203933716, -0.5002878904342651, -0.4760347604751587, -0.45178163051605225, -0.4275285303592682, -0.40327540040016174, -0.3790223002433777, -0.35476917028427124, -0.3305160403251648, -0.30626294016838074, -0.2820098102092743, -0.25775671005249023, -0.2335035800933838, -0.20925046503543854, -0.1849973499774933, -0.16074422001838684, -0.1364911049604416, -0.11223798990249634, -0.08798485994338989, -0.06373174488544464, -0.03947862982749939, -0.01522551104426384, 0.00902760773897171, 0.03328073024749756, 0.05753384530544281, 0.08178696036338806, 0.1060400903224945, 0.13029320538043976, 0.154546320438385, 0.17879943549633026, 0.2030525505542755, 0.22730568051338196, 0.251558780670166, 0.27581191062927246, 0.3000650405883789, 0.32431817054748535, 0.3485712707042694, 0.37282440066337585, 0.3970775008201599, 0.42133063077926636, 0.4455837607383728, 0.46983686089515686, 0.4940899908542633, 0.5183430910110474, 0.5425962209701538, 0.5668493509292603, 0.5911024808883667, 0.6153556108474731, 0.6396086812019348, 0.6638618111610413, 0.6881149411201477, 0.7123680710792542, 0.7366211414337158, 0.7608742713928223, 0.7851274013519287, 0.8093805313110352, 0.8336336016654968, 0.8578867316246033, 0.8821398615837097, 0.9063929915428162, 0.9306461215019226]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 5.0, 11.0, 15.0, 17.0, 12.0, 16.0, 17.0, 20.0, 32.0, 31.0, 35.0, 22.0, 32.0, 41.0, 28.0, 35.0, 44.0, 44.0, 41.0, 42.0, 32.0, 49.0, 39.0, 44.0, 34.0, 27.0, 28.0, 18.0, 28.0, 19.0, 19.0, 18.0, 13.0, 12.0, 11.0, 9.0, 11.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.3360586166381836, -0.3264901638031006, -0.3169217109680176, -0.30735328793525696, -0.29778483510017395, -0.28821638226509094, -0.27864792943000793, -0.2690794765949249, -0.2595110535621643, -0.2499426007270813, -0.24037416279315948, -0.23080570995807648, -0.22123727202415466, -0.21166881918907166, -0.20210036635398865, -0.19253191351890564, -0.18296346068382263, -0.17339500784873962, -0.1638265699148178, -0.1542581170797348, -0.144689679145813, -0.13512122631072998, -0.12555277347564697, -0.11598432809114456, -0.10641588270664215, -0.09684743732213974, -0.08727899193763733, -0.07771053910255432, -0.06814209371805191, -0.0585736483335495, -0.04900519922375679, -0.03943675011396408, -0.02986830472946167, -0.02029985748231411, -0.01073141023516655, -0.0011629629880189896, 0.00840548425912857, 0.01797392964363098, 0.02754237875342369, 0.0371108278632164, 0.04667927324771881, 0.05624771863222122, 0.06581616401672363, 0.07538461685180664, 0.08495306223630905, 0.09452150762081146, 0.10408996045589447, 0.11365840584039688, 0.12322685122489929, 0.1327953040599823, 0.1423637419939041, 0.15193219482898712, 0.16150063276290894, 0.17106908559799194, 0.18063753843307495, 0.19020599126815796, 0.19977442920207977, 0.20934288203716278, 0.2189113199710846, 0.2284797728061676, 0.2380482256412506, 0.24761666357517242, 0.25718510150909424, 0.26675355434417725, 0.27632200717926025]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 9.0, 13.0, 21.0, 34.0, 23.0, 42.0, 66.0, 110.0, 158.0, 291.0, 608.0, 1482.0, 3967.0, 12130.0, 41339.0, 160637.0, 441022.0, 281229.0, 74517.0, 20375.0, 6348.0, 2282.0, 859.0, 402.0, 210.0, 97.0, 68.0, 56.0, 30.0, 25.0, 20.0, 14.0, 18.0, 8.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0694580078125, -0.06703948974609375, -0.0646209716796875, -0.06220245361328125, -0.059783935546875, -0.05736541748046875, -0.0549468994140625, -0.05252838134765625, -0.05010986328125, -0.04769134521484375, -0.0452728271484375, -0.04285430908203125, -0.040435791015625, -0.03801727294921875, -0.0355987548828125, -0.03318023681640625, -0.03076171875, -0.02834320068359375, -0.0259246826171875, -0.02350616455078125, -0.021087646484375, -0.01866912841796875, -0.0162506103515625, -0.01383209228515625, -0.01141357421875, -0.00899505615234375, -0.0065765380859375, -0.00415802001953125, -0.001739501953125, 0.00067901611328125, 0.0030975341796875, 0.00551605224609375, 0.0079345703125, 0.01035308837890625, 0.0127716064453125, 0.01519012451171875, 0.017608642578125, 0.02002716064453125, 0.0224456787109375, 0.02486419677734375, 0.02728271484375, 0.02970123291015625, 0.0321197509765625, 0.03453826904296875, 0.036956787109375, 0.03937530517578125, 0.0417938232421875, 0.04421234130859375, 0.046630859375, 0.04904937744140625, 0.0514678955078125, 0.05388641357421875, 0.056304931640625, 0.05872344970703125, 0.0611419677734375, 0.06356048583984375, 0.06597900390625, 0.06839752197265625, 0.0708160400390625, 0.07323455810546875, 0.075653076171875, 0.07807159423828125, 0.0804901123046875, 0.08290863037109375, 0.0853271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 11.0, 14.0, 27.0, 33.0, 32.0, 42.0, 67.0, 58.0, 68.0, 85.0, 82.0, 90.0, 70.0, 60.0, 49.0, 51.0, 39.0, 32.0, 19.0, 24.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426513671875, -0.41339874267578125, -0.4002838134765625, -0.38716888427734375, -0.374053955078125, -0.36093902587890625, -0.3478240966796875, -0.33470916748046875, -0.32159423828125, -0.30847930908203125, -0.2953643798828125, -0.28224945068359375, -0.269134521484375, -0.25601959228515625, -0.2429046630859375, -0.22978973388671875, -0.2166748046875, -0.20355987548828125, -0.1904449462890625, -0.17733001708984375, -0.164215087890625, -0.15110015869140625, -0.1379852294921875, -0.12487030029296875, -0.11175537109375, -0.09864044189453125, -0.0855255126953125, -0.07241058349609375, -0.059295654296875, -0.04618072509765625, -0.0330657958984375, -0.01995086669921875, -0.0068359375, 0.00627899169921875, 0.0193939208984375, 0.03250885009765625, 0.045623779296875, 0.05873870849609375, 0.0718536376953125, 0.08496856689453125, 0.09808349609375, 0.11119842529296875, 0.1243133544921875, 0.13742828369140625, 0.150543212890625, 0.16365814208984375, 0.1767730712890625, 0.18988800048828125, 0.2030029296875, 0.21611785888671875, 0.2292327880859375, 0.24234771728515625, 0.255462646484375, 0.26857757568359375, 0.2816925048828125, 0.29480743408203125, 0.30792236328125, 0.32103729248046875, 0.3341522216796875, 0.34726715087890625, 0.360382080078125, 0.37349700927734375, 0.3866119384765625, 0.39972686767578125, 0.412841796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 29.0, 29.0, 41.0, 78.0, 107.0, 151.0, 247.0, 452.0, 826.0, 1691.0, 3410.0, 7459.0, 17551.0, 45987.0, 126785.0, 293994.0, 315727.0, 145012.0, 52643.0, 20143.0, 8303.0, 3757.0, 1831.0, 924.0, 510.0, 295.0, 163.0, 124.0, 70.0, 45.0, 35.0, 28.0, 14.0, 17.0, 13.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040252685546875, -0.03858041763305664, -0.03690814971923828, -0.03523588180541992, -0.03356361389160156, -0.0318913459777832, -0.030219078063964844, -0.028546810150146484, -0.026874542236328125, -0.025202274322509766, -0.023530006408691406, -0.021857738494873047, -0.020185470581054688, -0.018513202667236328, -0.01684093475341797, -0.01516866683959961, -0.01349639892578125, -0.01182413101196289, -0.010151863098144531, -0.008479595184326172, -0.0068073272705078125, -0.005135059356689453, -0.0034627914428710938, -0.0017905235290527344, -0.000118255615234375, 0.0015540122985839844, 0.0032262802124023438, 0.004898548126220703, 0.0065708160400390625, 0.008243083953857422, 0.009915351867675781, 0.01158761978149414, 0.0132598876953125, 0.01493215560913086, 0.01660442352294922, 0.018276691436767578, 0.019948959350585938, 0.021621227264404297, 0.023293495178222656, 0.024965763092041016, 0.026638031005859375, 0.028310298919677734, 0.029982566833496094, 0.03165483474731445, 0.03332710266113281, 0.03499937057495117, 0.03667163848876953, 0.03834390640258789, 0.04001617431640625, 0.04168844223022461, 0.04336071014404297, 0.04503297805786133, 0.04670524597167969, 0.04837751388549805, 0.050049781799316406, 0.051722049713134766, 0.053394317626953125, 0.055066585540771484, 0.056738853454589844, 0.0584111213684082, 0.06008338928222656, 0.06175565719604492, 0.06342792510986328, 0.06510019302368164, 0.0667724609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 11.0, 20.0, 18.0, 21.0, 9.0, 23.0, 20.0, 28.0, 23.0, 27.0, 22.0, 28.0, 28.0, 38.0, 36.0, 43.0, 42.0, 37.0, 36.0, 48.0, 39.0, 42.0, 30.0, 28.0, 42.0, 34.0, 23.0, 25.0, 30.0, 21.0, 14.0, 14.0, 19.0, 13.0, 6.0, 7.0, 5.0, 8.0, 4.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.453369140625, -0.4403266906738281, -0.42728424072265625, -0.4142417907714844, -0.4011993408203125, -0.3881568908691406, -0.37511444091796875, -0.3620719909667969, -0.349029541015625, -0.3359870910644531, -0.32294464111328125, -0.3099021911621094, -0.2968597412109375, -0.2838172912597656, -0.27077484130859375, -0.2577323913574219, -0.24468994140625, -0.23164749145507812, -0.21860504150390625, -0.20556259155273438, -0.1925201416015625, -0.17947769165039062, -0.16643524169921875, -0.15339279174804688, -0.140350341796875, -0.12730789184570312, -0.11426544189453125, -0.10122299194335938, -0.0881805419921875, -0.07513809204101562, -0.06209564208984375, -0.049053192138671875, -0.0360107421875, -0.022968292236328125, -0.00992584228515625, 0.003116607666015625, 0.0161590576171875, 0.029201507568359375, 0.04224395751953125, 0.055286407470703125, 0.068328857421875, 0.08137130737304688, 0.09441375732421875, 0.10745620727539062, 0.1204986572265625, 0.13354110717773438, 0.14658355712890625, 0.15962600708007812, 0.17266845703125, 0.18571090698242188, 0.19875335693359375, 0.21179580688476562, 0.2248382568359375, 0.23788070678710938, 0.25092315673828125, 0.2639656066894531, 0.277008056640625, 0.2900505065917969, 0.30309295654296875, 0.3161354064941406, 0.3291778564453125, 0.3422203063964844, 0.35526275634765625, 0.3683052062988281, 0.38134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 22.0, 15.0, 18.0, 33.0, 47.0, 111.0, 173.0, 287.0, 483.0, 858.0, 1803.0, 3996.0, 10684.0, 35453.0, 156670.0, 484103.0, 268392.0, 58833.0, 15783.0, 5573.0, 2418.0, 1203.0, 633.0, 343.0, 203.0, 131.0, 89.0, 46.0, 45.0, 27.0, 23.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02655029296875, -0.025826454162597656, -0.025102615356445312, -0.02437877655029297, -0.023654937744140625, -0.02293109893798828, -0.022207260131835938, -0.021483421325683594, -0.02075958251953125, -0.020035743713378906, -0.019311904907226562, -0.01858806610107422, -0.017864227294921875, -0.01714038848876953, -0.016416549682617188, -0.015692710876464844, -0.0149688720703125, -0.014245033264160156, -0.013521194458007812, -0.012797355651855469, -0.012073516845703125, -0.011349678039550781, -0.010625839233398438, -0.009902000427246094, -0.00917816162109375, -0.008454322814941406, -0.0077304840087890625, -0.007006645202636719, -0.006282806396484375, -0.005558967590332031, -0.0048351287841796875, -0.004111289978027344, -0.003387451171875, -0.0026636123657226562, -0.0019397735595703125, -0.0012159347534179688, -0.000492095947265625, 0.00023174285888671875, 0.0009555816650390625, 0.0016794204711914062, 0.00240325927734375, 0.0031270980834960938, 0.0038509368896484375, 0.004574775695800781, 0.005298614501953125, 0.006022453308105469, 0.0067462921142578125, 0.007470130920410156, 0.0081939697265625, 0.008917808532714844, 0.009641647338867188, 0.010365486145019531, 0.011089324951171875, 0.011813163757324219, 0.012537002563476562, 0.013260841369628906, 0.01398468017578125, 0.014708518981933594, 0.015432357788085938, 0.01615619659423828, 0.016880035400390625, 0.01760387420654297, 0.018327713012695312, 0.019051551818847656, 0.019775390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 19.0, 15.0, 28.0, 37.0, 48.0, 51.0, 86.0, 80.0, 104.0, 107.0, 81.0, 88.0, 62.0, 41.0, 45.0, 23.0, 22.0, 16.0, 3.0, 15.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4066696166992188e-05, -1.3568438589572906e-05, -1.3070181012153625e-05, -1.2571923434734344e-05, -1.2073665857315063e-05, -1.1575408279895782e-05, -1.1077150702476501e-05, -1.057889312505722e-05, -1.008063554763794e-05, -9.582377970218658e-06, -9.084120392799377e-06, -8.585862815380096e-06, -8.087605237960815e-06, -7.5893476605415344e-06, -7.091090083122253e-06, -6.592832505702972e-06, -6.094574928283691e-06, -5.59631735086441e-06, -5.098059773445129e-06, -4.599802196025848e-06, -4.101544618606567e-06, -3.6032870411872864e-06, -3.1050294637680054e-06, -2.6067718863487244e-06, -2.1085143089294434e-06, -1.6102567315101624e-06, -1.1119991540908813e-06, -6.137415766716003e-07, -1.1548399925231934e-07, 3.8277357816696167e-07, 8.810311555862427e-07, 1.3792887330055237e-06, 1.8775463104248047e-06, 2.3758038878440857e-06, 2.8740614652633667e-06, 3.3723190426826477e-06, 3.870576620101929e-06, 4.36883419752121e-06, 4.867091774940491e-06, 5.365349352359772e-06, 5.863606929779053e-06, 6.361864507198334e-06, 6.860122084617615e-06, 7.358379662036896e-06, 7.856637239456177e-06, 8.354894816875458e-06, 8.853152394294739e-06, 9.35140997171402e-06, 9.8496675491333e-06, 1.0347925126552582e-05, 1.0846182703971863e-05, 1.1344440281391144e-05, 1.1842697858810425e-05, 1.2340955436229706e-05, 1.2839213013648987e-05, 1.3337470591068268e-05, 1.3835728168487549e-05, 1.433398574590683e-05, 1.483224332332611e-05, 1.5330500900745392e-05, 1.5828758478164673e-05, 1.6327016055583954e-05, 1.6825273633003235e-05, 1.7323531210422516e-05, 1.7821788787841797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 20.0, 29.0, 45.0, 67.0, 132.0, 185.0, 345.0, 722.0, 1556.0, 4466.0, 15375.0, 69882.0, 326642.0, 463226.0, 128542.0, 26243.0, 6783.0, 2200.0, 896.0, 465.0, 237.0, 163.0, 86.0, 55.0, 42.0, 27.0, 17.0, 17.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02264404296875, -0.021868228912353516, -0.02109241485595703, -0.020316600799560547, -0.019540786743164062, -0.018764972686767578, -0.017989158630371094, -0.01721334457397461, -0.016437530517578125, -0.01566171646118164, -0.014885902404785156, -0.014110088348388672, -0.013334274291992188, -0.012558460235595703, -0.011782646179199219, -0.011006832122802734, -0.01023101806640625, -0.009455204010009766, -0.008679389953613281, -0.007903575897216797, -0.0071277618408203125, -0.006351947784423828, -0.005576133728027344, -0.004800319671630859, -0.004024505615234375, -0.0032486915588378906, -0.0024728775024414062, -0.0016970634460449219, -0.0009212493896484375, -0.00014543533325195312, 0.0006303787231445312, 0.0014061927795410156, 0.0021820068359375, 0.0029578208923339844, 0.0037336349487304688, 0.004509449005126953, 0.0052852630615234375, 0.006061077117919922, 0.006836891174316406, 0.007612705230712891, 0.008388519287109375, 0.00916433334350586, 0.009940147399902344, 0.010715961456298828, 0.011491775512695312, 0.012267589569091797, 0.013043403625488281, 0.013819217681884766, 0.01459503173828125, 0.015370845794677734, 0.01614665985107422, 0.016922473907470703, 0.017698287963867188, 0.018474102020263672, 0.019249916076660156, 0.02002573013305664, 0.020801544189453125, 0.02157735824584961, 0.022353172302246094, 0.023128986358642578, 0.023904800415039062, 0.024680614471435547, 0.02545642852783203, 0.026232242584228516, 0.027008056640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 6.0, 10.0, 17.0, 21.0, 22.0, 39.0, 55.0, 56.0, 70.0, 73.0, 94.0, 92.0, 79.0, 91.0, 76.0, 42.0, 54.0, 26.0, 19.0, 12.0, 15.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0092620849609375, -0.00902026891708374, -0.00877845287322998, -0.00853663682937622, -0.008294820785522461, -0.008053004741668701, -0.007811188697814941, -0.007569372653961182, -0.007327556610107422, -0.007085740566253662, -0.006843924522399902, -0.006602108478546143, -0.006360292434692383, -0.006118476390838623, -0.005876660346984863, -0.0056348443031311035, -0.005393028259277344, -0.005151212215423584, -0.004909396171569824, -0.0046675801277160645, -0.004425764083862305, -0.004183948040008545, -0.003942131996154785, -0.0037003159523010254, -0.0034584999084472656, -0.003216683864593506, -0.002974867820739746, -0.0027330517768859863, -0.0024912357330322266, -0.002249419689178467, -0.002007603645324707, -0.0017657876014709473, -0.0015239715576171875, -0.0012821555137634277, -0.001040339469909668, -0.0007985234260559082, -0.0005567073822021484, -0.00031489133834838867, -7.30752944946289e-05, 0.00016874074935913086, 0.0004105567932128906, 0.0006523728370666504, 0.0008941888809204102, 0.00113600492477417, 0.0013778209686279297, 0.0016196370124816895, 0.0018614530563354492, 0.002103269100189209, 0.0023450851440429688, 0.0025869011878967285, 0.0028287172317504883, 0.003070533275604248, 0.003312349319458008, 0.0035541653633117676, 0.0037959814071655273, 0.004037797451019287, 0.004279613494873047, 0.004521429538726807, 0.004763245582580566, 0.005005061626434326, 0.005246877670288086, 0.005488693714141846, 0.0057305097579956055, 0.005972325801849365, 0.006214141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 29.0, 40.0, 115.0, 229.0, 241.0, 200.0, 81.0, 33.0, 20.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7753782272338867, -0.7435557842254639, -0.7117332816123962, -0.6799108386039734, -0.6480883359909058, -0.6162658929824829, -0.5844434499740601, -0.5526210069656372, -0.5207985043525696, -0.48897603154182434, -0.4571535587310791, -0.42533111572265625, -0.393508642911911, -0.36168617010116577, -0.3298637270927429, -0.2980412542819977, -0.26621878147125244, -0.2343963086605072, -0.20257385075092316, -0.1707513928413391, -0.13892892003059387, -0.10710644721984863, -0.07528398931026459, -0.04346153140068054, -0.011639058589935303, 0.02018340677022934, 0.05200587213039398, 0.08382833749055862, 0.11565080285072327, 0.1474732756614685, 0.17929573357105255, 0.2111181914806366, 0.24294066429138184, 0.2747631371021271, 0.3065856099128723, 0.33840805292129517, 0.3702305257320404, 0.40205299854278564, 0.4338754415512085, 0.46569791436195374, 0.497520387172699, 0.5293428301811218, 0.5611653327941895, 0.5929877758026123, 0.6248102188110352, 0.6566327214241028, 0.6884551644325256, 0.7202776670455933, 0.7521001100540161, 0.783922553062439, 0.8157450556755066, 0.8475674986839294, 0.8793900012969971, 0.9112124443054199, 0.9430348873138428, 0.9748573303222656, 1.0066797733306885, 1.0385022163391113, 1.0703246593475342, 1.1021472215652466, 1.1339696645736694, 1.1657921075820923, 1.1976145505905151, 1.229436993598938, 1.2612595558166504]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 5.0, 5.0, 9.0, 8.0, 22.0, 15.0, 17.0, 21.0, 21.0, 25.0, 45.0, 24.0, 34.0, 33.0, 44.0, 40.0, 48.0, 44.0, 44.0, 46.0, 45.0, 45.0, 45.0, 51.0, 34.0, 25.0, 29.0, 22.0, 24.0, 24.0, 21.0, 13.0, 13.0, 6.0, 9.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.2497846633195877, -0.2425040602684021, -0.2352234423160553, -0.2279428392648697, -0.2206622213125229, -0.21338161826133728, -0.20610100030899048, -0.19882039725780487, -0.19153979420661926, -0.18425919115543365, -0.17697857320308685, -0.16969797015190125, -0.16241735219955444, -0.15513674914836884, -0.14785614609718323, -0.14057552814483643, -0.13329491019248962, -0.12601430714130402, -0.11873368918895721, -0.1114530861377716, -0.1041724681854248, -0.0968918651342392, -0.08961125463247299, -0.08233064413070679, -0.07505003362894058, -0.06776942312717438, -0.06048881262540817, -0.053208205848932266, -0.04592759534716606, -0.03864698484539986, -0.03136637806892395, -0.024085767567157745, -0.016805142164230347, -0.009524532593786716, -0.0022439230233430862, 0.005036685615777969, 0.012317296117544174, 0.01959790661931038, 0.026878513395786285, 0.03415912389755249, 0.041439734399318695, 0.0487203449010849, 0.056000955402851105, 0.06328156590461731, 0.07056216895580292, 0.07784278690814972, 0.08512338995933533, 0.09240400046110153, 0.09968461096286774, 0.10696522146463394, 0.11424583196640015, 0.12152643501758575, 0.12880705296993256, 0.13608765602111816, 0.14336827397346497, 0.15064887702465057, 0.15792948007583618, 0.1652100831270218, 0.1724907010793686, 0.1797713041305542, 0.187051922082901, 0.1943325251340866, 0.20161312818527222, 0.20889374613761902, 0.21617436408996582]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 13.0, 16.0, 16.0, 28.0, 39.0, 75.0, 92.0, 134.0, 242.0, 362.0, 577.0, 1018.0, 1968.0, 3805.0, 9002.0, 30185.0, 224484.0, 679510.0, 70076.0, 15213.0, 5574.0, 2665.0, 1366.0, 830.0, 449.0, 283.0, 163.0, 101.0, 72.0, 61.0, 29.0, 32.0, 22.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.363525390625, -0.35065460205078125, -0.3377838134765625, -0.32491302490234375, -0.312042236328125, -0.29917144775390625, -0.2863006591796875, -0.27342987060546875, -0.26055908203125, -0.24768829345703125, -0.2348175048828125, -0.22194671630859375, -0.209075927734375, -0.19620513916015625, -0.1833343505859375, -0.17046356201171875, -0.1575927734375, -0.14472198486328125, -0.1318511962890625, -0.11898040771484375, -0.106109619140625, -0.09323883056640625, -0.0803680419921875, -0.06749725341796875, -0.05462646484375, -0.04175567626953125, -0.0288848876953125, -0.01601409912109375, -0.003143310546875, 0.00972747802734375, 0.0225982666015625, 0.03546905517578125, 0.04833984375, 0.06121063232421875, 0.0740814208984375, 0.08695220947265625, 0.099822998046875, 0.11269378662109375, 0.1255645751953125, 0.13843536376953125, 0.15130615234375, 0.16417694091796875, 0.1770477294921875, 0.18991851806640625, 0.202789306640625, 0.21566009521484375, 0.2285308837890625, 0.24140167236328125, 0.2542724609375, 0.26714324951171875, 0.2800140380859375, 0.29288482666015625, 0.305755615234375, 0.31862640380859375, 0.3314971923828125, 0.34436798095703125, 0.35723876953125, 0.37010955810546875, 0.3829803466796875, 0.39585113525390625, 0.408721923828125, 0.42159271240234375, 0.4344635009765625, 0.44733428955078125, 0.460205078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 10.0, 12.0, 10.0, 19.0, 15.0, 17.0, 21.0, 34.0, 27.0, 36.0, 40.0, 51.0, 39.0, 42.0, 37.0, 43.0, 48.0, 57.0, 41.0, 40.0, 51.0, 39.0, 48.0, 27.0, 13.0, 31.0, 25.0, 22.0, 19.0, 12.0, 14.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.40883636474609375, -0.3943328857421875, -0.37982940673828125, -0.365325927734375, -0.35082244873046875, -0.3363189697265625, -0.32181549072265625, -0.30731201171875, -0.29280853271484375, -0.2783050537109375, -0.26380157470703125, -0.249298095703125, -0.23479461669921875, -0.2202911376953125, -0.20578765869140625, -0.1912841796875, -0.17678070068359375, -0.1622772216796875, -0.14777374267578125, -0.133270263671875, -0.11876678466796875, -0.1042633056640625, -0.08975982666015625, -0.07525634765625, -0.06075286865234375, -0.0462493896484375, -0.03174591064453125, -0.017242431640625, -0.00273895263671875, 0.0117645263671875, 0.02626800537109375, 0.040771484375, 0.05527496337890625, 0.0697784423828125, 0.08428192138671875, 0.098785400390625, 0.11328887939453125, 0.1277923583984375, 0.14229583740234375, 0.15679931640625, 0.17130279541015625, 0.1858062744140625, 0.20030975341796875, 0.214813232421875, 0.22931671142578125, 0.2438201904296875, 0.25832366943359375, 0.2728271484375, 0.28733062744140625, 0.3018341064453125, 0.31633758544921875, 0.330841064453125, 0.34534454345703125, 0.3598480224609375, 0.37435150146484375, 0.38885498046875, 0.40335845947265625, 0.4178619384765625, 0.43236541748046875, 0.446868896484375, 0.46137237548828125, 0.4758758544921875, 0.49037933349609375, 0.5048828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 10.0, 20.0, 30.0, 36.0, 78.0, 115.0, 277.0, 739.0, 2146.0, 9324.0, 193624.0, 818968.0, 18261.0, 3216.0, 963.0, 368.0, 144.0, 84.0, 51.0, 24.0, 16.0, 9.0, 5.0, 4.0, 7.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.635162353515625, -0.61260986328125, -0.590057373046875, -0.5675048828125, -0.544952392578125, -0.52239990234375, -0.499847412109375, -0.477294921875, -0.454742431640625, -0.43218994140625, -0.409637451171875, -0.3870849609375, -0.364532470703125, -0.34197998046875, -0.319427490234375, -0.296875, -0.274322509765625, -0.25177001953125, -0.229217529296875, -0.2066650390625, -0.184112548828125, -0.16156005859375, -0.139007568359375, -0.116455078125, -0.093902587890625, -0.07135009765625, -0.048797607421875, -0.0262451171875, -0.003692626953125, 0.01885986328125, 0.041412353515625, 0.06396484375, 0.086517333984375, 0.10906982421875, 0.131622314453125, 0.1541748046875, 0.176727294921875, 0.19927978515625, 0.221832275390625, 0.244384765625, 0.266937255859375, 0.28948974609375, 0.312042236328125, 0.3345947265625, 0.357147216796875, 0.37969970703125, 0.402252197265625, 0.4248046875, 0.447357177734375, 0.46990966796875, 0.492462158203125, 0.5150146484375, 0.537567138671875, 0.56011962890625, 0.582672119140625, 0.605224609375, 0.627777099609375, 0.65032958984375, 0.672882080078125, 0.6954345703125, 0.717987060546875, 0.74053955078125, 0.763092041015625, 0.78564453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 9.0, 9.0, 12.0, 9.0, 13.0, 25.0, 31.0, 21.0, 23.0, 28.0, 41.0, 40.0, 36.0, 41.0, 49.0, 51.0, 43.0, 51.0, 54.0, 50.0, 44.0, 43.0, 32.0, 30.0, 35.0, 37.0, 19.0, 20.0, 11.0, 15.0, 14.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5160980224609375, -0.498016357421875, -0.4799346923828125, -0.46185302734375, -0.4437713623046875, -0.425689697265625, -0.4076080322265625, -0.3895263671875, -0.3714447021484375, -0.353363037109375, -0.3352813720703125, -0.31719970703125, -0.2991180419921875, -0.281036376953125, -0.2629547119140625, -0.244873046875, -0.2267913818359375, -0.208709716796875, -0.1906280517578125, -0.17254638671875, -0.1544647216796875, -0.136383056640625, -0.1183013916015625, -0.1002197265625, -0.0821380615234375, -0.064056396484375, -0.0459747314453125, -0.02789306640625, -0.0098114013671875, 0.008270263671875, 0.0263519287109375, 0.04443359375, 0.0625152587890625, 0.080596923828125, 0.0986785888671875, 0.11676025390625, 0.1348419189453125, 0.152923583984375, 0.1710052490234375, 0.1890869140625, 0.2071685791015625, 0.225250244140625, 0.2433319091796875, 0.26141357421875, 0.2794952392578125, 0.297576904296875, 0.3156585693359375, 0.333740234375, 0.3518218994140625, 0.369903564453125, 0.3879852294921875, 0.40606689453125, 0.4241485595703125, 0.442230224609375, 0.4603118896484375, 0.4783935546875, 0.4964752197265625, 0.514556884765625, 0.5326385498046875, 0.55072021484375, 0.5688018798828125, 0.586883544921875, 0.6049652099609375, 0.623046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 11.0, 15.0, 39.0, 62.0, 178.0, 572.0, 2915.0, 51029.0, 971190.0, 20024.0, 1833.0, 388.0, 149.0, 58.0, 31.0, 15.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352294921875, -0.3384132385253906, -0.32453155517578125, -0.3106498718261719, -0.2967681884765625, -0.2828865051269531, -0.26900482177734375, -0.2551231384277344, -0.241241455078125, -0.22735977172851562, -0.21347808837890625, -0.19959640502929688, -0.1857147216796875, -0.17183303833007812, -0.15795135498046875, -0.14406967163085938, -0.13018798828125, -0.11630630493164062, -0.10242462158203125, -0.08854293823242188, -0.0746612548828125, -0.060779571533203125, -0.04689788818359375, -0.033016204833984375, -0.019134521484375, -0.005252838134765625, 0.00862884521484375, 0.022510528564453125, 0.0363922119140625, 0.050273895263671875, 0.06415557861328125, 0.07803726196289062, 0.0919189453125, 0.10580062866210938, 0.11968231201171875, 0.13356399536132812, 0.1474456787109375, 0.16132736206054688, 0.17520904541015625, 0.18909072875976562, 0.202972412109375, 0.21685409545898438, 0.23073577880859375, 0.24461746215820312, 0.2584991455078125, 0.2723808288574219, 0.28626251220703125, 0.3001441955566406, 0.31402587890625, 0.3279075622558594, 0.34178924560546875, 0.3556709289550781, 0.3695526123046875, 0.3834342956542969, 0.39731597900390625, 0.4111976623535156, 0.425079345703125, 0.4389610290527344, 0.45284271240234375, 0.4667243957519531, 0.4806060791015625, 0.4944877624511719, 0.5083694458007812, 0.5222511291503906, 0.5361328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 15.0, 9.0, 23.0, 20.0, 47.0, 57.0, 87.0, 154.0, 180.0, 142.0, 82.0, 59.0, 49.0, 17.0, 13.0, 12.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.810971975326538e-05, -3.711879253387451e-05, -3.612786531448364e-05, -3.5136938095092773e-05, -3.4146010875701904e-05, -3.3155083656311035e-05, -3.2164156436920166e-05, -3.11732292175293e-05, -3.0182301998138428e-05, -2.919137477874756e-05, -2.820044755935669e-05, -2.720952033996582e-05, -2.621859312057495e-05, -2.5227665901184082e-05, -2.4236738681793213e-05, -2.3245811462402344e-05, -2.2254884243011475e-05, -2.1263957023620605e-05, -2.0273029804229736e-05, -1.9282102584838867e-05, -1.8291175365447998e-05, -1.730024814605713e-05, -1.630932092666626e-05, -1.531839370727539e-05, -1.4327466487884521e-05, -1.3336539268493652e-05, -1.2345612049102783e-05, -1.1354684829711914e-05, -1.0363757610321045e-05, -9.372830390930176e-06, -8.381903171539307e-06, -7.3909759521484375e-06, -6.400048732757568e-06, -5.409121513366699e-06, -4.41819429397583e-06, -3.427267074584961e-06, -2.436339855194092e-06, -1.4454126358032227e-06, -4.544854164123535e-07, 5.364418029785156e-07, 1.5273690223693848e-06, 2.518296241760254e-06, 3.509223461151123e-06, 4.500150680541992e-06, 5.491077899932861e-06, 6.4820051193237305e-06, 7.4729323387146e-06, 8.463859558105469e-06, 9.454786777496338e-06, 1.0445713996887207e-05, 1.1436641216278076e-05, 1.2427568435668945e-05, 1.3418495655059814e-05, 1.4409422874450684e-05, 1.5400350093841553e-05, 1.6391277313232422e-05, 1.738220453262329e-05, 1.837313175201416e-05, 1.936405897140503e-05, 2.03549861907959e-05, 2.1345913410186768e-05, 2.2336840629577637e-05, 2.3327767848968506e-05, 2.4318695068359375e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 15.0, 14.0, 26.0, 43.0, 96.0, 205.0, 469.0, 1301.0, 4921.0, 61194.0, 943611.0, 31176.0, 3633.0, 1057.0, 402.0, 154.0, 81.0, 47.0, 25.0, 16.0, 10.0, 13.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.52001953125, -0.5071487426757812, -0.4942779541015625, -0.48140716552734375, -0.468536376953125, -0.45566558837890625, -0.4427947998046875, -0.42992401123046875, -0.41705322265625, -0.40418243408203125, -0.3913116455078125, -0.37844085693359375, -0.365570068359375, -0.35269927978515625, -0.3398284912109375, -0.32695770263671875, -0.3140869140625, -0.30121612548828125, -0.2883453369140625, -0.27547454833984375, -0.262603759765625, -0.24973297119140625, -0.2368621826171875, -0.22399139404296875, -0.21112060546875, -0.19824981689453125, -0.1853790283203125, -0.17250823974609375, -0.159637451171875, -0.14676666259765625, -0.1338958740234375, -0.12102508544921875, -0.108154296875, -0.09528350830078125, -0.0824127197265625, -0.06954193115234375, -0.056671142578125, -0.04380035400390625, -0.0309295654296875, -0.01805877685546875, -0.00518798828125, 0.00768280029296875, 0.0205535888671875, 0.03342437744140625, 0.046295166015625, 0.05916595458984375, 0.0720367431640625, 0.08490753173828125, 0.0977783203125, 0.11064910888671875, 0.1235198974609375, 0.13639068603515625, 0.149261474609375, 0.16213226318359375, 0.1750030517578125, 0.18787384033203125, 0.20074462890625, 0.21361541748046875, 0.2264862060546875, 0.23935699462890625, 0.252227783203125, 0.26509857177734375, 0.2779693603515625, 0.29084014892578125, 0.3037109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 16.0, 13.0, 27.0, 19.0, 38.0, 62.0, 100.0, 232.0, 201.0, 93.0, 49.0, 37.0, 27.0, 24.0, 12.0, 9.0, 5.0, 3.0, 8.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07695960998535156, -0.07359695434570312, -0.07023429870605469, -0.06687164306640625, -0.06350898742675781, -0.060146331787109375, -0.05678367614746094, -0.0534210205078125, -0.05005836486816406, -0.046695709228515625, -0.04333305358886719, -0.03997039794921875, -0.03660774230957031, -0.033245086669921875, -0.029882431030273438, -0.026519775390625, -0.023157119750976562, -0.019794464111328125, -0.016431808471679688, -0.01306915283203125, -0.009706497192382812, -0.006343841552734375, -0.0029811859130859375, 0.0003814697265625, 0.0037441253662109375, 0.007106781005859375, 0.010469436645507812, 0.01383209228515625, 0.017194747924804688, 0.020557403564453125, 0.023920059204101562, 0.02728271484375, 0.030645370483398438, 0.034008026123046875, 0.03737068176269531, 0.04073333740234375, 0.04409599304199219, 0.047458648681640625, 0.05082130432128906, 0.0541839599609375, 0.05754661560058594, 0.060909271240234375, 0.06427192687988281, 0.06763458251953125, 0.07099723815917969, 0.07435989379882812, 0.07772254943847656, 0.081085205078125, 0.08444786071777344, 0.08781051635742188, 0.09117317199707031, 0.09453582763671875, 0.09789848327636719, 0.10126113891601562, 0.10462379455566406, 0.1079864501953125, 0.11134910583496094, 0.11471176147460938, 0.11807441711425781, 0.12143707275390625, 0.12479972839355469, 0.12816238403320312, 0.13152503967285156, 0.1348876953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 11.0, 29.0, 51.0, 165.0, 292.0, 253.0, 121.0, 38.0, 25.0, 13.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.731217861175537, -1.661611795425415, -1.592005729675293, -1.522399663925171, -1.4527935981750488, -1.3831875324249268, -1.3135814666748047, -1.2439754009246826, -1.1743693351745605, -1.1047632694244385, -1.0351572036743164, -0.9655511379241943, -0.8959450721740723, -0.8263390064239502, -0.7567330002784729, -0.6871269345283508, -0.6175209283828735, -0.5479148626327515, -0.4783087968826294, -0.4087027609348297, -0.33909669518470764, -0.26949062943458557, -0.1998845934867859, -0.13027852773666382, -0.06067246198654175, 0.008933596312999725, 0.0785396546125412, 0.14814570546150208, 0.21775177121162415, 0.2873578369617462, 0.3569638729095459, 0.42656993865966797, 0.49617600440979004, 0.5657820701599121, 0.6353881359100342, 0.7049942016601562, 0.7746002674102783, 0.8442063331604004, 0.9138123393058777, 0.9834184050559998, 1.0530245304107666, 1.1226305961608887, 1.1922366619110107, 1.2618427276611328, 1.3314487934112549, 1.401054859161377, 1.470660924911499, 1.540266990661621, 1.6098729372024536, 1.6794790029525757, 1.7490850687026978, 1.8186911344528198, 1.888297200202942, 1.957903265953064, 2.0275092124938965, 2.0971152782440186, 2.1667213439941406, 2.2363274097442627, 2.3059334754943848, 2.375539541244507, 2.445145606994629, 2.514751672744751, 2.584357738494873, 2.653963804244995, 2.723569869995117]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 14.0, 16.0, 12.0, 18.0, 20.0, 17.0, 20.0, 34.0, 30.0, 32.0, 21.0, 50.0, 26.0, 22.0, 45.0, 44.0, 37.0, 40.0, 36.0, 38.0, 42.0, 37.0, 26.0, 35.0, 29.0, 30.0, 28.0, 15.0, 23.0, 22.0, 16.0, 13.0, 13.0, 12.0, 11.0, 7.0, 5.0, 4.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8226771354675293, -0.7981719374656677, -0.7736666798591614, -0.7491614818572998, -0.7246562242507935, -0.7001510262489319, -0.6756458282470703, -0.651140570640564, -0.6266353726387024, -0.6021301746368408, -0.5776249170303345, -0.5531197190284729, -0.5286145210266113, -0.504109263420105, -0.4796040654182434, -0.45509883761405945, -0.4305936098098755, -0.40608838200569153, -0.38158315420150757, -0.357077956199646, -0.33257272839546204, -0.3080675005912781, -0.2835623025894165, -0.25905707478523254, -0.23455184698104858, -0.21004661917686462, -0.18554140627384186, -0.1610361933708191, -0.13653096556663513, -0.11202574521303177, -0.0875205248594284, -0.06301531195640564, -0.038510143756866455, -0.014004923403263092, 0.010500296950340271, 0.035005517303943634, 0.059510737657547, 0.08401595801115036, 0.10852117836475372, 0.1330263912677765, 0.15753161907196045, 0.1820368468761444, 0.20654205977916718, 0.23104727268218994, 0.2555525004863739, 0.28005772829055786, 0.30456292629241943, 0.3290681540966034, 0.35357338190078735, 0.3780786097049713, 0.4025838375091553, 0.42708903551101685, 0.4515942633152008, 0.47609949111938477, 0.5006046891212463, 0.5251098871231079, 0.5496151447296143, 0.5741203427314758, 0.5986256003379822, 0.6231307983398438, 0.6476360559463501, 0.6721412539482117, 0.6966464519500732, 0.7211517095565796, 0.7456569075584412]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 18.0, 20.0, 53.0, 74.0, 177.0, 309.0, 835.0, 2211.0, 8258.0, 65724.0, 3036684.0, 1043191.0, 29026.0, 5113.0, 1485.0, 569.0, 227.0, 117.0, 59.0, 37.0, 17.0, 10.0, 13.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8955078125, -0.8664779663085938, -0.8374481201171875, -0.8084182739257812, -0.779388427734375, -0.7503585815429688, -0.7213287353515625, -0.6922988891601562, -0.66326904296875, -0.6342391967773438, -0.6052093505859375, -0.5761795043945312, -0.547149658203125, -0.5181198120117188, -0.4890899658203125, -0.46006011962890625, -0.4310302734375, -0.40200042724609375, -0.3729705810546875, -0.34394073486328125, -0.314910888671875, -0.28588104248046875, -0.2568511962890625, -0.22782135009765625, -0.19879150390625, -0.16976165771484375, -0.1407318115234375, -0.11170196533203125, -0.082672119140625, -0.05364227294921875, -0.0246124267578125, 0.00441741943359375, 0.033447265625, 0.06247711181640625, 0.0915069580078125, 0.12053680419921875, 0.149566650390625, 0.17859649658203125, 0.2076263427734375, 0.23665618896484375, 0.26568603515625, 0.29471588134765625, 0.3237457275390625, 0.35277557373046875, 0.381805419921875, 0.41083526611328125, 0.4398651123046875, 0.46889495849609375, 0.4979248046875, 0.5269546508789062, 0.5559844970703125, 0.5850143432617188, 0.614044189453125, 0.6430740356445312, 0.6721038818359375, 0.7011337280273438, 0.73016357421875, 0.7591934204101562, 0.7882232666015625, 0.8172531127929688, 0.846282958984375, 0.8753128051757812, 0.9043426513671875, 0.9333724975585938, 0.96240234375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 13.0, 20.0, 25.0, 23.0, 29.0, 30.0, 35.0, 30.0, 38.0, 41.0, 59.0, 53.0, 46.0, 45.0, 53.0, 43.0, 54.0, 41.0, 38.0, 41.0, 36.0, 29.0, 26.0, 25.0, 12.0, 15.0, 12.0, 7.0, 6.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.2570304870605469, -0.24819183349609375, -0.23935317993164062, -0.2305145263671875, -0.22167587280273438, -0.21283721923828125, -0.20399856567382812, -0.195159912109375, -0.18632125854492188, -0.17748260498046875, -0.16864395141601562, -0.1598052978515625, -0.15096664428710938, -0.14212799072265625, -0.13328933715820312, -0.12445068359375, -0.11561203002929688, -0.10677337646484375, -0.09793472290039062, -0.0890960693359375, -0.08025741577148438, -0.07141876220703125, -0.06258010864257812, -0.053741455078125, -0.044902801513671875, -0.03606414794921875, -0.027225494384765625, -0.0183868408203125, -0.009548187255859375, -0.00070953369140625, 0.008129119873046875, 0.0169677734375, 0.025806427001953125, 0.03464508056640625, 0.043483734130859375, 0.0523223876953125, 0.061161041259765625, 0.06999969482421875, 0.07883834838867188, 0.087677001953125, 0.09651565551757812, 0.10535430908203125, 0.11419296264648438, 0.1230316162109375, 0.13187026977539062, 0.14070892333984375, 0.14954757690429688, 0.15838623046875, 0.16722488403320312, 0.17606353759765625, 0.18490219116210938, 0.1937408447265625, 0.20257949829101562, 0.21141815185546875, 0.22025680541992188, 0.229095458984375, 0.23793411254882812, 0.24677276611328125, 0.2556114196777344, 0.2644500732421875, 0.2732887268066406, 0.28212738037109375, 0.2909660339355469, 0.2998046875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 7.0, 6.0, 15.0, 15.0, 22.0, 34.0, 46.0, 51.0, 89.0, 125.0, 271.0, 390.0, 857.0, 2170.0, 6318.0, 28099.0, 278861.0, 3612183.0, 229796.0, 25331.0, 5907.0, 1929.0, 755.0, 423.0, 200.0, 120.0, 78.0, 47.0, 39.0, 19.0, 16.0, 18.0, 7.0, 7.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.71728515625, -0.6981430053710938, -0.6790008544921875, -0.6598587036132812, -0.640716552734375, -0.6215744018554688, -0.6024322509765625, -0.5832901000976562, -0.56414794921875, -0.5450057983398438, -0.5258636474609375, -0.5067214965820312, -0.487579345703125, -0.46843719482421875, -0.4492950439453125, -0.43015289306640625, -0.4110107421875, -0.39186859130859375, -0.3727264404296875, -0.35358428955078125, -0.334442138671875, -0.31529998779296875, -0.2961578369140625, -0.27701568603515625, -0.25787353515625, -0.23873138427734375, -0.2195892333984375, -0.20044708251953125, -0.181304931640625, -0.16216278076171875, -0.1430206298828125, -0.12387847900390625, -0.104736328125, -0.08559417724609375, -0.0664520263671875, -0.04730987548828125, -0.028167724609375, -0.00902557373046875, 0.0101165771484375, 0.02925872802734375, 0.04840087890625, 0.06754302978515625, 0.0866851806640625, 0.10582733154296875, 0.124969482421875, 0.14411163330078125, 0.1632537841796875, 0.18239593505859375, 0.2015380859375, 0.22068023681640625, 0.2398223876953125, 0.25896453857421875, 0.278106689453125, 0.29724884033203125, 0.3163909912109375, 0.33553314208984375, 0.35467529296875, 0.37381744384765625, 0.3929595947265625, 0.41210174560546875, 0.431243896484375, 0.45038604736328125, 0.4695281982421875, 0.48867034912109375, 0.5078125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 14.0, 21.0, 35.0, 53.0, 73.0, 103.0, 207.0, 395.0, 661.0, 879.0, 663.0, 364.0, 203.0, 139.0, 67.0, 50.0, 31.0, 30.0, 13.0, 17.0, 6.0, 5.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.1727313995361328, -0.16724014282226562, -0.16174888610839844, -0.15625762939453125, -0.15076637268066406, -0.14527511596679688, -0.1397838592529297, -0.1342926025390625, -0.1288013458251953, -0.12331008911132812, -0.11781883239746094, -0.11232757568359375, -0.10683631896972656, -0.10134506225585938, -0.09585380554199219, -0.090362548828125, -0.08487129211425781, -0.07938003540039062, -0.07388877868652344, -0.06839752197265625, -0.06290626525878906, -0.057415008544921875, -0.05192375183105469, -0.0464324951171875, -0.04094123840332031, -0.035449981689453125, -0.029958724975585938, -0.02446746826171875, -0.018976211547851562, -0.013484954833984375, -0.007993698120117188, -0.00250244140625, 0.0029888153076171875, 0.008480072021484375, 0.013971328735351562, 0.01946258544921875, 0.024953842163085938, 0.030445098876953125, 0.03593635559082031, 0.0414276123046875, 0.04691886901855469, 0.052410125732421875, 0.05790138244628906, 0.06339263916015625, 0.06888389587402344, 0.07437515258789062, 0.07986640930175781, 0.085357666015625, 0.09084892272949219, 0.09634017944335938, 0.10183143615722656, 0.10732269287109375, 0.11281394958496094, 0.11830520629882812, 0.12379646301269531, 0.1292877197265625, 0.1347789764404297, 0.14027023315429688, 0.14576148986816406, 0.15125274658203125, 0.15674400329589844, 0.16223526000976562, 0.1677265167236328, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 10.0, 11.0, 15.0, 16.0, 25.0, 37.0, 53.0, 81.0, 98.0, 99.0, 145.0, 105.0, 120.0, 57.0, 43.0, 32.0, 20.0, 14.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5308326482772827, -0.5080342292785645, -0.4852357804775238, -0.46243736147880554, -0.4396389126777649, -0.41684049367904663, -0.39404207468032837, -0.3712436556816101, -0.34844520688056946, -0.3256467878818512, -0.30284833908081055, -0.2800499200820923, -0.257251501083374, -0.23445305228233337, -0.2116546332836151, -0.18885619938373566, -0.1660577654838562, -0.14325933158397675, -0.12046090513467789, -0.09766247868537903, -0.07486404478549957, -0.05206561088562012, -0.029267191886901855, -0.0064687579870224, 0.016329675912857056, 0.03912810608744621, 0.06192653626203537, 0.08472496271133423, 0.10752339661121368, 0.13032183051109314, 0.1531202495098114, 0.17591868340969086, 0.1987171173095703, 0.22151555120944977, 0.24431398510932922, 0.2671124041080475, 0.28991085290908813, 0.3127092719078064, 0.33550769090652466, 0.3583061099052429, 0.38110455870628357, 0.40390297770500183, 0.4267014265060425, 0.44949984550476074, 0.472298264503479, 0.49509671330451965, 0.5178951025009155, 0.5406935811042786, 0.5634920001029968, 0.5862904191017151, 0.6090888381004333, 0.6318873167037964, 0.6546857357025146, 0.6774841547012329, 0.7002825736999512, 0.7230809926986694, 0.7458794116973877, 0.768677830696106, 0.7914762496948242, 0.8142746686935425, 0.8370731472969055, 0.8598715662956238, 0.882669985294342, 0.9054684042930603, 0.9282668828964233]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 12.0, 12.0, 13.0, 26.0, 23.0, 24.0, 33.0, 30.0, 46.0, 32.0, 38.0, 30.0, 30.0, 37.0, 37.0, 39.0, 46.0, 48.0, 41.0, 36.0, 42.0, 42.0, 34.0, 25.0, 26.0, 33.0, 23.0, 23.0, 20.0, 19.0, 10.0, 13.0, 10.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31847622990608215, -0.30862683057785034, -0.29877740144729614, -0.28892800211906433, -0.2790786027908325, -0.2692291736602783, -0.2593797743320465, -0.2495303601026535, -0.2396809458732605, -0.2298315316438675, -0.2199821174144745, -0.21013271808624268, -0.20028330385684967, -0.19043388962745667, -0.18058449029922485, -0.17073507606983185, -0.16088566184043884, -0.15103624761104584, -0.14118683338165283, -0.13133743405342102, -0.12148801982402802, -0.11163860559463501, -0.1017891988158226, -0.09193979203701019, -0.08209037780761719, -0.07224096357822418, -0.062391556799411774, -0.05254214629530907, -0.04269273579120636, -0.03284332528710365, -0.022993914783000946, -0.013144508004188538, -0.00329512357711792, 0.006554286926984787, 0.016403697431087494, 0.0262531079351902, 0.03610251843929291, 0.045951928943395615, 0.05580133944749832, 0.06565074622631073, 0.07550016045570374, 0.08534957468509674, 0.09519898146390915, 0.10504838824272156, 0.11489780247211456, 0.12474721670150757, 0.13459661602973938, 0.14444603025913239, 0.1542954444885254, 0.1641448587179184, 0.1739942729473114, 0.1838436722755432, 0.19369308650493622, 0.20354250073432922, 0.21339190006256104, 0.22324131429195404, 0.23309072852134705, 0.24294014275074005, 0.25278955698013306, 0.26263895630836487, 0.2724883556365967, 0.2823377847671509, 0.2921871840953827, 0.3020365834236145, 0.3118860125541687]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 0.0, 3.0, 10.0, 14.0, 31.0, 46.0, 138.0, 345.0, 923.0, 2830.0, 10380.0, 119000.0, 827631.0, 74976.0, 8535.0, 2364.0, 786.0, 275.0, 132.0, 51.0, 27.0, 17.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16079139709472656, -0.15446853637695312, -0.1481456756591797, -0.14182281494140625, -0.1354999542236328, -0.12917709350585938, -0.12285423278808594, -0.1165313720703125, -0.11020851135253906, -0.10388565063476562, -0.09756278991699219, -0.09123992919921875, -0.08491706848144531, -0.07859420776367188, -0.07227134704589844, -0.065948486328125, -0.05962562561035156, -0.053302764892578125, -0.04697990417480469, -0.04065704345703125, -0.03433418273925781, -0.028011322021484375, -0.021688461303710938, -0.0153656005859375, -0.009042739868164062, -0.002719879150390625, 0.0036029815673828125, 0.00992584228515625, 0.016248703002929688, 0.022571563720703125, 0.028894424438476562, 0.03521728515625, 0.04154014587402344, 0.047863006591796875, 0.05418586730957031, 0.06050872802734375, 0.06683158874511719, 0.07315444946289062, 0.07947731018066406, 0.0858001708984375, 0.09212303161621094, 0.09844589233398438, 0.10476875305175781, 0.11109161376953125, 0.11741447448730469, 0.12373733520507812, 0.13006019592285156, 0.136383056640625, 0.14270591735839844, 0.14902877807617188, 0.1553516387939453, 0.16167449951171875, 0.1679973602294922, 0.17432022094726562, 0.18064308166503906, 0.1869659423828125, 0.19328880310058594, 0.19961166381835938, 0.2059345245361328, 0.21225738525390625, 0.2185802459716797, 0.22490310668945312, 0.23122596740722656, 0.237548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 2.0, 7.0, 14.0, 15.0, 17.0, 23.0, 28.0, 39.0, 38.0, 35.0, 42.0, 54.0, 28.0, 49.0, 53.0, 43.0, 59.0, 52.0, 57.0, 48.0, 38.0, 36.0, 43.0, 23.0, 31.0, 21.0, 28.0, 20.0, 11.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2832679748535156, -0.27527618408203125, -0.2672843933105469, -0.2592926025390625, -0.2513008117675781, -0.24330902099609375, -0.23531723022460938, -0.227325439453125, -0.21933364868164062, -0.21134185791015625, -0.20335006713867188, -0.1953582763671875, -0.18736648559570312, -0.17937469482421875, -0.17138290405273438, -0.16339111328125, -0.15539932250976562, -0.14740753173828125, -0.13941574096679688, -0.1314239501953125, -0.12343215942382812, -0.11544036865234375, -0.10744857788085938, -0.099456787109375, -0.09146499633789062, -0.08347320556640625, -0.07548141479492188, -0.0674896240234375, -0.059497833251953125, -0.05150604248046875, -0.043514251708984375, -0.0355224609375, -0.027530670166015625, -0.01953887939453125, -0.011547088623046875, -0.0035552978515625, 0.004436492919921875, 0.01242828369140625, 0.020420074462890625, 0.028411865234375, 0.036403656005859375, 0.04439544677734375, 0.052387237548828125, 0.0603790283203125, 0.06837081909179688, 0.07636260986328125, 0.08435440063476562, 0.09234619140625, 0.10033798217773438, 0.10832977294921875, 0.11632156372070312, 0.1243133544921875, 0.13230514526367188, 0.14029693603515625, 0.14828872680664062, 0.156280517578125, 0.16427230834960938, 0.17226409912109375, 0.18025588989257812, 0.1882476806640625, 0.19623947143554688, 0.20423126220703125, 0.21222305297851562, 0.22021484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 12.0, 10.0, 16.0, 26.0, 43.0, 72.0, 133.0, 225.0, 441.0, 862.0, 1917.0, 4857.0, 15250.0, 74528.0, 496114.0, 380762.0, 53749.0, 12138.0, 3971.0, 1680.0, 762.0, 397.0, 218.0, 134.0, 93.0, 52.0, 26.0, 20.0, 15.0, 11.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10253620147705078, -0.09942054748535156, -0.09630489349365234, -0.09318923950195312, -0.0900735855102539, -0.08695793151855469, -0.08384227752685547, -0.08072662353515625, -0.07761096954345703, -0.07449531555175781, -0.0713796615600586, -0.06826400756835938, -0.06514835357666016, -0.06203269958496094, -0.05891704559326172, -0.0558013916015625, -0.05268573760986328, -0.04957008361816406, -0.046454429626464844, -0.043338775634765625, -0.040223121643066406, -0.03710746765136719, -0.03399181365966797, -0.03087615966796875, -0.02776050567626953, -0.024644851684570312, -0.021529197692871094, -0.018413543701171875, -0.015297889709472656, -0.012182235717773438, -0.009066581726074219, -0.005950927734375, -0.0028352737426757812, 0.0002803802490234375, 0.0033960342407226562, 0.006511688232421875, 0.009627342224121094, 0.012742996215820312, 0.01585865020751953, 0.01897430419921875, 0.02208995819091797, 0.025205612182617188, 0.028321266174316406, 0.031436920166015625, 0.034552574157714844, 0.03766822814941406, 0.04078388214111328, 0.0438995361328125, 0.04701519012451172, 0.05013084411621094, 0.053246498107910156, 0.056362152099609375, 0.059477806091308594, 0.06259346008300781, 0.06570911407470703, 0.06882476806640625, 0.07194042205810547, 0.07505607604980469, 0.0781717300415039, 0.08128738403320312, 0.08440303802490234, 0.08751869201660156, 0.09063434600830078, 0.09375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 12.0, 10.0, 15.0, 18.0, 29.0, 32.0, 28.0, 38.0, 42.0, 42.0, 32.0, 60.0, 53.0, 58.0, 71.0, 58.0, 42.0, 49.0, 40.0, 34.0, 30.0, 27.0, 24.0, 28.0, 19.0, 25.0, 15.0, 13.0, 4.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453125, -0.4381866455078125, -0.423248291015625, -0.4083099365234375, -0.39337158203125, -0.3784332275390625, -0.363494873046875, -0.3485565185546875, -0.3336181640625, -0.3186798095703125, -0.303741455078125, -0.2888031005859375, -0.27386474609375, -0.2589263916015625, -0.243988037109375, -0.2290496826171875, -0.214111328125, -0.1991729736328125, -0.184234619140625, -0.1692962646484375, -0.15435791015625, -0.1394195556640625, -0.124481201171875, -0.1095428466796875, -0.0946044921875, -0.0796661376953125, -0.064727783203125, -0.0497894287109375, -0.03485107421875, -0.0199127197265625, -0.004974365234375, 0.0099639892578125, 0.02490234375, 0.0398406982421875, 0.054779052734375, 0.0697174072265625, 0.08465576171875, 0.0995941162109375, 0.114532470703125, 0.1294708251953125, 0.1444091796875, 0.1593475341796875, 0.174285888671875, 0.1892242431640625, 0.20416259765625, 0.2191009521484375, 0.234039306640625, 0.2489776611328125, 0.263916015625, 0.2788543701171875, 0.293792724609375, 0.3087310791015625, 0.32366943359375, 0.3386077880859375, 0.353546142578125, 0.3684844970703125, 0.3834228515625, 0.3983612060546875, 0.413299560546875, 0.4282379150390625, 0.44317626953125, 0.4581146240234375, 0.473052978515625, 0.4879913330078125, 0.5029296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 14.0, 15.0, 24.0, 35.0, 48.0, 78.0, 105.0, 172.0, 252.0, 410.0, 748.0, 1427.0, 2772.0, 6212.0, 16022.0, 53096.0, 221021.0, 488824.0, 185438.0, 45874.0, 14584.0, 5701.0, 2522.0, 1355.0, 693.0, 416.0, 250.0, 128.0, 93.0, 66.0, 37.0, 30.0, 28.0, 18.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.022613525390625, -0.021956920623779297, -0.021300315856933594, -0.02064371109008789, -0.019987106323242188, -0.019330501556396484, -0.01867389678955078, -0.018017292022705078, -0.017360687255859375, -0.016704082489013672, -0.01604747772216797, -0.015390872955322266, -0.014734268188476562, -0.01407766342163086, -0.013421058654785156, -0.012764453887939453, -0.01210784912109375, -0.011451244354248047, -0.010794639587402344, -0.01013803482055664, -0.009481430053710938, -0.008824825286865234, -0.008168220520019531, -0.007511615753173828, -0.006855010986328125, -0.006198406219482422, -0.005541801452636719, -0.004885196685791016, -0.0042285919189453125, -0.0035719871520996094, -0.0029153823852539062, -0.002258777618408203, -0.0016021728515625, -0.0009455680847167969, -0.00028896331787109375, 0.0003676414489746094, 0.0010242462158203125, 0.0016808509826660156, 0.0023374557495117188, 0.002994060516357422, 0.003650665283203125, 0.004307270050048828, 0.004963874816894531, 0.005620479583740234, 0.0062770843505859375, 0.006933689117431641, 0.007590293884277344, 0.008246898651123047, 0.00890350341796875, 0.009560108184814453, 0.010216712951660156, 0.01087331771850586, 0.011529922485351562, 0.012186527252197266, 0.012843132019042969, 0.013499736785888672, 0.014156341552734375, 0.014812946319580078, 0.015469551086425781, 0.016126155853271484, 0.016782760620117188, 0.01743936538696289, 0.018095970153808594, 0.018752574920654297, 0.0194091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 12.0, 14.0, 11.0, 23.0, 26.0, 27.0, 29.0, 37.0, 43.0, 64.0, 55.0, 60.0, 78.0, 67.0, 81.0, 57.0, 56.0, 45.0, 46.0, 23.0, 28.0, 23.0, 14.0, 9.0, 15.0, 4.0, 12.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0462477803230286e-05, -1.0136514902114868e-05, -9.81055200099945e-06, -9.484589099884033e-06, -9.158626198768616e-06, -8.832663297653198e-06, -8.50670039653778e-06, -8.180737495422363e-06, -7.854774594306946e-06, -7.528811693191528e-06, -7.202848792076111e-06, -6.876885890960693e-06, -6.550922989845276e-06, -6.224960088729858e-06, -5.898997187614441e-06, -5.5730342864990234e-06, -5.247071385383606e-06, -4.9211084842681885e-06, -4.595145583152771e-06, -4.2691826820373535e-06, -3.943219780921936e-06, -3.6172568798065186e-06, -3.291293978691101e-06, -2.9653310775756836e-06, -2.639368176460266e-06, -2.3134052753448486e-06, -1.987442374229431e-06, -1.6614794731140137e-06, -1.3355165719985962e-06, -1.0095536708831787e-06, -6.835907697677612e-07, -3.5762786865234375e-07, -3.166496753692627e-08, 2.942979335784912e-07, 6.202608346939087e-07, 9.462237358093262e-07, 1.2721866369247437e-06, 1.5981495380401611e-06, 1.9241124391555786e-06, 2.250075340270996e-06, 2.5760382413864136e-06, 2.902001142501831e-06, 3.2279640436172485e-06, 3.553926944732666e-06, 3.8798898458480835e-06, 4.205852746963501e-06, 4.5318156480789185e-06, 4.857778549194336e-06, 5.183741450309753e-06, 5.509704351425171e-06, 5.835667252540588e-06, 6.161630153656006e-06, 6.487593054771423e-06, 6.813555955886841e-06, 7.139518857002258e-06, 7.465481758117676e-06, 7.791444659233093e-06, 8.11740756034851e-06, 8.443370461463928e-06, 8.769333362579346e-06, 9.095296263694763e-06, 9.42125916481018e-06, 9.747222065925598e-06, 1.0073184967041016e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 11.0, 13.0, 12.0, 27.0, 32.0, 57.0, 83.0, 126.0, 208.0, 355.0, 588.0, 1178.0, 2445.0, 6165.0, 17354.0, 59239.0, 222912.0, 442147.0, 211720.0, 56557.0, 16501.0, 5819.0, 2368.0, 1145.0, 576.0, 313.0, 219.0, 131.0, 78.0, 59.0, 24.0, 22.0, 13.0, 14.0, 5.0, 4.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.016899585723876953, -0.016236305236816406, -0.01557302474975586, -0.014909744262695312, -0.014246463775634766, -0.013583183288574219, -0.012919902801513672, -0.012256622314453125, -0.011593341827392578, -0.010930061340332031, -0.010266780853271484, -0.009603500366210938, -0.00894021987915039, -0.008276939392089844, -0.007613658905029297, -0.00695037841796875, -0.006287097930908203, -0.005623817443847656, -0.004960536956787109, -0.0042972564697265625, -0.0036339759826660156, -0.0029706954956054688, -0.002307415008544922, -0.001644134521484375, -0.0009808540344238281, -0.00031757354736328125, 0.0003457069396972656, 0.0010089874267578125, 0.0016722679138183594, 0.0023355484008789062, 0.002998828887939453, 0.003662109375, 0.004325389862060547, 0.004988670349121094, 0.005651950836181641, 0.0063152313232421875, 0.006978511810302734, 0.007641792297363281, 0.008305072784423828, 0.008968353271484375, 0.009631633758544922, 0.010294914245605469, 0.010958194732666016, 0.011621475219726562, 0.01228475570678711, 0.012948036193847656, 0.013611316680908203, 0.01427459716796875, 0.014937877655029297, 0.015601158142089844, 0.01626443862915039, 0.016927719116210938, 0.017590999603271484, 0.01825428009033203, 0.018917560577392578, 0.019580841064453125, 0.020244121551513672, 0.02090740203857422, 0.021570682525634766, 0.022233963012695312, 0.02289724349975586, 0.023560523986816406, 0.024223804473876953, 0.0248870849609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 12.0, 15.0, 19.0, 19.0, 29.0, 31.0, 42.0, 48.0, 49.0, 65.0, 80.0, 70.0, 59.0, 59.0, 51.0, 58.0, 60.0, 34.0, 28.0, 28.0, 28.0, 13.0, 22.0, 5.0, 8.0, 6.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.007099151611328125, -0.006922602653503418, -0.006746053695678711, -0.006569504737854004, -0.006392955780029297, -0.00621640682220459, -0.006039857864379883, -0.005863308906555176, -0.005686759948730469, -0.005510210990905762, -0.005333662033081055, -0.005157113075256348, -0.004980564117431641, -0.004804015159606934, -0.0046274662017822266, -0.0044509172439575195, -0.0042743682861328125, -0.0040978193283081055, -0.0039212703704833984, -0.0037447214126586914, -0.0035681724548339844, -0.0033916234970092773, -0.0032150745391845703, -0.0030385255813598633, -0.0028619766235351562, -0.0026854276657104492, -0.002508878707885742, -0.002332329750061035, -0.002155780792236328, -0.001979231834411621, -0.001802682876586914, -0.001626133918762207, -0.0014495849609375, -0.001273036003112793, -0.001096487045288086, -0.0009199380874633789, -0.0007433891296386719, -0.0005668401718139648, -0.0003902912139892578, -0.00021374225616455078, -3.719329833984375e-05, 0.00013935565948486328, 0.0003159046173095703, 0.0004924535751342773, 0.0006690025329589844, 0.0008455514907836914, 0.0010221004486083984, 0.0011986494064331055, 0.0013751983642578125, 0.0015517473220825195, 0.0017282962799072266, 0.0019048452377319336, 0.0020813941955566406, 0.0022579431533813477, 0.0024344921112060547, 0.0026110410690307617, 0.0027875900268554688, 0.0029641389846801758, 0.003140687942504883, 0.00331723690032959, 0.003493785858154297, 0.003670334815979004, 0.003846883773803711, 0.004023432731628418, 0.004199981689453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 12.0, 27.0, 46.0, 105.0, 211.0, 270.0, 179.0, 91.0, 40.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5026878714561462, -0.4737480580806732, -0.4448082447052002, -0.4158684015274048, -0.38692858815193176, -0.35798877477645874, -0.32904893159866333, -0.3001091182231903, -0.2711693048477173, -0.24222949147224426, -0.21328966319561005, -0.18434983491897583, -0.1554100215435028, -0.12647020816802979, -0.09753037989139557, -0.06859055161476135, -0.03965073823928833, -0.01071091741323471, 0.01822890341281891, 0.04716872423887253, 0.07610854506492615, 0.10504835844039917, 0.1339881867170334, 0.1629280149936676, 0.19186782836914062, 0.22080764174461365, 0.24974747002124786, 0.2786872982978821, 0.3076271116733551, 0.3365669250488281, 0.36550676822662354, 0.39444658160209656, 0.4233863353729248, 0.4523261487483978, 0.48126596212387085, 0.5102058053016663, 0.5391455888748169, 0.5680854320526123, 0.5970252752304077, 0.6259651184082031, 0.6549049019813538, 0.6838447451591492, 0.7127845287322998, 0.7417243719100952, 0.7706642150878906, 0.7996039986610413, 0.8285438418388367, 0.8574836254119873, 0.8864234685897827, 0.9153633117675781, 0.9443030953407288, 0.9732429385185242, 1.0021827220916748, 1.0311225652694702, 1.0600624084472656, 1.089002251625061, 1.1179420948028564, 1.1468819379806519, 1.1758217811584473, 1.2047615051269531, 1.2337013483047485, 1.262641191482544, 1.2915810346603394, 1.3205208778381348, 1.3494606018066406]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 1.0, 16.0, 8.0, 15.0, 15.0, 25.0, 24.0, 42.0, 33.0, 56.0, 42.0, 44.0, 36.0, 54.0, 37.0, 57.0, 62.0, 63.0, 40.0, 55.0, 42.0, 36.0, 34.0, 32.0, 29.0, 28.0, 21.0, 14.0, 9.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29349470138549805, -0.28555718064308167, -0.2776196599006653, -0.2696821391582489, -0.2617446184158325, -0.25380709767341614, -0.24586959183216095, -0.23793207108974457, -0.22999455034732819, -0.2220570296049118, -0.21411950886249542, -0.20618198812007904, -0.19824448227882385, -0.19030696153640747, -0.1823694407939911, -0.1744319200515747, -0.16649439930915833, -0.15855687856674194, -0.15061935782432556, -0.14268183708190918, -0.1347443163394928, -0.12680679559707642, -0.11886928975582123, -0.11093176901340485, -0.10299424827098846, -0.09505672752857208, -0.0871192067861557, -0.07918169349431992, -0.07124417275190353, -0.06330665200948715, -0.05536913499236107, -0.047431617975234985, -0.039494067430496216, -0.031556546688079834, -0.02361902967095375, -0.015681510791182518, -0.007743991911411285, 0.00019352883100509644, 0.00813104584813118, 0.016068562865257263, 0.024006083607673645, 0.03194360435009003, 0.03988112136721611, 0.047818638384342194, 0.055756159126758575, 0.06369367986917496, 0.07163119316101074, 0.07956871390342712, 0.0875062346458435, 0.09544375538825989, 0.10338127613067627, 0.11131878942251205, 0.11925631016492844, 0.12719383835792542, 0.1351313441991806, 0.14306886494159698, 0.15100638568401337, 0.15894390642642975, 0.16688142716884613, 0.1748189479112625, 0.1827564537525177, 0.19069397449493408, 0.19863149523735046, 0.20656901597976685, 0.21450653672218323]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 8.0, 12.0, 16.0, 34.0, 46.0, 71.0, 118.0, 219.0, 419.0, 787.0, 1548.0, 3218.0, 7573.0, 19814.0, 61345.0, 723252.0, 172201.0, 35335.0, 12534.0, 5225.0, 2288.0, 1176.0, 535.0, 296.0, 176.0, 103.0, 58.0, 38.0, 14.0, 18.0, 12.0, 8.0, 7.0, 3.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29596710205078125, -0.2860260009765625, -0.27608489990234375, -0.266143798828125, -0.25620269775390625, -0.2462615966796875, -0.23632049560546875, -0.22637939453125, -0.21643829345703125, -0.2064971923828125, -0.19655609130859375, -0.186614990234375, -0.17667388916015625, -0.1667327880859375, -0.15679168701171875, -0.1468505859375, -0.13690948486328125, -0.1269683837890625, -0.11702728271484375, -0.107086181640625, -0.09714508056640625, -0.0872039794921875, -0.07726287841796875, -0.06732177734375, -0.05738067626953125, -0.0474395751953125, -0.03749847412109375, -0.027557373046875, -0.01761627197265625, -0.0076751708984375, 0.00226593017578125, 0.01220703125, 0.02214813232421875, 0.0320892333984375, 0.04203033447265625, 0.051971435546875, 0.06191253662109375, 0.0718536376953125, 0.08179473876953125, 0.09173583984375, 0.10167694091796875, 0.1116180419921875, 0.12155914306640625, 0.131500244140625, 0.14144134521484375, 0.1513824462890625, 0.16132354736328125, 0.1712646484375, 0.18120574951171875, 0.1911468505859375, 0.20108795166015625, 0.211029052734375, 0.22097015380859375, 0.2309112548828125, 0.24085235595703125, 0.25079345703125, 0.26073455810546875, 0.2706756591796875, 0.28061676025390625, 0.290557861328125, 0.30049896240234375, 0.3104400634765625, 0.32038116455078125, 0.330322265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 11.0, 12.0, 14.0, 24.0, 29.0, 43.0, 41.0, 64.0, 59.0, 52.0, 72.0, 61.0, 113.0, 63.0, 60.0, 64.0, 52.0, 41.0, 39.0, 31.0, 21.0, 16.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6651153564453125, -0.642730712890625, -0.6203460693359375, -0.59796142578125, -0.5755767822265625, -0.553192138671875, -0.5308074951171875, -0.5084228515625, -0.4860382080078125, -0.463653564453125, -0.4412689208984375, -0.41888427734375, -0.3964996337890625, -0.374114990234375, -0.3517303466796875, -0.329345703125, -0.3069610595703125, -0.284576416015625, -0.2621917724609375, -0.23980712890625, -0.2174224853515625, -0.195037841796875, -0.1726531982421875, -0.1502685546875, -0.1278839111328125, -0.105499267578125, -0.0831146240234375, -0.06072998046875, -0.0383453369140625, -0.015960693359375, 0.0064239501953125, 0.02880859375, 0.0511932373046875, 0.073577880859375, 0.0959625244140625, 0.11834716796875, 0.1407318115234375, 0.163116455078125, 0.1855010986328125, 0.2078857421875, 0.2302703857421875, 0.252655029296875, 0.2750396728515625, 0.29742431640625, 0.3198089599609375, 0.342193603515625, 0.3645782470703125, 0.386962890625, 0.4093475341796875, 0.431732177734375, 0.4541168212890625, 0.47650146484375, 0.4988861083984375, 0.521270751953125, 0.5436553955078125, 0.5660400390625, 0.5884246826171875, 0.610809326171875, 0.6331939697265625, 0.65557861328125, 0.6779632568359375, 0.700347900390625, 0.7227325439453125, 0.7451171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 8.0, 16.0, 6.0, 15.0, 21.0, 21.0, 18.0, 27.0, 53.0, 47.0, 79.0, 94.0, 153.0, 418.0, 2624.0, 40775.0, 963344.0, 37367.0, 2453.0, 460.0, 137.0, 90.0, 83.0, 53.0, 41.0, 40.0, 28.0, 22.0, 9.0, 6.0, 12.0, 6.0, 11.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7556228637695312, -0.7299957275390625, -0.7043685913085938, -0.678741455078125, -0.6531143188476562, -0.6274871826171875, -0.6018600463867188, -0.57623291015625, -0.5506057739257812, -0.5249786376953125, -0.49935150146484375, -0.473724365234375, -0.44809722900390625, -0.4224700927734375, -0.39684295654296875, -0.3712158203125, -0.34558868408203125, -0.3199615478515625, -0.29433441162109375, -0.268707275390625, -0.24308013916015625, -0.2174530029296875, -0.19182586669921875, -0.16619873046875, -0.14057159423828125, -0.1149444580078125, -0.08931732177734375, -0.063690185546875, -0.03806304931640625, -0.0124359130859375, 0.01319122314453125, 0.038818359375, 0.06444549560546875, 0.0900726318359375, 0.11569976806640625, 0.141326904296875, 0.16695404052734375, 0.1925811767578125, 0.21820831298828125, 0.24383544921875, 0.26946258544921875, 0.2950897216796875, 0.32071685791015625, 0.346343994140625, 0.37197113037109375, 0.3975982666015625, 0.42322540283203125, 0.4488525390625, 0.47447967529296875, 0.5001068115234375, 0.5257339477539062, 0.551361083984375, 0.5769882202148438, 0.6026153564453125, 0.6282424926757812, 0.65386962890625, 0.6794967651367188, 0.7051239013671875, 0.7307510375976562, 0.756378173828125, 0.7820053100585938, 0.8076324462890625, 0.8332595825195312, 0.85888671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 9.0, 16.0, 11.0, 20.0, 25.0, 28.0, 33.0, 26.0, 50.0, 45.0, 41.0, 59.0, 44.0, 36.0, 59.0, 59.0, 64.0, 53.0, 38.0, 40.0, 34.0, 29.0, 29.0, 24.0, 25.0, 19.0, 13.0, 16.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6376953125, -0.618560791015625, -0.59942626953125, -0.580291748046875, -0.5611572265625, -0.542022705078125, -0.52288818359375, -0.503753662109375, -0.484619140625, -0.465484619140625, -0.44635009765625, -0.427215576171875, -0.4080810546875, -0.388946533203125, -0.36981201171875, -0.350677490234375, -0.33154296875, -0.312408447265625, -0.29327392578125, -0.274139404296875, -0.2550048828125, -0.235870361328125, -0.21673583984375, -0.197601318359375, -0.178466796875, -0.159332275390625, -0.14019775390625, -0.121063232421875, -0.1019287109375, -0.082794189453125, -0.06365966796875, -0.044525146484375, -0.025390625, -0.006256103515625, 0.01287841796875, 0.032012939453125, 0.0511474609375, 0.070281982421875, 0.08941650390625, 0.108551025390625, 0.127685546875, 0.146820068359375, 0.16595458984375, 0.185089111328125, 0.2042236328125, 0.223358154296875, 0.24249267578125, 0.261627197265625, 0.28076171875, 0.299896240234375, 0.31903076171875, 0.338165283203125, 0.3572998046875, 0.376434326171875, 0.39556884765625, 0.414703369140625, 0.433837890625, 0.452972412109375, 0.47210693359375, 0.491241455078125, 0.5103759765625, 0.529510498046875, 0.54864501953125, 0.567779541015625, 0.5869140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 11.0, 20.0, 14.0, 17.0, 26.0, 49.0, 90.0, 178.0, 325.0, 776.0, 2071.0, 7648.0, 83154.0, 915758.0, 31207.0, 4498.0, 1379.0, 650.0, 293.0, 142.0, 86.0, 50.0, 41.0, 15.0, 12.0, 14.0, 4.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.3470268249511719, -0.33882904052734375, -0.3306312561035156, -0.3224334716796875, -0.3142356872558594, -0.30603790283203125, -0.2978401184082031, -0.289642333984375, -0.2814445495605469, -0.27324676513671875, -0.2650489807128906, -0.2568511962890625, -0.24865341186523438, -0.24045562744140625, -0.23225784301757812, -0.22406005859375, -0.21586227416992188, -0.20766448974609375, -0.19946670532226562, -0.1912689208984375, -0.18307113647460938, -0.17487335205078125, -0.16667556762695312, -0.158477783203125, -0.15027999877929688, -0.14208221435546875, -0.13388442993164062, -0.1256866455078125, -0.11748886108398438, -0.10929107666015625, -0.10109329223632812, -0.0928955078125, -0.08469772338867188, -0.07649993896484375, -0.06830215454101562, -0.0601043701171875, -0.051906585693359375, -0.04370880126953125, -0.035511016845703125, -0.027313232421875, -0.019115447998046875, -0.01091766357421875, -0.002719879150390625, 0.0054779052734375, 0.013675689697265625, 0.02187347412109375, 0.030071258544921875, 0.03826904296875, 0.046466827392578125, 0.05466461181640625, 0.06286239624023438, 0.0710601806640625, 0.07925796508789062, 0.08745574951171875, 0.09565353393554688, 0.103851318359375, 0.11204910278320312, 0.12024688720703125, 0.12844467163085938, 0.1366424560546875, 0.14484024047851562, 0.15303802490234375, 0.16123580932617188, 0.16943359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 13.0, 14.0, 20.0, 35.0, 48.0, 148.0, 517.0, 81.0, 48.0, 32.0, 16.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860494613647461e-05, -6.705615669488907e-05, -6.550736725330353e-05, -6.395857781171799e-05, -6.240978837013245e-05, -6.0860998928546906e-05, -5.9312209486961365e-05, -5.7763420045375824e-05, -5.621463060379028e-05, -5.466584116220474e-05, -5.31170517206192e-05, -5.156826227903366e-05, -5.001947283744812e-05, -4.847068339586258e-05, -4.692189395427704e-05, -4.53731045126915e-05, -4.382431507110596e-05, -4.2275525629520416e-05, -4.0726736187934875e-05, -3.9177946746349335e-05, -3.7629157304763794e-05, -3.608036786317825e-05, -3.453157842159271e-05, -3.298278898000717e-05, -3.143399953842163e-05, -2.988521009683609e-05, -2.833642065525055e-05, -2.678763121366501e-05, -2.5238841772079468e-05, -2.3690052330493927e-05, -2.2141262888908386e-05, -2.0592473447322845e-05, -1.9043684005737305e-05, -1.7494894564151764e-05, -1.5946105122566223e-05, -1.4397315680980682e-05, -1.2848526239395142e-05, -1.12997367978096e-05, -9.75094735622406e-06, -8.20215791463852e-06, -6.6533684730529785e-06, -5.104579031467438e-06, -3.555789589881897e-06, -2.007000148296356e-06, -4.5821070671081543e-07, 1.0905787348747253e-06, 2.639368176460266e-06, 4.188157618045807e-06, 5.736947059631348e-06, 7.2857365012168884e-06, 8.83452594280243e-06, 1.038331538438797e-05, 1.193210482597351e-05, 1.3480894267559052e-05, 1.5029683709144592e-05, 1.6578473150730133e-05, 1.8127262592315674e-05, 1.9676052033901215e-05, 2.1224841475486755e-05, 2.2773630917072296e-05, 2.4322420358657837e-05, 2.5871209800243378e-05, 2.741999924182892e-05, 2.896878868341446e-05, 3.0517578125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 18.0, 32.0, 93.0, 163.0, 265.0, 519.0, 1166.0, 4470.0, 90519.0, 932297.0, 15328.0, 2086.0, 763.0, 373.0, 201.0, 100.0, 57.0, 33.0, 20.0, 8.0, 4.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.322265625, -0.3104400634765625, -0.298614501953125, -0.2867889404296875, -0.27496337890625, -0.2631378173828125, -0.251312255859375, -0.2394866943359375, -0.2276611328125, -0.2158355712890625, -0.204010009765625, -0.1921844482421875, -0.18035888671875, -0.1685333251953125, -0.156707763671875, -0.1448822021484375, -0.133056640625, -0.1212310791015625, -0.109405517578125, -0.0975799560546875, -0.08575439453125, -0.0739288330078125, -0.062103271484375, -0.0502777099609375, -0.0384521484375, -0.0266265869140625, -0.014801025390625, -0.0029754638671875, 0.00885009765625, 0.0206756591796875, 0.032501220703125, 0.0443267822265625, 0.05615234375, 0.0679779052734375, 0.079803466796875, 0.0916290283203125, 0.10345458984375, 0.1152801513671875, 0.127105712890625, 0.1389312744140625, 0.1507568359375, 0.1625823974609375, 0.174407958984375, 0.1862335205078125, 0.19805908203125, 0.2098846435546875, 0.221710205078125, 0.2335357666015625, 0.245361328125, 0.2571868896484375, 0.269012451171875, 0.2808380126953125, 0.29266357421875, 0.3044891357421875, 0.316314697265625, 0.3281402587890625, 0.3399658203125, 0.3517913818359375, 0.363616943359375, 0.3754425048828125, 0.38726806640625, 0.3990936279296875, 0.410919189453125, 0.4227447509765625, 0.4345703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 16.0, 30.0, 52.0, 69.0, 361.0, 289.0, 65.0, 39.0, 24.0, 18.0, 14.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14690303802490234, -0.1429271697998047, -0.13895130157470703, -0.13497543334960938, -0.13099956512451172, -0.12702369689941406, -0.1230478286743164, -0.11907196044921875, -0.1150960922241211, -0.11112022399902344, -0.10714435577392578, -0.10316848754882812, -0.09919261932373047, -0.09521675109863281, -0.09124088287353516, -0.0872650146484375, -0.08328914642333984, -0.07931327819824219, -0.07533740997314453, -0.07136154174804688, -0.06738567352294922, -0.06340980529785156, -0.059433937072753906, -0.05545806884765625, -0.051482200622558594, -0.04750633239746094, -0.04353046417236328, -0.039554595947265625, -0.03557872772216797, -0.03160285949707031, -0.027626991271972656, -0.023651123046875, -0.019675254821777344, -0.015699386596679688, -0.011723518371582031, -0.007747650146484375, -0.0037717819213867188, 0.0002040863037109375, 0.004179954528808594, 0.00815582275390625, 0.012131690979003906, 0.016107559204101562, 0.02008342742919922, 0.024059295654296875, 0.02803516387939453, 0.03201103210449219, 0.035986900329589844, 0.0399627685546875, 0.043938636779785156, 0.04791450500488281, 0.05189037322998047, 0.055866241455078125, 0.05984210968017578, 0.06381797790527344, 0.0677938461303711, 0.07176971435546875, 0.0757455825805664, 0.07972145080566406, 0.08369731903076172, 0.08767318725585938, 0.09164905548095703, 0.09562492370605469, 0.09960079193115234, 0.10357666015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 9.0, 23.0, 65.0, 188.0, 355.0, 262.0, 77.0, 23.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4813905656337738, -0.3963336944580078, -0.31127679347991943, -0.22621992230415344, -0.14116302132606506, -0.056106120347976685, 0.02895072102546692, 0.1140076220035553, 0.19906452298164368, 0.28412139415740967, 0.36917829513549805, 0.45423516631126404, 0.5392920970916748, 0.6243489980697632, 0.709405779838562, 0.7944626808166504, 0.8795195817947388, 0.9645764827728271, 1.0496333837509155, 1.134690284729004, 1.2197470664978027, 1.3048040866851807, 1.3898608684539795, 1.4749177694320679, 1.5599746704101562, 1.6450315713882446, 1.730088472366333, 1.8151452541351318, 1.9002022743225098, 1.9852590560913086, 2.0703158378601074, 2.1553728580474854, 2.2404298782348633, 2.325486660003662, 2.41054368019104, 2.495600461959839, 2.580657482147217, 2.6657142639160156, 2.7507710456848145, 2.8358280658721924, 2.9208850860595703, 3.005941867828369, 3.090998888015747, 3.176055669784546, 3.261112689971924, 3.3461694717407227, 3.4312262535095215, 3.5162832736968994, 3.6013400554656982, 3.686396837234497, 3.771453857421875, 3.856510639190674, 3.9415676593780518, 4.02662467956543, 4.1116814613342285, 4.196738243103027, 4.281795024871826, 4.366851806640625, 4.451908588409424, 4.536965847015381, 4.62202262878418, 4.7070794105529785, 4.792136192321777, 4.877193450927734, 4.962250232696533]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 4.0, 2.0, 12.0, 16.0, 10.0, 10.0, 19.0, 11.0, 25.0, 20.0, 26.0, 23.0, 23.0, 35.0, 38.0, 42.0, 38.0, 47.0, 30.0, 51.0, 36.0, 40.0, 38.0, 45.0, 39.0, 38.0, 30.0, 47.0, 36.0, 26.0, 23.0, 18.0, 11.0, 19.0, 8.0, 14.0, 11.0, 10.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8738496899604797, -0.8473448157310486, -0.8208399415016174, -0.7943350672721863, -0.7678301930427551, -0.741325318813324, -0.7148204445838928, -0.6883155703544617, -0.6618106961250305, -0.6353058218955994, -0.6088009476661682, -0.5822960734367371, -0.5557911992073059, -0.5292863249778748, -0.5027814507484436, -0.47627657651901245, -0.4497717320919037, -0.42326685786247253, -0.3967619836330414, -0.37025710940361023, -0.3437522351741791, -0.3172473907470703, -0.29074251651763916, -0.264237642288208, -0.23773275315761566, -0.2112278789281845, -0.18472300469875336, -0.1582181453704834, -0.13171327114105225, -0.1052083969116211, -0.07870352268218994, -0.05219864845275879, -0.025693774223327637, 0.0008110981434583664, 0.02731597051024437, 0.05382084101438522, 0.08032571524381638, 0.10683058202266693, 0.13333545625209808, 0.15984033048152924, 0.1863452047109604, 0.21285007894039154, 0.2393549531698227, 0.26585981249809265, 0.2923646867275238, 0.31886956095695496, 0.3453744351863861, 0.37187930941581726, 0.3983841836452484, 0.42488905787467957, 0.4513939321041107, 0.47789880633354187, 0.5044036507606506, 0.5309085249900818, 0.5574133992195129, 0.5839182734489441, 0.6104231476783752, 0.6369280219078064, 0.6634328961372375, 0.6899377703666687, 0.7164426445960999, 0.742947518825531, 0.7694523930549622, 0.7959572672843933, 0.8224621415138245]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 17.0, 23.0, 23.0, 30.0, 50.0, 56.0, 146.0, 251.0, 452.0, 1401.0, 4552.0, 21710.0, 419023.0, 3617665.0, 112161.0, 12039.0, 2807.0, 978.0, 386.0, 178.0, 97.0, 71.0, 51.0, 24.0, 21.0, 18.0, 6.0, 6.0, 3.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7046051025390625, -0.676788330078125, -0.6489715576171875, -0.62115478515625, -0.5933380126953125, -0.565521240234375, -0.5377044677734375, -0.5098876953125, -0.4820709228515625, -0.454254150390625, -0.4264373779296875, -0.39862060546875, -0.3708038330078125, -0.342987060546875, -0.3151702880859375, -0.287353515625, -0.2595367431640625, -0.231719970703125, -0.2039031982421875, -0.17608642578125, -0.1482696533203125, -0.120452880859375, -0.0926361083984375, -0.0648193359375, -0.0370025634765625, -0.009185791015625, 0.0186309814453125, 0.04644775390625, 0.0742645263671875, 0.102081298828125, 0.1298980712890625, 0.15771484375, 0.1855316162109375, 0.213348388671875, 0.2411651611328125, 0.26898193359375, 0.2967987060546875, 0.324615478515625, 0.3524322509765625, 0.3802490234375, 0.4080657958984375, 0.435882568359375, 0.4636993408203125, 0.49151611328125, 0.5193328857421875, 0.547149658203125, 0.5749664306640625, 0.602783203125, 0.6305999755859375, 0.658416748046875, 0.6862335205078125, 0.71405029296875, 0.7418670654296875, 0.769683837890625, 0.7975006103515625, 0.8253173828125, 0.8531341552734375, 0.880950927734375, 0.9087677001953125, 0.93658447265625, 0.9644012451171875, 0.992218017578125, 1.0200347900390625, 1.0478515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 7.0, 21.0, 15.0, 12.0, 21.0, 19.0, 36.0, 25.0, 44.0, 39.0, 47.0, 48.0, 40.0, 51.0, 60.0, 59.0, 57.0, 51.0, 50.0, 36.0, 37.0, 41.0, 33.0, 29.0, 23.0, 9.0, 20.0, 12.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.2958564758300781, -0.28702545166015625, -0.2781944274902344, -0.2693634033203125, -0.2605323791503906, -0.25170135498046875, -0.24287033081054688, -0.234039306640625, -0.22520828247070312, -0.21637725830078125, -0.20754623413085938, -0.1987152099609375, -0.18988418579101562, -0.18105316162109375, -0.17222213745117188, -0.16339111328125, -0.15456008911132812, -0.14572906494140625, -0.13689804077148438, -0.1280670166015625, -0.11923599243164062, -0.11040496826171875, -0.10157394409179688, -0.092742919921875, -0.08391189575195312, -0.07508087158203125, -0.06624984741210938, -0.0574188232421875, -0.048587799072265625, -0.03975677490234375, -0.030925750732421875, -0.0220947265625, -0.013263702392578125, -0.00443267822265625, 0.004398345947265625, 0.0132293701171875, 0.022060394287109375, 0.03089141845703125, 0.039722442626953125, 0.048553466796875, 0.057384490966796875, 0.06621551513671875, 0.07504653930664062, 0.0838775634765625, 0.09270858764648438, 0.10153961181640625, 0.11037063598632812, 0.11920166015625, 0.12803268432617188, 0.13686370849609375, 0.14569473266601562, 0.1545257568359375, 0.16335678100585938, 0.17218780517578125, 0.18101882934570312, 0.189849853515625, 0.19868087768554688, 0.20751190185546875, 0.21634292602539062, 0.2251739501953125, 0.23400497436523438, 0.24283599853515625, 0.2516670227050781, 0.260498046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 11.0, 23.0, 31.0, 50.0, 133.0, 313.0, 871.0, 3555.0, 42983.0, 3934223.0, 202189.0, 7672.0, 1428.0, 445.0, 167.0, 76.0, 51.0, 15.0, 16.0, 8.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2099609375, -1.1705322265625, -1.131103515625, -1.0916748046875, -1.05224609375, -1.0128173828125, -0.973388671875, -0.9339599609375, -0.89453125, -0.8551025390625, -0.815673828125, -0.7762451171875, -0.73681640625, -0.6973876953125, -0.657958984375, -0.6185302734375, -0.5791015625, -0.5396728515625, -0.500244140625, -0.4608154296875, -0.42138671875, -0.3819580078125, -0.342529296875, -0.3031005859375, -0.263671875, -0.2242431640625, -0.184814453125, -0.1453857421875, -0.10595703125, -0.0665283203125, -0.027099609375, 0.0123291015625, 0.0517578125, 0.0911865234375, 0.130615234375, 0.1700439453125, 0.20947265625, 0.2489013671875, 0.288330078125, 0.3277587890625, 0.3671875, 0.4066162109375, 0.446044921875, 0.4854736328125, 0.52490234375, 0.5643310546875, 0.603759765625, 0.6431884765625, 0.6826171875, 0.7220458984375, 0.761474609375, 0.8009033203125, 0.84033203125, 0.8797607421875, 0.919189453125, 0.9586181640625, 0.998046875, 1.0374755859375, 1.076904296875, 1.1163330078125, 1.15576171875, 1.1951904296875, 1.234619140625, 1.2740478515625, 1.3134765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 41.0, 53.0, 94.0, 173.0, 363.0, 841.0, 1210.0, 676.0, 274.0, 139.0, 63.0, 45.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.32614707946777344, -0.3180656433105469, -0.3099842071533203, -0.30190277099609375, -0.2938213348388672, -0.2857398986816406, -0.27765846252441406, -0.2695770263671875, -0.26149559020996094, -0.2534141540527344, -0.2453327178955078, -0.23725128173828125, -0.2291698455810547, -0.22108840942382812, -0.21300697326660156, -0.204925537109375, -0.19684410095214844, -0.18876266479492188, -0.1806812286376953, -0.17259979248046875, -0.1645183563232422, -0.15643692016601562, -0.14835548400878906, -0.1402740478515625, -0.13219261169433594, -0.12411117553710938, -0.11602973937988281, -0.10794830322265625, -0.09986686706542969, -0.09178543090820312, -0.08370399475097656, -0.07562255859375, -0.06754112243652344, -0.059459686279296875, -0.05137825012207031, -0.04329681396484375, -0.03521537780761719, -0.027133941650390625, -0.019052505493164062, -0.0109710693359375, -0.0028896331787109375, 0.005191802978515625, 0.013273239135742188, 0.02135467529296875, 0.029436111450195312, 0.037517547607421875, 0.04559898376464844, 0.053680419921875, 0.06176185607910156, 0.06984329223632812, 0.07792472839355469, 0.08600616455078125, 0.09408760070800781, 0.10216903686523438, 0.11025047302246094, 0.1183319091796875, 0.12641334533691406, 0.13449478149414062, 0.1425762176513672, 0.15065765380859375, 0.1587390899658203, 0.16682052612304688, 0.17490196228027344, 0.1829833984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 20.0, 16.0, 39.0, 43.0, 74.0, 80.0, 100.0, 121.0, 128.0, 107.0, 96.0, 54.0, 38.0, 30.0, 11.0, 16.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7881006598472595, -0.7657932639122009, -0.7434858679771423, -0.7211785316467285, -0.6988711357116699, -0.6765637397766113, -0.6542563438415527, -0.6319489479064941, -0.6096415519714355, -0.587334156036377, -0.5650267601013184, -0.5427193641662598, -0.520412027835846, -0.49810463190078735, -0.47579723596572876, -0.45348984003067017, -0.43118247389793396, -0.40887507796287537, -0.38656771183013916, -0.36426031589508057, -0.341952919960022, -0.3196455240249634, -0.2973381578922272, -0.2750307619571686, -0.2527233958244324, -0.23041601479053497, -0.20810861885547638, -0.18580123782157898, -0.16349384188652039, -0.14118646085262299, -0.11887907981872559, -0.09657168388366699, -0.0742642879486084, -0.0519568994641304, -0.029649514704942703, -0.007342129945755005, 0.014965258538722992, 0.03727264702320099, 0.05958002805709839, 0.08188742399215698, 0.10419480502605438, 0.12650218605995178, 0.14880958199501038, 0.17111696302890778, 0.19342434406280518, 0.21573173999786377, 0.23803912103176117, 0.26034653186798096, 0.28265389800071716, 0.30496129393577576, 0.32726866006851196, 0.34957605600357056, 0.37188345193862915, 0.39419084787368774, 0.41649821400642395, 0.43880560994148254, 0.46111297607421875, 0.48342037200927734, 0.5057277679443359, 0.5280351638793945, 0.5503425002098083, 0.5726498961448669, 0.5949572920799255, 0.6172646880149841, 0.6395720839500427]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 9.0, 13.0, 16.0, 15.0, 14.0, 20.0, 17.0, 20.0, 27.0, 32.0, 46.0, 27.0, 31.0, 48.0, 39.0, 57.0, 47.0, 38.0, 39.0, 44.0, 43.0, 26.0, 33.0, 29.0, 29.0, 31.0, 26.0, 21.0, 22.0, 20.0, 9.0, 19.0, 17.0, 8.0, 9.0, 5.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32736608386039734, -0.3176831007003784, -0.3080001473426819, -0.29831716418266296, -0.28863418102264404, -0.2789512276649475, -0.2692682445049286, -0.25958526134490967, -0.24990229308605194, -0.2402193248271942, -0.2305363416671753, -0.22085337340831757, -0.21117040514945984, -0.20148742198944092, -0.1918044537305832, -0.18212148547172546, -0.17243850231170654, -0.16275553405284882, -0.1530725508928299, -0.14338958263397217, -0.13370659947395325, -0.12402363121509552, -0.11434066295623779, -0.10465768724679947, -0.09497471153736115, -0.08529173582792282, -0.0756087601184845, -0.06592579185962677, -0.056242816150188446, -0.04655984044075012, -0.0368768684566021, -0.02719389647245407, -0.017510920763015747, -0.007827946916222572, 0.0018550269305706024, 0.011538000777363777, 0.021220974624156952, 0.030903950333595276, 0.0405869223177433, 0.05026989430189133, 0.05995287001132965, 0.06963584572076797, 0.0793188214302063, 0.08900178968906403, 0.09868476539850235, 0.10836774110794067, 0.1180507093667984, 0.12773367762565613, 0.13741666078567505, 0.14709962904453278, 0.1567826122045517, 0.16646558046340942, 0.17614856362342834, 0.18583153188228607, 0.1955145001411438, 0.20519748330116272, 0.21488045156002045, 0.22456341981887817, 0.2342464029788971, 0.24392937123775482, 0.25361233949661255, 0.26329532265663147, 0.2729783058166504, 0.2826612591743469, 0.29234424233436584]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 11.0, 8.0, 18.0, 20.0, 40.0, 63.0, 101.0, 258.0, 455.0, 932.0, 2073.0, 4916.0, 12592.0, 48545.0, 530922.0, 391153.0, 37620.0, 10989.0, 4365.0, 1812.0, 829.0, 369.0, 202.0, 102.0, 49.0, 29.0, 18.0, 17.0, 6.0, 6.0, 6.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983642578125, -0.19173622131347656, -0.18510818481445312, -0.1784801483154297, -0.17185211181640625, -0.1652240753173828, -0.15859603881835938, -0.15196800231933594, -0.1453399658203125, -0.13871192932128906, -0.13208389282226562, -0.1254558563232422, -0.11882781982421875, -0.11219978332519531, -0.10557174682617188, -0.09894371032714844, -0.092315673828125, -0.08568763732910156, -0.07905960083007812, -0.07243156433105469, -0.06580352783203125, -0.05917549133300781, -0.052547454833984375, -0.04591941833496094, -0.0392913818359375, -0.03266334533691406, -0.026035308837890625, -0.019407272338867188, -0.01277923583984375, -0.0061511993408203125, 0.000476837158203125, 0.0071048736572265625, 0.01373291015625, 0.020360946655273438, 0.026988983154296875, 0.03361701965332031, 0.04024505615234375, 0.04687309265136719, 0.053501129150390625, 0.06012916564941406, 0.0667572021484375, 0.07338523864746094, 0.08001327514648438, 0.08664131164550781, 0.09326934814453125, 0.09989738464355469, 0.10652542114257812, 0.11315345764160156, 0.119781494140625, 0.12640953063964844, 0.13303756713867188, 0.1396656036376953, 0.14629364013671875, 0.1529216766357422, 0.15954971313476562, 0.16617774963378906, 0.1728057861328125, 0.17943382263183594, 0.18606185913085938, 0.1926898956298828, 0.19931793212890625, 0.2059459686279297, 0.21257400512695312, 0.21920204162597656, 0.225830078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 14.0, 13.0, 17.0, 20.0, 21.0, 25.0, 25.0, 42.0, 42.0, 56.0, 36.0, 66.0, 63.0, 58.0, 55.0, 56.0, 52.0, 44.0, 50.0, 47.0, 35.0, 32.0, 25.0, 24.0, 19.0, 20.0, 8.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2749481201171875, -0.265472412109375, -0.2559967041015625, -0.24652099609375, -0.2370452880859375, -0.227569580078125, -0.2180938720703125, -0.2086181640625, -0.1991424560546875, -0.189666748046875, -0.1801910400390625, -0.17071533203125, -0.1612396240234375, -0.151763916015625, -0.1422882080078125, -0.1328125, -0.1233367919921875, -0.113861083984375, -0.1043853759765625, -0.09490966796875, -0.0854339599609375, -0.075958251953125, -0.0664825439453125, -0.0570068359375, -0.0475311279296875, -0.038055419921875, -0.0285797119140625, -0.01910400390625, -0.0096282958984375, -0.000152587890625, 0.0093231201171875, 0.018798828125, 0.0282745361328125, 0.037750244140625, 0.0472259521484375, 0.05670166015625, 0.0661773681640625, 0.075653076171875, 0.0851287841796875, 0.0946044921875, 0.1040802001953125, 0.113555908203125, 0.1230316162109375, 0.13250732421875, 0.1419830322265625, 0.151458740234375, 0.1609344482421875, 0.17041015625, 0.1798858642578125, 0.189361572265625, 0.1988372802734375, 0.20831298828125, 0.2177886962890625, 0.227264404296875, 0.2367401123046875, 0.2462158203125, 0.2556915283203125, 0.265167236328125, 0.2746429443359375, 0.28411865234375, 0.2935943603515625, 0.303070068359375, 0.3125457763671875, 0.322021484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 13.0, 17.0, 18.0, 29.0, 42.0, 40.0, 81.0, 122.0, 138.0, 219.0, 339.0, 578.0, 951.0, 1671.0, 3203.0, 6877.0, 15393.0, 41863.0, 148197.0, 448736.0, 268096.0, 69813.0, 22853.0, 9428.0, 4385.0, 2244.0, 1237.0, 687.0, 418.0, 256.0, 167.0, 123.0, 91.0, 55.0, 35.0, 39.0, 31.0, 21.0, 18.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0916748046875, -0.08895587921142578, -0.08623695373535156, -0.08351802825927734, -0.08079910278320312, -0.0780801773071289, -0.07536125183105469, -0.07264232635498047, -0.06992340087890625, -0.06720447540283203, -0.06448554992675781, -0.061766624450683594, -0.059047698974609375, -0.056328773498535156, -0.05360984802246094, -0.05089092254638672, -0.0481719970703125, -0.04545307159423828, -0.04273414611816406, -0.040015220642089844, -0.037296295166015625, -0.034577369689941406, -0.03185844421386719, -0.02913951873779297, -0.02642059326171875, -0.02370166778564453, -0.020982742309570312, -0.018263816833496094, -0.015544891357421875, -0.012825965881347656, -0.010107040405273438, -0.007388114929199219, -0.004669189453125, -0.0019502639770507812, 0.0007686614990234375, 0.0034875869750976562, 0.006206512451171875, 0.008925437927246094, 0.011644363403320312, 0.014363288879394531, 0.01708221435546875, 0.01980113983154297, 0.022520065307617188, 0.025238990783691406, 0.027957916259765625, 0.030676841735839844, 0.03339576721191406, 0.03611469268798828, 0.0388336181640625, 0.04155254364013672, 0.04427146911621094, 0.046990394592285156, 0.049709320068359375, 0.052428245544433594, 0.05514717102050781, 0.05786609649658203, 0.06058502197265625, 0.06330394744873047, 0.06602287292480469, 0.0687417984008789, 0.07146072387695312, 0.07417964935302734, 0.07689857482910156, 0.07961750030517578, 0.08233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 11.0, 4.0, 6.0, 16.0, 14.0, 18.0, 11.0, 14.0, 17.0, 18.0, 26.0, 32.0, 24.0, 40.0, 35.0, 57.0, 48.0, 56.0, 50.0, 41.0, 45.0, 56.0, 35.0, 44.0, 39.0, 41.0, 34.0, 43.0, 21.0, 18.0, 10.0, 12.0, 13.0, 10.0, 10.0, 9.0, 2.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.49017333984375, -0.4739990234375, -0.45782470703125, -0.441650390625, -0.42547607421875, -0.4093017578125, -0.39312744140625, -0.376953125, -0.36077880859375, -0.3446044921875, -0.32843017578125, -0.312255859375, -0.29608154296875, -0.2799072265625, -0.26373291015625, -0.24755859375, -0.23138427734375, -0.2152099609375, -0.19903564453125, -0.182861328125, -0.16668701171875, -0.1505126953125, -0.13433837890625, -0.1181640625, -0.10198974609375, -0.0858154296875, -0.06964111328125, -0.053466796875, -0.03729248046875, -0.0211181640625, -0.00494384765625, 0.01123046875, 0.02740478515625, 0.0435791015625, 0.05975341796875, 0.075927734375, 0.09210205078125, 0.1082763671875, 0.12445068359375, 0.140625, 0.15679931640625, 0.1729736328125, 0.18914794921875, 0.205322265625, 0.22149658203125, 0.2376708984375, 0.25384521484375, 0.27001953125, 0.28619384765625, 0.3023681640625, 0.31854248046875, 0.334716796875, 0.35089111328125, 0.3670654296875, 0.38323974609375, 0.3994140625, 0.41558837890625, 0.4317626953125, 0.44793701171875, 0.464111328125, 0.48028564453125, 0.4964599609375, 0.51263427734375, 0.52880859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 19.0, 17.0, 37.0, 54.0, 93.0, 150.0, 320.0, 611.0, 1228.0, 3025.0, 9222.0, 44813.0, 379836.0, 523678.0, 66679.0, 12088.0, 3629.0, 1476.0, 699.0, 361.0, 191.0, 109.0, 59.0, 47.0, 26.0, 22.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.04046964645385742, -0.039282798767089844, -0.038095951080322266, -0.03690910339355469, -0.03572225570678711, -0.03453540802001953, -0.03334856033325195, -0.032161712646484375, -0.030974864959716797, -0.02978801727294922, -0.02860116958618164, -0.027414321899414062, -0.026227474212646484, -0.025040626525878906, -0.023853778839111328, -0.02266693115234375, -0.021480083465576172, -0.020293235778808594, -0.019106388092041016, -0.017919540405273438, -0.01673269271850586, -0.015545845031738281, -0.014358997344970703, -0.013172149658203125, -0.011985301971435547, -0.010798454284667969, -0.00961160659790039, -0.008424758911132812, -0.007237911224365234, -0.006051063537597656, -0.004864215850830078, -0.0036773681640625, -0.002490520477294922, -0.0013036727905273438, -0.00011682510375976562, 0.0010700225830078125, 0.0022568702697753906, 0.0034437179565429688, 0.004630565643310547, 0.005817413330078125, 0.007004261016845703, 0.008191108703613281, 0.00937795639038086, 0.010564804077148438, 0.011751651763916016, 0.012938499450683594, 0.014125347137451172, 0.01531219482421875, 0.016499042510986328, 0.017685890197753906, 0.018872737884521484, 0.020059585571289062, 0.02124643325805664, 0.02243328094482422, 0.023620128631591797, 0.024806976318359375, 0.025993824005126953, 0.02718067169189453, 0.02836751937866211, 0.029554367065429688, 0.030741214752197266, 0.031928062438964844, 0.03311491012573242, 0.0343017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 15.0, 8.0, 16.0, 34.0, 56.0, 87.0, 124.0, 138.0, 140.0, 133.0, 93.0, 52.0, 35.0, 24.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-05, -2.299528568983078e-05, -2.214871346950531e-05, -2.130214124917984e-05, -2.045556902885437e-05, -1.96089968085289e-05, -1.876242458820343e-05, -1.791585236787796e-05, -1.706928014755249e-05, -1.622270792722702e-05, -1.537613570690155e-05, -1.452956348657608e-05, -1.368299126625061e-05, -1.283641904592514e-05, -1.198984682559967e-05, -1.11432746052742e-05, -1.029670238494873e-05, -9.45013016462326e-06, -8.60355794429779e-06, -7.75698572397232e-06, -6.910413503646851e-06, -6.063841283321381e-06, -5.217269062995911e-06, -4.370696842670441e-06, -3.5241246223449707e-06, -2.6775524020195007e-06, -1.8309801816940308e-06, -9.844079613685608e-07, -1.3783574104309082e-07, 7.087364792823792e-07, 1.5553086996078491e-06, 2.401880919933319e-06, 3.248453140258789e-06, 4.095025360584259e-06, 4.941597580909729e-06, 5.788169801235199e-06, 6.634742021560669e-06, 7.481314241886139e-06, 8.327886462211609e-06, 9.174458682537079e-06, 1.0021030902862549e-05, 1.0867603123188019e-05, 1.1714175343513489e-05, 1.2560747563838959e-05, 1.3407319784164429e-05, 1.4253892004489899e-05, 1.5100464224815369e-05, 1.594703644514084e-05, 1.679360866546631e-05, 1.764018088579178e-05, 1.848675310611725e-05, 1.933332532644272e-05, 2.017989754676819e-05, 2.102646976709366e-05, 2.187304198741913e-05, 2.27196142077446e-05, 2.356618642807007e-05, 2.441275864839554e-05, 2.5259330868721008e-05, 2.6105903089046478e-05, 2.6952475309371948e-05, 2.7799047529697418e-05, 2.8645619750022888e-05, 2.9492191970348358e-05, 3.0338764190673828e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 13.0, 18.0, 22.0, 26.0, 44.0, 67.0, 146.0, 238.0, 431.0, 813.0, 1470.0, 3254.0, 8793.0, 33870.0, 169471.0, 545038.0, 223441.0, 43398.0, 10623.0, 3728.0, 1623.0, 815.0, 497.0, 280.0, 150.0, 94.0, 64.0, 36.0, 30.0, 17.0, 11.0, 8.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-0.03485107421875, -0.033843278884887695, -0.03283548355102539, -0.031827688217163086, -0.03081989288330078, -0.029812097549438477, -0.028804302215576172, -0.027796506881713867, -0.026788711547851562, -0.025780916213989258, -0.024773120880126953, -0.02376532554626465, -0.022757530212402344, -0.02174973487854004, -0.020741939544677734, -0.01973414421081543, -0.018726348876953125, -0.01771855354309082, -0.016710758209228516, -0.01570296287536621, -0.014695167541503906, -0.013687372207641602, -0.012679576873779297, -0.011671781539916992, -0.010663986206054688, -0.009656190872192383, -0.008648395538330078, -0.0076406002044677734, -0.006632804870605469, -0.005625009536743164, -0.004617214202880859, -0.0036094188690185547, -0.00260162353515625, -0.0015938282012939453, -0.0005860328674316406, 0.00042176246643066406, 0.0014295578002929688, 0.0024373531341552734, 0.003445148468017578, 0.004452943801879883, 0.0054607391357421875, 0.006468534469604492, 0.007476329803466797, 0.008484125137329102, 0.009491920471191406, 0.010499715805053711, 0.011507511138916016, 0.01251530647277832, 0.013523101806640625, 0.01453089714050293, 0.015538692474365234, 0.01654648780822754, 0.017554283142089844, 0.01856207847595215, 0.019569873809814453, 0.020577669143676758, 0.021585464477539062, 0.022593259811401367, 0.023601055145263672, 0.024608850479125977, 0.02561664581298828, 0.026624441146850586, 0.02763223648071289, 0.028640031814575195, 0.0296478271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 5.0, 8.0, 9.0, 11.0, 15.0, 19.0, 20.0, 35.0, 39.0, 56.0, 60.0, 100.0, 91.0, 76.0, 62.0, 72.0, 64.0, 60.0, 38.0, 34.0, 26.0, 25.0, 12.0, 13.0, 7.0, 9.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.01062774658203125, -0.01036381721496582, -0.01009988784790039, -0.009835958480834961, -0.009572029113769531, -0.009308099746704102, -0.009044170379638672, -0.008780241012573242, -0.008516311645507812, -0.008252382278442383, -0.007988452911376953, -0.0077245235443115234, -0.007460594177246094, -0.007196664810180664, -0.006932735443115234, -0.006668806076049805, -0.006404876708984375, -0.006140947341918945, -0.005877017974853516, -0.005613088607788086, -0.005349159240722656, -0.0050852298736572266, -0.004821300506591797, -0.004557371139526367, -0.0042934417724609375, -0.004029512405395508, -0.003765583038330078, -0.0035016536712646484, -0.0032377243041992188, -0.002973794937133789, -0.0027098655700683594, -0.0024459362030029297, -0.0021820068359375, -0.0019180774688720703, -0.0016541481018066406, -0.001390218734741211, -0.0011262893676757812, -0.0008623600006103516, -0.0005984306335449219, -0.0003345012664794922, -7.05718994140625e-05, 0.0001933574676513672, 0.0004572868347167969, 0.0007212162017822266, 0.0009851455688476562, 0.001249074935913086, 0.0015130043029785156, 0.0017769336700439453, 0.002040863037109375, 0.0023047924041748047, 0.0025687217712402344, 0.002832651138305664, 0.0030965805053710938, 0.0033605098724365234, 0.003624439239501953, 0.003888368606567383, 0.0041522979736328125, 0.004416227340698242, 0.004680156707763672, 0.0049440860748291016, 0.005208015441894531, 0.005471944808959961, 0.005735874176025391, 0.00599980354309082, 0.00626373291015625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 21.0, 25.0, 62.0, 73.0, 132.0, 177.0, 167.0, 149.0, 73.0, 64.0, 34.0, 11.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31661269068717957, -0.2956339716911316, -0.2746552526950836, -0.25367653369903564, -0.23269784450531006, -0.21171912550926208, -0.1907404065132141, -0.16976170241832733, -0.14878298342227936, -0.12780426442623138, -0.1068255603313446, -0.08584684133529663, -0.06486812978982925, -0.04388941824436188, -0.022910699248313904, -0.001931995153427124, 0.01904672384262085, 0.040025435388088226, 0.0610041506588459, 0.08198286592960358, 0.10296157747507095, 0.12394028902053833, 0.1449190080165863, 0.16589771211147308, 0.18687643110752106, 0.20785515010356903, 0.2288338541984558, 0.24981257319450378, 0.27079129219055176, 0.29176998138427734, 0.3127487301826477, 0.3337274193763733, 0.3547061085700989, 0.37568482756614685, 0.3966635465621948, 0.4176422357559204, 0.4386209547519684, 0.45959967374801636, 0.48057839274406433, 0.5015571117401123, 0.5225358009338379, 0.5435144901275635, 0.5644932389259338, 0.5854719281196594, 0.6064506769180298, 0.6274293661117554, 0.648408055305481, 0.6693868041038513, 0.6903655529022217, 0.7113442420959473, 0.7323229908943176, 0.7533016800880432, 0.7742804288864136, 0.7952591180801392, 0.8162378072738647, 0.8372165560722351, 0.8581952452659607, 0.8791739344596863, 0.9001526832580566, 0.9211313724517822, 0.9421101212501526, 0.9630888104438782, 0.9840675592422485, 1.0050462484359741, 1.0260249376296997]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 11.0, 14.0, 15.0, 22.0, 17.0, 19.0, 22.0, 32.0, 30.0, 41.0, 46.0, 57.0, 58.0, 52.0, 59.0, 53.0, 54.0, 58.0, 42.0, 40.0, 39.0, 38.0, 29.0, 29.0, 20.0, 24.0, 18.0, 10.0, 14.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25978797674179077, -0.25141122937202454, -0.2430344671010971, -0.23465770483016968, -0.22628095746040344, -0.2179042100906372, -0.20952744781970978, -0.20115068554878235, -0.1927739381790161, -0.18439719080924988, -0.17602042853832245, -0.16764366626739502, -0.15926691889762878, -0.15089017152786255, -0.14251340925693512, -0.1341366469860077, -0.12575989961624146, -0.11738314479589462, -0.10900638997554779, -0.10062963515520096, -0.09225288033485413, -0.0838761255145073, -0.07549937069416046, -0.06712261587381363, -0.0587458610534668, -0.050369106233119965, -0.04199235141277313, -0.0336155965924263, -0.025238841772079468, -0.016862086951732635, -0.008485332131385803, -0.00010857731103897095, 0.008268177509307861, 0.016644932329654694, 0.025021687150001526, 0.03339844197034836, 0.04177519679069519, 0.05015195161104202, 0.058528706431388855, 0.06690546125173569, 0.07528221607208252, 0.08365897089242935, 0.09203572571277618, 0.10041248053312302, 0.10878923535346985, 0.11716599017381668, 0.1255427449941635, 0.13391950726509094, 0.14229625463485718, 0.1506730020046234, 0.15904976427555084, 0.16742652654647827, 0.1758032739162445, 0.18418002128601074, 0.19255678355693817, 0.2009335458278656, 0.20931029319763184, 0.21768704056739807, 0.2260638028383255, 0.23444056510925293, 0.24281731247901917, 0.2511940598487854, 0.259570837020874, 0.26794758439064026, 0.2763243317604065]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 10.0, 12.0, 7.0, 29.0, 22.0, 40.0, 72.0, 107.0, 171.0, 274.0, 537.0, 1031.0, 2020.0, 4444.0, 10585.0, 29835.0, 117059.0, 681518.0, 144236.0, 34883.0, 11996.0, 4858.0, 2253.0, 1192.0, 601.0, 313.0, 159.0, 98.0, 62.0, 40.0, 28.0, 11.0, 14.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.323760986328125, -0.31109619140625, -0.298431396484375, -0.2857666015625, -0.273101806640625, -0.26043701171875, -0.247772216796875, -0.235107421875, -0.222442626953125, -0.20977783203125, -0.197113037109375, -0.1844482421875, -0.171783447265625, -0.15911865234375, -0.146453857421875, -0.1337890625, -0.121124267578125, -0.10845947265625, -0.095794677734375, -0.0831298828125, -0.070465087890625, -0.05780029296875, -0.045135498046875, -0.032470703125, -0.019805908203125, -0.00714111328125, 0.005523681640625, 0.0181884765625, 0.030853271484375, 0.04351806640625, 0.056182861328125, 0.06884765625, 0.081512451171875, 0.09417724609375, 0.106842041015625, 0.1195068359375, 0.132171630859375, 0.14483642578125, 0.157501220703125, 0.170166015625, 0.182830810546875, 0.19549560546875, 0.208160400390625, 0.2208251953125, 0.233489990234375, 0.24615478515625, 0.258819580078125, 0.271484375, 0.284149169921875, 0.29681396484375, 0.309478759765625, 0.3221435546875, 0.334808349609375, 0.34747314453125, 0.360137939453125, 0.372802734375, 0.385467529296875, 0.39813232421875, 0.410797119140625, 0.4234619140625, 0.436126708984375, 0.44879150390625, 0.461456298828125, 0.47412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 3.0, 11.0, 15.0, 26.0, 34.0, 36.0, 47.0, 56.0, 86.0, 93.0, 82.0, 82.0, 105.0, 68.0, 55.0, 56.0, 43.0, 31.0, 30.0, 14.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.47954559326171875, -0.4556732177734375, -0.43180084228515625, -0.407928466796875, -0.38405609130859375, -0.3601837158203125, -0.33631134033203125, -0.31243896484375, -0.28856658935546875, -0.2646942138671875, -0.24082183837890625, -0.216949462890625, -0.19307708740234375, -0.1692047119140625, -0.14533233642578125, -0.1214599609375, -0.09758758544921875, -0.0737152099609375, -0.04984283447265625, -0.025970458984375, -0.00209808349609375, 0.0217742919921875, 0.04564666748046875, 0.06951904296875, 0.09339141845703125, 0.1172637939453125, 0.14113616943359375, 0.165008544921875, 0.18888092041015625, 0.2127532958984375, 0.23662567138671875, 0.260498046875, 0.28437042236328125, 0.3082427978515625, 0.33211517333984375, 0.355987548828125, 0.37985992431640625, 0.4037322998046875, 0.42760467529296875, 0.45147705078125, 0.47534942626953125, 0.4992218017578125, 0.5230941772460938, 0.546966552734375, 0.5708389282226562, 0.5947113037109375, 0.6185836791992188, 0.6424560546875, 0.6663284301757812, 0.6902008056640625, 0.7140731811523438, 0.737945556640625, 0.7618179321289062, 0.7856903076171875, 0.8095626831054688, 0.83343505859375, 0.8573074340820312, 0.8811798095703125, 0.9050521850585938, 0.928924560546875, 0.9527969360351562, 0.9766693115234375, 1.0005416870117188, 1.0244140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 13.0, 10.0, 13.0, 17.0, 17.0, 25.0, 39.0, 40.0, 63.0, 93.0, 136.0, 251.0, 555.0, 1896.0, 11908.0, 184246.0, 818668.0, 25520.0, 3351.0, 826.0, 304.0, 145.0, 112.0, 74.0, 38.0, 42.0, 31.0, 28.0, 14.0, 20.0, 4.0, 10.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.762481689453125, -0.73541259765625, -0.708343505859375, -0.6812744140625, -0.654205322265625, -0.62713623046875, -0.600067138671875, -0.572998046875, -0.545928955078125, -0.51885986328125, -0.491790771484375, -0.4647216796875, -0.437652587890625, -0.41058349609375, -0.383514404296875, -0.3564453125, -0.329376220703125, -0.30230712890625, -0.275238037109375, -0.2481689453125, -0.221099853515625, -0.19403076171875, -0.166961669921875, -0.139892578125, -0.112823486328125, -0.08575439453125, -0.058685302734375, -0.0316162109375, -0.004547119140625, 0.02252197265625, 0.049591064453125, 0.07666015625, 0.103729248046875, 0.13079833984375, 0.157867431640625, 0.1849365234375, 0.212005615234375, 0.23907470703125, 0.266143798828125, 0.293212890625, 0.320281982421875, 0.34735107421875, 0.374420166015625, 0.4014892578125, 0.428558349609375, 0.45562744140625, 0.482696533203125, 0.509765625, 0.536834716796875, 0.56390380859375, 0.590972900390625, 0.6180419921875, 0.645111083984375, 0.67218017578125, 0.699249267578125, 0.726318359375, 0.753387451171875, 0.78045654296875, 0.807525634765625, 0.8345947265625, 0.861663818359375, 0.88873291015625, 0.915802001953125, 0.94287109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 7.0, 12.0, 10.0, 14.0, 19.0, 21.0, 23.0, 29.0, 36.0, 31.0, 43.0, 58.0, 47.0, 43.0, 46.0, 53.0, 50.0, 52.0, 39.0, 46.0, 47.0, 41.0, 38.0, 23.0, 26.0, 19.0, 18.0, 19.0, 13.0, 12.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.51116943359375, -0.4945068359375, -0.47784423828125, -0.461181640625, -0.44451904296875, -0.4278564453125, -0.41119384765625, -0.39453125, -0.37786865234375, -0.3612060546875, -0.34454345703125, -0.327880859375, -0.31121826171875, -0.2945556640625, -0.27789306640625, -0.26123046875, -0.24456787109375, -0.2279052734375, -0.21124267578125, -0.194580078125, -0.17791748046875, -0.1612548828125, -0.14459228515625, -0.1279296875, -0.11126708984375, -0.0946044921875, -0.07794189453125, -0.061279296875, -0.04461669921875, -0.0279541015625, -0.01129150390625, 0.00537109375, 0.02203369140625, 0.0386962890625, 0.05535888671875, 0.072021484375, 0.08868408203125, 0.1053466796875, 0.12200927734375, 0.138671875, 0.15533447265625, 0.1719970703125, 0.18865966796875, 0.205322265625, 0.22198486328125, 0.2386474609375, 0.25531005859375, 0.27197265625, 0.28863525390625, 0.3052978515625, 0.32196044921875, 0.338623046875, 0.35528564453125, 0.3719482421875, 0.38861083984375, 0.4052734375, 0.42193603515625, 0.4385986328125, 0.45526123046875, 0.471923828125, 0.48858642578125, 0.5052490234375, 0.52191162109375, 0.53857421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 27.0, 29.0, 40.0, 110.0, 185.0, 367.0, 1112.0, 4477.0, 34412.0, 875485.0, 119417.0, 9939.0, 1885.0, 528.0, 237.0, 123.0, 49.0, 42.0, 27.0, 13.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2010498046875, -0.1929149627685547, -0.18478012084960938, -0.17664527893066406, -0.16851043701171875, -0.16037559509277344, -0.15224075317382812, -0.1441059112548828, -0.1359710693359375, -0.1278362274169922, -0.11970138549804688, -0.11156654357910156, -0.10343170166015625, -0.09529685974121094, -0.08716201782226562, -0.07902717590332031, -0.070892333984375, -0.06275749206542969, -0.054622650146484375, -0.04648780822753906, -0.03835296630859375, -0.030218124389648438, -0.022083282470703125, -0.013948440551757812, -0.0058135986328125, 0.0023212432861328125, 0.010456085205078125, 0.018590927124023438, 0.02672576904296875, 0.03486061096191406, 0.042995452880859375, 0.05113029479980469, 0.05926513671875, 0.06739997863769531, 0.07553482055664062, 0.08366966247558594, 0.09180450439453125, 0.09993934631347656, 0.10807418823242188, 0.11620903015136719, 0.1243438720703125, 0.1324787139892578, 0.14061355590820312, 0.14874839782714844, 0.15688323974609375, 0.16501808166503906, 0.17315292358398438, 0.1812877655029297, 0.189422607421875, 0.1975574493408203, 0.20569229125976562, 0.21382713317871094, 0.22196197509765625, 0.23009681701660156, 0.23823165893554688, 0.2463665008544922, 0.2545013427734375, 0.2626361846923828, 0.2707710266113281, 0.27890586853027344, 0.28704071044921875, 0.29517555236816406, 0.3033103942871094, 0.3114452362060547, 0.319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 8.0, 7.0, 12.0, 25.0, 26.0, 45.0, 66.0, 140.0, 254.0, 167.0, 77.0, 42.0, 46.0, 25.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3558735847473145e-05, -2.256035804748535e-05, -2.156198024749756e-05, -2.0563602447509766e-05, -1.9565224647521973e-05, -1.856684684753418e-05, -1.7568469047546387e-05, -1.6570091247558594e-05, -1.55717134475708e-05, -1.4573335647583008e-05, -1.3574957847595215e-05, -1.2576580047607422e-05, -1.1578202247619629e-05, -1.0579824447631836e-05, -9.581446647644043e-06, -8.58306884765625e-06, -7.584691047668457e-06, -6.586313247680664e-06, -5.587935447692871e-06, -4.589557647705078e-06, -3.591179847717285e-06, -2.592802047729492e-06, -1.5944242477416992e-06, -5.960464477539062e-07, 4.023313522338867e-07, 1.4007091522216797e-06, 2.3990869522094727e-06, 3.3974647521972656e-06, 4.395842552185059e-06, 5.3942203521728516e-06, 6.3925981521606445e-06, 7.3909759521484375e-06, 8.38935375213623e-06, 9.387731552124023e-06, 1.0386109352111816e-05, 1.138448715209961e-05, 1.2382864952087402e-05, 1.3381242752075195e-05, 1.4379620552062988e-05, 1.537799835205078e-05, 1.6376376152038574e-05, 1.7374753952026367e-05, 1.837313175201416e-05, 1.9371509552001953e-05, 2.0369887351989746e-05, 2.136826515197754e-05, 2.2366642951965332e-05, 2.3365020751953125e-05, 2.4363398551940918e-05, 2.536177635192871e-05, 2.6360154151916504e-05, 2.7358531951904297e-05, 2.835690975189209e-05, 2.9355287551879883e-05, 3.0353665351867676e-05, 3.135204315185547e-05, 3.235042095184326e-05, 3.3348798751831055e-05, 3.434717655181885e-05, 3.534555435180664e-05, 3.6343932151794434e-05, 3.7342309951782227e-05, 3.834068775177002e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 16.0, 23.0, 36.0, 73.0, 100.0, 194.0, 336.0, 721.0, 1865.0, 8157.0, 85213.0, 884771.0, 57695.0, 6366.0, 1583.0, 634.0, 304.0, 186.0, 95.0, 59.0, 42.0, 23.0, 10.0, 9.0, 2.0, 10.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.3154296875, -0.3074302673339844, -0.29943084716796875, -0.2914314270019531, -0.2834320068359375, -0.2754325866699219, -0.26743316650390625, -0.2594337463378906, -0.251434326171875, -0.24343490600585938, -0.23543548583984375, -0.22743606567382812, -0.2194366455078125, -0.21143722534179688, -0.20343780517578125, -0.19543838500976562, -0.18743896484375, -0.17943954467773438, -0.17144012451171875, -0.16344070434570312, -0.1554412841796875, -0.14744186401367188, -0.13944244384765625, -0.13144302368164062, -0.123443603515625, -0.11544418334960938, -0.10744476318359375, -0.09944534301757812, -0.0914459228515625, -0.08344650268554688, -0.07544708251953125, -0.06744766235351562, -0.0594482421875, -0.051448822021484375, -0.04344940185546875, -0.035449981689453125, -0.0274505615234375, -0.019451141357421875, -0.01145172119140625, -0.003452301025390625, 0.004547119140625, 0.012546539306640625, 0.02054595947265625, 0.028545379638671875, 0.0365447998046875, 0.044544219970703125, 0.05254364013671875, 0.060543060302734375, 0.06854248046875, 0.07654190063476562, 0.08454132080078125, 0.09254074096679688, 0.1005401611328125, 0.10853958129882812, 0.11653900146484375, 0.12453842163085938, 0.132537841796875, 0.14053726196289062, 0.14853668212890625, 0.15653610229492188, 0.1645355224609375, 0.17253494262695312, 0.18053436279296875, 0.18853378295898438, 0.196533203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 2.0, 13.0, 13.0, 11.0, 9.0, 28.0, 18.0, 30.0, 35.0, 56.0, 71.0, 158.0, 193.0, 97.0, 55.0, 39.0, 27.0, 34.0, 24.0, 19.0, 14.0, 11.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045318603515625, -0.04343843460083008, -0.041558265686035156, -0.039678096771240234, -0.03779792785644531, -0.03591775894165039, -0.03403759002685547, -0.03215742111206055, -0.030277252197265625, -0.028397083282470703, -0.02651691436767578, -0.02463674545288086, -0.022756576538085938, -0.020876407623291016, -0.018996238708496094, -0.017116069793701172, -0.01523590087890625, -0.013355731964111328, -0.011475563049316406, -0.009595394134521484, -0.0077152252197265625, -0.005835056304931641, -0.003954887390136719, -0.002074718475341797, -0.000194549560546875, 0.0016856193542480469, 0.0035657882690429688, 0.005445957183837891, 0.0073261260986328125, 0.009206295013427734, 0.011086463928222656, 0.012966632843017578, 0.0148468017578125, 0.016726970672607422, 0.018607139587402344, 0.020487308502197266, 0.022367477416992188, 0.02424764633178711, 0.02612781524658203, 0.028007984161376953, 0.029888153076171875, 0.0317683219909668, 0.03364849090576172, 0.03552865982055664, 0.03740882873535156, 0.039288997650146484, 0.041169166564941406, 0.04304933547973633, 0.04492950439453125, 0.04680967330932617, 0.048689842224121094, 0.050570011138916016, 0.05245018005371094, 0.05433034896850586, 0.05621051788330078, 0.0580906867980957, 0.059970855712890625, 0.06185102462768555, 0.06373119354248047, 0.06561136245727539, 0.06749153137207031, 0.06937170028686523, 0.07125186920166016, 0.07313203811645508, 0.07501220703125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 24.0, 52.0, 161.0, 318.0, 259.0, 132.0, 35.0, 19.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35728853940963745, -0.2844151258468628, -0.21154168248176575, -0.1386682540178299, -0.06579482555389404, 0.007078588008880615, 0.07995203137397766, 0.1528254747390747, 0.22569888830184937, 0.298572301864624, 0.37144574522972107, 0.4443191885948181, 0.5171926021575928, 0.5900660157203674, 0.6629394292831421, 0.7358129024505615, 0.8086863160133362, 0.8815597295761108, 0.9544332027435303, 1.0273065567016602, 1.1001800298690796, 1.173053503036499, 1.245926856994629, 1.3188003301620483, 1.3916738033294678, 1.4645472764968872, 1.537420630455017, 1.6102941036224365, 1.6831674575805664, 1.7560409307479858, 1.8289144039154053, 1.9017877578735352, 1.9746613502502441, 2.047534704208374, 2.120408296585083, 2.193281650543213, 2.2661550045013428, 2.3390283584594727, 2.4119019508361816, 2.4847753047943115, 2.5576486587524414, 2.6305220127105713, 2.7033956050872803, 2.77626895904541, 2.84914231300354, 2.92201566696167, 2.994889259338379, 3.067762613296509, 3.1406362056732178, 3.2135095596313477, 3.2863831520080566, 3.3592565059661865, 3.4321298599243164, 3.5050034523010254, 3.5778768062591553, 3.650750160217285, 3.723623752593994, 3.796497106552124, 3.869370698928833, 3.942244052886963, 4.015117645263672, 4.087990760803223, 4.160864353179932, 4.233737945556641, 4.306611061096191]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 26.0, 19.0, 20.0, 26.0, 27.0, 28.0, 34.0, 37.0, 41.0, 39.0, 50.0, 48.0, 42.0, 48.0, 55.0, 46.0, 49.0, 50.0, 33.0, 36.0, 25.0, 28.0, 35.0, 20.0, 21.0, 11.0, 13.0, 9.0, 13.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7250390648841858, -0.6977466344833374, -0.6704542636871338, -0.6431618332862854, -0.615869402885437, -0.5885770320892334, -0.561284601688385, -0.5339921712875366, -0.506699800491333, -0.479407399892807, -0.452114999294281, -0.4248225688934326, -0.3975301682949066, -0.3702377676963806, -0.3429453372955322, -0.3156529366970062, -0.2883605360984802, -0.2610681354999542, -0.23377572000026703, -0.20648330450057983, -0.17919090390205383, -0.15189850330352783, -0.12460608780384064, -0.09731367230415344, -0.07002127170562744, -0.042728863656520844, -0.015436455607414246, 0.011855952441692352, 0.03914836049079895, 0.06644076108932495, 0.09373317658901215, 0.12102559208869934, 0.14831793308258057, 0.17561033368110657, 0.20290274918079376, 0.23019516468048096, 0.25748756527900696, 0.28477996587753296, 0.31207239627838135, 0.33936479687690735, 0.36665719747543335, 0.39394959807395935, 0.42124199867248535, 0.44853442907333374, 0.47582682967185974, 0.5031192302703857, 0.5304116606712341, 0.5577040910720825, 0.5849964618682861, 0.6122888922691345, 0.6395812630653381, 0.6668736934661865, 0.6941660642623901, 0.7214584946632385, 0.7487509250640869, 0.7760432958602905, 0.8033357262611389, 0.8306281566619873, 0.8579205274581909, 0.8852129578590393, 0.9125053882598877, 0.9397977590560913, 0.9670901894569397, 0.9943826198577881, 1.0216749906539917]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 25.0, 36.0, 85.0, 139.0, 288.0, 584.0, 1489.0, 5168.0, 28102.0, 814403.0, 3238712.0, 90786.0, 10295.0, 2447.0, 921.0, 378.0, 193.0, 90.0, 50.0, 29.0, 15.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.8034515380859375, -0.779266357421875, -0.7550811767578125, -0.73089599609375, -0.7067108154296875, -0.682525634765625, -0.6583404541015625, -0.6341552734375, -0.6099700927734375, -0.585784912109375, -0.5615997314453125, -0.53741455078125, -0.5132293701171875, -0.489044189453125, -0.4648590087890625, -0.440673828125, -0.4164886474609375, -0.392303466796875, -0.3681182861328125, -0.34393310546875, -0.3197479248046875, -0.295562744140625, -0.2713775634765625, -0.2471923828125, -0.2230072021484375, -0.198822021484375, -0.1746368408203125, -0.15045166015625, -0.1262664794921875, -0.102081298828125, -0.0778961181640625, -0.0537109375, -0.0295257568359375, -0.005340576171875, 0.0188446044921875, 0.04302978515625, 0.0672149658203125, 0.091400146484375, 0.1155853271484375, 0.1397705078125, 0.1639556884765625, 0.188140869140625, 0.2123260498046875, 0.23651123046875, 0.2606964111328125, 0.284881591796875, 0.3090667724609375, 0.333251953125, 0.3574371337890625, 0.381622314453125, 0.4058074951171875, 0.42999267578125, 0.4541778564453125, 0.478363037109375, 0.5025482177734375, 0.5267333984375, 0.5509185791015625, 0.575103759765625, 0.5992889404296875, 0.62347412109375, 0.6476593017578125, 0.671844482421875, 0.6960296630859375, 0.72021484375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 2.0, 11.0, 15.0, 14.0, 16.0, 15.0, 18.0, 26.0, 27.0, 24.0, 31.0, 44.0, 41.0, 46.0, 37.0, 50.0, 47.0, 42.0, 42.0, 41.0, 43.0, 52.0, 39.0, 30.0, 33.0, 30.0, 26.0, 25.0, 13.0, 19.0, 14.0, 16.0, 8.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.252197265625, -0.24477386474609375, -0.2373504638671875, -0.22992706298828125, -0.222503662109375, -0.21508026123046875, -0.2076568603515625, -0.20023345947265625, -0.19281005859375, -0.18538665771484375, -0.1779632568359375, -0.17053985595703125, -0.163116455078125, -0.15569305419921875, -0.1482696533203125, -0.14084625244140625, -0.1334228515625, -0.12599945068359375, -0.1185760498046875, -0.11115264892578125, -0.103729248046875, -0.09630584716796875, -0.0888824462890625, -0.08145904541015625, -0.07403564453125, -0.06661224365234375, -0.0591888427734375, -0.05176544189453125, -0.044342041015625, -0.03691864013671875, -0.0294952392578125, -0.02207183837890625, -0.0146484375, -0.00722503662109375, 0.0001983642578125, 0.00762176513671875, 0.015045166015625, 0.02246856689453125, 0.0298919677734375, 0.03731536865234375, 0.04473876953125, 0.05216217041015625, 0.0595855712890625, 0.06700897216796875, 0.074432373046875, 0.08185577392578125, 0.0892791748046875, 0.09670257568359375, 0.1041259765625, 0.11154937744140625, 0.1189727783203125, 0.12639617919921875, 0.133819580078125, 0.14124298095703125, 0.1486663818359375, 0.15608978271484375, 0.16351318359375, 0.17093658447265625, 0.1783599853515625, 0.18578338623046875, 0.193206787109375, 0.20063018798828125, 0.2080535888671875, 0.21547698974609375, 0.222900390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 11.0, 11.0, 9.0, 27.0, 44.0, 45.0, 75.0, 205.0, 503.0, 1676.0, 9685.0, 293513.0, 3848566.0, 34818.0, 3592.0, 872.0, 307.0, 153.0, 65.0, 36.0, 16.0, 14.0, 7.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.26171875, -1.2237701416015625, -1.185821533203125, -1.1478729248046875, -1.10992431640625, -1.0719757080078125, -1.034027099609375, -0.9960784912109375, -0.9581298828125, -0.9201812744140625, -0.882232666015625, -0.8442840576171875, -0.80633544921875, -0.7683868408203125, -0.730438232421875, -0.6924896240234375, -0.654541015625, -0.6165924072265625, -0.578643798828125, -0.5406951904296875, -0.50274658203125, -0.4647979736328125, -0.426849365234375, -0.3889007568359375, -0.3509521484375, -0.3130035400390625, -0.275054931640625, -0.2371063232421875, -0.19915771484375, -0.1612091064453125, -0.123260498046875, -0.0853118896484375, -0.04736328125, -0.0094146728515625, 0.028533935546875, 0.0664825439453125, 0.10443115234375, 0.1423797607421875, 0.180328369140625, 0.2182769775390625, 0.2562255859375, 0.2941741943359375, 0.332122802734375, 0.3700714111328125, 0.40802001953125, 0.4459686279296875, 0.483917236328125, 0.5218658447265625, 0.559814453125, 0.5977630615234375, 0.635711669921875, 0.6736602783203125, 0.71160888671875, 0.7495574951171875, 0.787506103515625, 0.8254547119140625, 0.8634033203125, 0.9013519287109375, 0.939300537109375, 0.9772491455078125, 1.01519775390625, 1.0531463623046875, 1.091094970703125, 1.1290435791015625, 1.1669921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 11.0, 13.0, 15.0, 28.0, 27.0, 55.0, 90.0, 142.0, 264.0, 423.0, 595.0, 759.0, 619.0, 358.0, 231.0, 134.0, 89.0, 50.0, 33.0, 39.0, 14.0, 7.0, 10.0, 8.0, 10.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14686012268066406, -0.14186477661132812, -0.1368694305419922, -0.13187408447265625, -0.1268787384033203, -0.12188339233398438, -0.11688804626464844, -0.1118927001953125, -0.10689735412597656, -0.10190200805664062, -0.09690666198730469, -0.09191131591796875, -0.08691596984863281, -0.08192062377929688, -0.07692527770996094, -0.071929931640625, -0.06693458557128906, -0.061939239501953125, -0.05694389343261719, -0.05194854736328125, -0.04695320129394531, -0.041957855224609375, -0.03696250915527344, -0.0319671630859375, -0.026971817016601562, -0.021976470947265625, -0.016981124877929688, -0.01198577880859375, -0.0069904327392578125, -0.001995086669921875, 0.0030002593994140625, 0.00799560546875, 0.012990951538085938, 0.017986297607421875, 0.022981643676757812, 0.02797698974609375, 0.03297233581542969, 0.037967681884765625, 0.04296302795410156, 0.0479583740234375, 0.05295372009277344, 0.057949066162109375, 0.06294441223144531, 0.06793975830078125, 0.07293510437011719, 0.07793045043945312, 0.08292579650878906, 0.087921142578125, 0.09291648864746094, 0.09791183471679688, 0.10290718078613281, 0.10790252685546875, 0.11289787292480469, 0.11789321899414062, 0.12288856506347656, 0.1278839111328125, 0.13287925720214844, 0.13787460327148438, 0.1428699493408203, 0.14786529541015625, 0.1528606414794922, 0.15785598754882812, 0.16285133361816406, 0.1678466796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 6.0, 11.0, 3.0, 16.0, 12.0, 22.0, 24.0, 31.0, 34.0, 36.0, 44.0, 58.0, 75.0, 65.0, 75.0, 55.0, 75.0, 59.0, 68.0, 34.0, 38.0, 31.0, 28.0, 30.0, 20.0, 10.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.5012553334236145, -0.48900681734085083, -0.47675830125808716, -0.4645098149776459, -0.4522612988948822, -0.44001278281211853, -0.42776426672935486, -0.4155157804489136, -0.4032672643661499, -0.39101874828338623, -0.37877023220062256, -0.3665217459201813, -0.3542732298374176, -0.34202471375465393, -0.32977619767189026, -0.317527711391449, -0.3052791953086853, -0.29303067922592163, -0.28078216314315796, -0.2685336768627167, -0.256285160779953, -0.24403664469718933, -0.23178812861442566, -0.21953962743282318, -0.20729109644889832, -0.19504258036613464, -0.18279407918453217, -0.1705455631017685, -0.15829706192016602, -0.14604854583740234, -0.13380002975463867, -0.1215515285730362, -0.10930302739143372, -0.09705451875925064, -0.08480601012706757, -0.0725574940443039, -0.06030898913741112, -0.04806048050522804, -0.03581196814775467, -0.023563459515571594, -0.01131495088338852, 0.0009335586801171303, 0.01318206824362278, 0.025430578738451004, 0.03767908737063408, 0.049927596002817154, 0.06217610836029053, 0.0744246169924736, 0.08667312562465668, 0.09892163425683975, 0.11117014288902283, 0.1234186589717865, 0.13566716015338898, 0.14791567623615265, 0.16016417741775513, 0.1724126935005188, 0.18466120958328247, 0.19690972566604614, 0.20915822684764862, 0.2214067429304123, 0.23365524411201477, 0.24590376019477844, 0.2581522762775421, 0.2704007625579834, 0.28264927864074707]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 16.0, 20.0, 28.0, 20.0, 20.0, 34.0, 41.0, 32.0, 36.0, 30.0, 39.0, 35.0, 45.0, 42.0, 40.0, 41.0, 40.0, 39.0, 28.0, 38.0, 26.0, 34.0, 26.0, 25.0, 18.0, 24.0, 14.0, 10.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29343488812446594, -0.28508466482162476, -0.27673447132110596, -0.26838427782058716, -0.26003405451774597, -0.2516838312149048, -0.243333637714386, -0.234983429312706, -0.226633220911026, -0.218283012509346, -0.20993280410766602, -0.20158259570598602, -0.19323238730430603, -0.18488217890262604, -0.17653197050094604, -0.16818176209926605, -0.15983155369758606, -0.15148134529590607, -0.14313113689422607, -0.13478092849254608, -0.1264307200908661, -0.1180805116891861, -0.1097303032875061, -0.10138009488582611, -0.09302988648414612, -0.08467967808246613, -0.07632946968078613, -0.06797926127910614, -0.05962905287742615, -0.051278844475746155, -0.04292863607406616, -0.03457842767238617, -0.02622818946838379, -0.017877981066703796, -0.009527772665023804, -0.001177564263343811, 0.007172644138336182, 0.015522852540016174, 0.023873060941696167, 0.03222326934337616, 0.04057347774505615, 0.048923686146736145, 0.05727389454841614, 0.06562410295009613, 0.07397431135177612, 0.08232451975345612, 0.09067472815513611, 0.0990249365568161, 0.1073751449584961, 0.11572535336017609, 0.12407556176185608, 0.13242577016353607, 0.14077597856521606, 0.14912618696689606, 0.15747639536857605, 0.16582660377025604, 0.17417681217193604, 0.18252702057361603, 0.19087722897529602, 0.199227437376976, 0.207577645778656, 0.215927854180336, 0.224278062582016, 0.23262827098369598, 0.24097847938537598]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 10.0, 7.0, 22.0, 33.0, 59.0, 86.0, 113.0, 179.0, 271.0, 411.0, 664.0, 1044.0, 1578.0, 2627.0, 4698.0, 8145.0, 16173.0, 46722.0, 231198.0, 534816.0, 137593.0, 32196.0, 12892.0, 6733.0, 3944.0, 2360.0, 1484.0, 906.0, 571.0, 343.0, 218.0, 145.0, 79.0, 80.0, 54.0, 22.0, 14.0, 17.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12066650390625, -0.11704826354980469, -0.11343002319335938, -0.10981178283691406, -0.10619354248046875, -0.10257530212402344, -0.09895706176757812, -0.09533882141113281, -0.0917205810546875, -0.08810234069824219, -0.08448410034179688, -0.08086585998535156, -0.07724761962890625, -0.07362937927246094, -0.07001113891601562, -0.06639289855957031, -0.062774658203125, -0.05915641784667969, -0.055538177490234375, -0.05191993713378906, -0.04830169677734375, -0.04468345642089844, -0.041065216064453125, -0.03744697570800781, -0.0338287353515625, -0.030210494995117188, -0.026592254638671875, -0.022974014282226562, -0.01935577392578125, -0.015737533569335938, -0.012119293212890625, -0.008501052856445312, -0.0048828125, -0.0012645721435546875, 0.002353668212890625, 0.0059719085693359375, 0.00959014892578125, 0.013208389282226562, 0.016826629638671875, 0.020444869995117188, 0.0240631103515625, 0.027681350708007812, 0.031299591064453125, 0.03491783142089844, 0.03853607177734375, 0.04215431213378906, 0.045772552490234375, 0.04939079284667969, 0.053009033203125, 0.05662727355957031, 0.060245513916015625, 0.06386375427246094, 0.06748199462890625, 0.07110023498535156, 0.07471847534179688, 0.07833671569824219, 0.0819549560546875, 0.08557319641113281, 0.08919143676757812, 0.09280967712402344, 0.09642791748046875, 0.10004615783691406, 0.10366439819335938, 0.10728263854980469, 0.11090087890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 14.0, 15.0, 13.0, 19.0, 30.0, 20.0, 38.0, 42.0, 32.0, 33.0, 33.0, 38.0, 53.0, 35.0, 42.0, 46.0, 38.0, 43.0, 50.0, 39.0, 39.0, 31.0, 35.0, 28.0, 18.0, 16.0, 17.0, 15.0, 15.0, 12.0, 7.0, 10.0, 8.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.17919921875, -0.17395401000976562, -0.16870880126953125, -0.16346359252929688, -0.1582183837890625, -0.15297317504882812, -0.14772796630859375, -0.14248275756835938, -0.137237548828125, -0.13199234008789062, -0.12674713134765625, -0.12150192260742188, -0.1162567138671875, -0.11101150512695312, -0.10576629638671875, -0.10052108764648438, -0.09527587890625, -0.09003067016601562, -0.08478546142578125, -0.07954025268554688, -0.0742950439453125, -0.06904983520507812, -0.06380462646484375, -0.058559417724609375, -0.053314208984375, -0.048069000244140625, -0.04282379150390625, -0.037578582763671875, -0.0323333740234375, -0.027088165283203125, -0.02184295654296875, -0.016597747802734375, -0.0113525390625, -0.006107330322265625, -0.00086212158203125, 0.004383087158203125, 0.0096282958984375, 0.014873504638671875, 0.02011871337890625, 0.025363922119140625, 0.030609130859375, 0.035854339599609375, 0.04109954833984375, 0.046344757080078125, 0.0515899658203125, 0.056835174560546875, 0.06208038330078125, 0.06732559204101562, 0.07257080078125, 0.07781600952148438, 0.08306121826171875, 0.08830642700195312, 0.0935516357421875, 0.09879684448242188, 0.10404205322265625, 0.10928726196289062, 0.114532470703125, 0.11977767944335938, 0.12502288818359375, 0.13026809692382812, 0.1355133056640625, 0.14075851440429688, 0.14600372314453125, 0.15124893188476562, 0.156494140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 7.0, 16.0, 35.0, 31.0, 51.0, 60.0, 113.0, 166.0, 309.0, 462.0, 793.0, 1533.0, 3271.0, 7348.0, 19212.0, 68785.0, 321895.0, 458665.0, 118339.0, 28540.0, 10060.0, 4314.0, 1988.0, 1082.0, 604.0, 310.0, 191.0, 137.0, 75.0, 40.0, 29.0, 24.0, 13.0, 10.0, 4.0, 6.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08935546875, -0.08681488037109375, -0.0842742919921875, -0.08173370361328125, -0.079193115234375, -0.07665252685546875, -0.0741119384765625, -0.07157135009765625, -0.06903076171875, -0.06649017333984375, -0.0639495849609375, -0.06140899658203125, -0.058868408203125, -0.05632781982421875, -0.0537872314453125, -0.05124664306640625, -0.0487060546875, -0.04616546630859375, -0.0436248779296875, -0.04108428955078125, -0.038543701171875, -0.03600311279296875, -0.0334625244140625, -0.03092193603515625, -0.02838134765625, -0.02584075927734375, -0.0233001708984375, -0.02075958251953125, -0.018218994140625, -0.01567840576171875, -0.0131378173828125, -0.01059722900390625, -0.008056640625, -0.00551605224609375, -0.0029754638671875, -0.00043487548828125, 0.002105712890625, 0.00464630126953125, 0.0071868896484375, 0.00972747802734375, 0.01226806640625, 0.01480865478515625, 0.0173492431640625, 0.01988983154296875, 0.022430419921875, 0.02497100830078125, 0.0275115966796875, 0.03005218505859375, 0.0325927734375, 0.03513336181640625, 0.0376739501953125, 0.04021453857421875, 0.042755126953125, 0.04529571533203125, 0.0478363037109375, 0.05037689208984375, 0.05291748046875, 0.05545806884765625, 0.0579986572265625, 0.06053924560546875, 0.063079833984375, 0.06562042236328125, 0.0681610107421875, 0.07070159912109375, 0.0732421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 15.0, 9.0, 16.0, 22.0, 17.0, 17.0, 19.0, 25.0, 21.0, 27.0, 28.0, 26.0, 40.0, 30.0, 33.0, 29.0, 41.0, 45.0, 40.0, 49.0, 40.0, 41.0, 39.0, 37.0, 35.0, 42.0, 28.0, 22.0, 21.0, 16.0, 14.0, 11.0, 12.0, 11.0, 16.0, 7.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2958984375, -0.286376953125, -0.27685546875, -0.267333984375, -0.2578125, -0.248291015625, -0.23876953125, -0.229248046875, -0.2197265625, -0.210205078125, -0.20068359375, -0.191162109375, -0.181640625, -0.172119140625, -0.16259765625, -0.153076171875, -0.1435546875, -0.134033203125, -0.12451171875, -0.114990234375, -0.10546875, -0.095947265625, -0.08642578125, -0.076904296875, -0.0673828125, -0.057861328125, -0.04833984375, -0.038818359375, -0.029296875, -0.019775390625, -0.01025390625, -0.000732421875, 0.0087890625, 0.018310546875, 0.02783203125, 0.037353515625, 0.046875, 0.056396484375, 0.06591796875, 0.075439453125, 0.0849609375, 0.094482421875, 0.10400390625, 0.113525390625, 0.123046875, 0.132568359375, 0.14208984375, 0.151611328125, 0.1611328125, 0.170654296875, 0.18017578125, 0.189697265625, 0.19921875, 0.208740234375, 0.21826171875, 0.227783203125, 0.2373046875, 0.246826171875, 0.25634765625, 0.265869140625, 0.275390625, 0.284912109375, 0.29443359375, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 6.0, 11.0, 15.0, 37.0, 66.0, 107.0, 163.0, 293.0, 562.0, 1007.0, 2300.0, 5793.0, 16660.0, 61985.0, 278616.0, 490884.0, 140168.0, 32768.0, 10007.0, 3814.0, 1602.0, 762.0, 358.0, 202.0, 132.0, 82.0, 49.0, 27.0, 20.0, 15.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0234375, -0.022608518600463867, -0.021779537200927734, -0.0209505558013916, -0.02012157440185547, -0.019292593002319336, -0.018463611602783203, -0.01763463020324707, -0.016805648803710938, -0.015976667404174805, -0.015147686004638672, -0.014318704605102539, -0.013489723205566406, -0.012660741806030273, -0.01183176040649414, -0.011002779006958008, -0.010173797607421875, -0.009344816207885742, -0.00851583480834961, -0.0076868534088134766, -0.006857872009277344, -0.006028890609741211, -0.005199909210205078, -0.004370927810668945, -0.0035419464111328125, -0.0027129650115966797, -0.0018839836120605469, -0.001055002212524414, -0.00022602081298828125, 0.0006029605865478516, 0.0014319419860839844, 0.002260923385620117, 0.00308990478515625, 0.003918886184692383, 0.004747867584228516, 0.0055768489837646484, 0.006405830383300781, 0.007234811782836914, 0.008063793182373047, 0.00889277458190918, 0.009721755981445312, 0.010550737380981445, 0.011379718780517578, 0.012208700180053711, 0.013037681579589844, 0.013866662979125977, 0.01469564437866211, 0.015524625778198242, 0.016353607177734375, 0.017182588577270508, 0.01801156997680664, 0.018840551376342773, 0.019669532775878906, 0.02049851417541504, 0.021327495574951172, 0.022156476974487305, 0.022985458374023438, 0.02381443977355957, 0.024643421173095703, 0.025472402572631836, 0.02630138397216797, 0.0271303653717041, 0.027959346771240234, 0.028788328170776367, 0.0296173095703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 4.0, 4.0, 11.0, 2.0, 10.0, 6.0, 16.0, 24.0, 24.0, 29.0, 45.0, 55.0, 61.0, 81.0, 93.0, 71.0, 76.0, 72.0, 73.0, 62.0, 35.0, 32.0, 33.0, 18.0, 9.0, 15.0, 12.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2025237083435059e-05, -1.1533498764038086e-05, -1.1041760444641113e-05, -1.055002212524414e-05, -1.0058283805847168e-05, -9.566545486450195e-06, -9.074807167053223e-06, -8.58306884765625e-06, -8.091330528259277e-06, -7.599592208862305e-06, -7.107853889465332e-06, -6.616115570068359e-06, -6.124377250671387e-06, -5.632638931274414e-06, -5.140900611877441e-06, -4.649162292480469e-06, -4.157423973083496e-06, -3.6656856536865234e-06, -3.1739473342895508e-06, -2.682209014892578e-06, -2.1904706954956055e-06, -1.6987323760986328e-06, -1.2069940567016602e-06, -7.152557373046875e-07, -2.2351741790771484e-07, 2.682209014892578e-07, 7.599592208862305e-07, 1.2516975402832031e-06, 1.7434358596801758e-06, 2.2351741790771484e-06, 2.726912498474121e-06, 3.2186508178710938e-06, 3.7103891372680664e-06, 4.202127456665039e-06, 4.693865776062012e-06, 5.185604095458984e-06, 5.677342414855957e-06, 6.16908073425293e-06, 6.660819053649902e-06, 7.152557373046875e-06, 7.644295692443848e-06, 8.13603401184082e-06, 8.627772331237793e-06, 9.119510650634766e-06, 9.611248970031738e-06, 1.0102987289428711e-05, 1.0594725608825684e-05, 1.1086463928222656e-05, 1.1578202247619629e-05, 1.2069940567016602e-05, 1.2561678886413574e-05, 1.3053417205810547e-05, 1.354515552520752e-05, 1.4036893844604492e-05, 1.4528632164001465e-05, 1.5020370483398438e-05, 1.551210880279541e-05, 1.6003847122192383e-05, 1.6495585441589355e-05, 1.6987323760986328e-05, 1.74790620803833e-05, 1.7970800399780273e-05, 1.8462538719177246e-05, 1.895427703857422e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 11.0, 10.0, 12.0, 12.0, 29.0, 29.0, 52.0, 65.0, 95.0, 138.0, 209.0, 318.0, 564.0, 882.0, 1543.0, 2682.0, 4897.0, 9906.0, 21999.0, 51450.0, 131740.0, 299048.0, 298017.0, 130078.0, 51141.0, 21825.0, 9991.0, 5013.0, 2737.0, 1530.0, 951.0, 543.0, 322.0, 227.0, 146.0, 100.0, 66.0, 45.0, 29.0, 33.0, 18.0, 18.0, 9.0, 8.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0214691162109375, -0.020818471908569336, -0.020167827606201172, -0.019517183303833008, -0.018866539001464844, -0.01821589469909668, -0.017565250396728516, -0.01691460609436035, -0.016263961791992188, -0.015613317489624023, -0.01496267318725586, -0.014312028884887695, -0.013661384582519531, -0.013010740280151367, -0.012360095977783203, -0.011709451675415039, -0.011058807373046875, -0.010408163070678711, -0.009757518768310547, -0.009106874465942383, -0.008456230163574219, -0.007805585861206055, -0.007154941558837891, -0.0065042972564697266, -0.0058536529541015625, -0.0052030086517333984, -0.004552364349365234, -0.0039017200469970703, -0.0032510757446289062, -0.002600431442260742, -0.0019497871398925781, -0.001299142837524414, -0.00064849853515625, 2.1457672119140625e-06, 0.0006527900695800781, 0.0013034343719482422, 0.0019540786743164062, 0.0026047229766845703, 0.0032553672790527344, 0.0039060115814208984, 0.0045566558837890625, 0.0052073001861572266, 0.005857944488525391, 0.006508588790893555, 0.007159233093261719, 0.007809877395629883, 0.008460521697998047, 0.009111166000366211, 0.009761810302734375, 0.010412454605102539, 0.011063098907470703, 0.011713743209838867, 0.012364387512207031, 0.013015031814575195, 0.01366567611694336, 0.014316320419311523, 0.014966964721679688, 0.015617609024047852, 0.016268253326416016, 0.01691889762878418, 0.017569541931152344, 0.018220186233520508, 0.018870830535888672, 0.019521474838256836, 0.020172119140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 14.0, 16.0, 13.0, 19.0, 32.0, 33.0, 35.0, 30.0, 43.0, 46.0, 69.0, 61.0, 58.0, 38.0, 55.0, 64.0, 57.0, 39.0, 29.0, 42.0, 27.0, 34.0, 20.0, 19.0, 8.0, 8.0, 4.0, 8.0, 5.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005176544189453125, -0.005019545555114746, -0.004862546920776367, -0.004705548286437988, -0.004548549652099609, -0.0043915510177612305, -0.0042345523834228516, -0.004077553749084473, -0.003920555114746094, -0.003763556480407715, -0.003606557846069336, -0.003449559211730957, -0.003292560577392578, -0.0031355619430541992, -0.0029785633087158203, -0.0028215646743774414, -0.0026645660400390625, -0.0025075674057006836, -0.0023505687713623047, -0.0021935701370239258, -0.002036571502685547, -0.001879572868347168, -0.001722574234008789, -0.0015655755996704102, -0.0014085769653320312, -0.0012515783309936523, -0.0010945796966552734, -0.0009375810623168945, -0.0007805824279785156, -0.0006235837936401367, -0.0004665851593017578, -0.0003095865249633789, -0.000152587890625, 4.410743713378906e-06, 0.0001614093780517578, 0.0003184080123901367, 0.0004754066467285156, 0.0006324052810668945, 0.0007894039154052734, 0.0009464025497436523, 0.0011034011840820312, 0.0012603998184204102, 0.001417398452758789, 0.001574397087097168, 0.0017313957214355469, 0.0018883943557739258, 0.0020453929901123047, 0.0022023916244506836, 0.0023593902587890625, 0.0025163888931274414, 0.0026733875274658203, 0.0028303861618041992, 0.002987384796142578, 0.003144383430480957, 0.003301382064819336, 0.003458380699157715, 0.0036153793334960938, 0.0037723779678344727, 0.0039293766021728516, 0.0040863752365112305, 0.004243373870849609, 0.004400372505187988, 0.004557371139526367, 0.004714369773864746, 0.004871368408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 8.0, 3.0, 7.0, 10.0, 19.0, 23.0, 17.0, 45.0, 56.0, 53.0, 95.0, 85.0, 97.0, 91.0, 81.0, 75.0, 71.0, 56.0, 38.0, 39.0, 15.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3764435350894928, -0.36676907539367676, -0.3570946455001831, -0.34742018580436707, -0.3377457559108734, -0.3280712962150574, -0.3183968663215637, -0.3087224066257477, -0.29904794692993164, -0.2893734872341156, -0.27969905734062195, -0.2700245976448059, -0.26035016775131226, -0.2506757080554962, -0.24100126326084137, -0.23132681846618652, -0.22165237367153168, -0.21197792887687683, -0.20230348408222198, -0.19262903928756714, -0.1829545795917511, -0.17328013479709625, -0.1636056900024414, -0.15393123030662537, -0.1442568004131317, -0.13458235561847687, -0.12490790337324142, -0.11523345857858658, -0.10555900633335114, -0.09588456153869629, -0.08621011674404144, -0.076535664498806, -0.06686121225357056, -0.05718676373362541, -0.04751231521368027, -0.03783787041902542, -0.028163421899080276, -0.018488973379135132, -0.008814528584480286, 0.0008599236607551575, 0.010534368455410004, 0.02020881697535515, 0.029883263632655144, 0.03955771028995514, 0.049232158809900284, 0.05890660732984543, 0.06858105212450027, 0.07825550436973572, 0.08792994916439056, 0.09760439395904541, 0.10727884620428085, 0.1169532909989357, 0.12662774324417114, 0.136302188038826, 0.14597663283348083, 0.15565109252929688, 0.16532552242279053, 0.17499996721744537, 0.18467441201210022, 0.19434887170791626, 0.2040233165025711, 0.21369776129722595, 0.2233722060918808, 0.23304665088653564, 0.24272111058235168]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 8.0, 14.0, 10.0, 8.0, 14.0, 20.0, 22.0, 23.0, 21.0, 35.0, 21.0, 37.0, 54.0, 41.0, 41.0, 39.0, 50.0, 57.0, 60.0, 43.0, 49.0, 35.0, 46.0, 41.0, 34.0, 22.0, 29.0, 28.0, 14.0, 15.0, 14.0, 7.0, 11.0, 4.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717919558286667, -0.16606242954730988, -0.16033290326595306, -0.15460337698459625, -0.14887385070323944, -0.14314432442188263, -0.13741478323936462, -0.1316852569580078, -0.125955730676651, -0.12022620439529419, -0.11449667811393738, -0.10876715183258057, -0.10303762555122375, -0.09730809926986694, -0.09157856553792953, -0.08584903925657272, -0.08011952042579651, -0.0743899941444397, -0.06866046786308289, -0.06293094158172607, -0.057201411575078964, -0.05147188529372215, -0.04574235528707504, -0.04001282900571823, -0.03428330272436142, -0.028553776443004608, -0.022824248299002647, -0.017094720155000687, -0.011365193873643875, -0.005635667592287064, 9.386241436004639e-05, 0.005823388695716858, 0.01155291497707367, 0.01728244125843048, 0.02301196940243244, 0.028741497546434402, 0.034471023827791214, 0.040200550109148026, 0.045930080115795135, 0.05165960639715195, 0.05738913267850876, 0.06311865895986557, 0.06884818524122238, 0.07457771897315979, 0.0803072452545166, 0.08603677153587341, 0.09176629781723022, 0.09749582409858704, 0.10322535037994385, 0.10895487666130066, 0.11468440294265747, 0.12041392922401428, 0.1261434555053711, 0.1318729817867279, 0.13760250806808472, 0.14333203434944153, 0.14906156063079834, 0.15479108691215515, 0.16052061319351196, 0.16625013947486877, 0.17197966575622559, 0.1777091920375824, 0.1834387183189392, 0.18916824460029602, 0.19489778578281403]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 11.0, 16.0, 14.0, 26.0, 34.0, 53.0, 74.0, 126.0, 162.0, 292.0, 451.0, 707.0, 1313.0, 2366.0, 4698.0, 9488.0, 20863.0, 51985.0, 175029.0, 494756.0, 188870.0, 54771.0, 21845.0, 9863.0, 4824.0, 2465.0, 1400.0, 792.0, 451.0, 266.0, 184.0, 112.0, 77.0, 54.0, 37.0, 31.0, 16.0, 10.0, 10.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.234375, -0.225860595703125, -0.21734619140625, -0.208831787109375, -0.2003173828125, -0.191802978515625, -0.18328857421875, -0.174774169921875, -0.166259765625, -0.157745361328125, -0.14923095703125, -0.140716552734375, -0.1322021484375, -0.123687744140625, -0.11517333984375, -0.106658935546875, -0.09814453125, -0.089630126953125, -0.08111572265625, -0.072601318359375, -0.0640869140625, -0.055572509765625, -0.04705810546875, -0.038543701171875, -0.030029296875, -0.021514892578125, -0.01300048828125, -0.004486083984375, 0.0040283203125, 0.012542724609375, 0.02105712890625, 0.029571533203125, 0.0380859375, 0.046600341796875, 0.05511474609375, 0.063629150390625, 0.0721435546875, 0.080657958984375, 0.08917236328125, 0.097686767578125, 0.106201171875, 0.114715576171875, 0.12322998046875, 0.131744384765625, 0.1402587890625, 0.148773193359375, 0.15728759765625, 0.165802001953125, 0.17431640625, 0.182830810546875, 0.19134521484375, 0.199859619140625, 0.2083740234375, 0.216888427734375, 0.22540283203125, 0.233917236328125, 0.242431640625, 0.250946044921875, 0.25946044921875, 0.267974853515625, 0.2764892578125, 0.285003662109375, 0.29351806640625, 0.302032470703125, 0.310546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 17.0, 15.0, 17.0, 27.0, 27.0, 21.0, 25.0, 41.0, 47.0, 50.0, 63.0, 61.0, 65.0, 59.0, 53.0, 54.0, 58.0, 47.0, 41.0, 32.0, 30.0, 34.0, 16.0, 13.0, 15.0, 13.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3564643859863281, -0.34256744384765625, -0.3286705017089844, -0.3147735595703125, -0.3008766174316406, -0.28697967529296875, -0.2730827331542969, -0.259185791015625, -0.24528884887695312, -0.23139190673828125, -0.21749496459960938, -0.2035980224609375, -0.18970108032226562, -0.17580413818359375, -0.16190719604492188, -0.14801025390625, -0.13411331176757812, -0.12021636962890625, -0.10631942749023438, -0.0924224853515625, -0.07852554321289062, -0.06462860107421875, -0.050731658935546875, -0.036834716796875, -0.022937774658203125, -0.00904083251953125, 0.004856109619140625, 0.0187530517578125, 0.032649993896484375, 0.04654693603515625, 0.060443878173828125, 0.0743408203125, 0.08823776245117188, 0.10213470458984375, 0.11603164672851562, 0.1299285888671875, 0.14382553100585938, 0.15772247314453125, 0.17161941528320312, 0.185516357421875, 0.19941329956054688, 0.21331024169921875, 0.22720718383789062, 0.2411041259765625, 0.2550010681152344, 0.26889801025390625, 0.2827949523925781, 0.29669189453125, 0.3105888366699219, 0.32448577880859375, 0.3383827209472656, 0.3522796630859375, 0.3661766052246094, 0.38007354736328125, 0.3939704895019531, 0.407867431640625, 0.4217643737792969, 0.43566131591796875, 0.4495582580566406, 0.4634552001953125, 0.4773521423339844, 0.49124908447265625, 0.5051460266113281, 0.51904296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 13.0, 20.0, 29.0, 34.0, 67.0, 117.0, 286.0, 777.0, 3118.0, 19574.0, 282712.0, 699936.0, 34872.0, 5211.0, 1061.0, 335.0, 143.0, 78.0, 51.0, 39.0, 12.0, 22.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5527191162109375, -0.530731201171875, -0.5087432861328125, -0.48675537109375, -0.4647674560546875, -0.442779541015625, -0.4207916259765625, -0.3988037109375, -0.3768157958984375, -0.354827880859375, -0.3328399658203125, -0.31085205078125, -0.2888641357421875, -0.266876220703125, -0.2448883056640625, -0.222900390625, -0.2009124755859375, -0.178924560546875, -0.1569366455078125, -0.13494873046875, -0.1129608154296875, -0.090972900390625, -0.0689849853515625, -0.0469970703125, -0.0250091552734375, -0.003021240234375, 0.0189666748046875, 0.04095458984375, 0.0629425048828125, 0.084930419921875, 0.1069183349609375, 0.12890625, 0.1508941650390625, 0.172882080078125, 0.1948699951171875, 0.21685791015625, 0.2388458251953125, 0.260833740234375, 0.2828216552734375, 0.3048095703125, 0.3267974853515625, 0.348785400390625, 0.3707733154296875, 0.39276123046875, 0.4147491455078125, 0.436737060546875, 0.4587249755859375, 0.480712890625, 0.5027008056640625, 0.524688720703125, 0.5466766357421875, 0.56866455078125, 0.5906524658203125, 0.612640380859375, 0.6346282958984375, 0.6566162109375, 0.6786041259765625, 0.700592041015625, 0.7225799560546875, 0.74456787109375, 0.7665557861328125, 0.788543701171875, 0.8105316162109375, 0.83251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 10.0, 12.0, 20.0, 26.0, 31.0, 35.0, 33.0, 58.0, 51.0, 50.0, 57.0, 64.0, 57.0, 59.0, 60.0, 61.0, 54.0, 40.0, 38.0, 30.0, 26.0, 19.0, 16.0, 18.0, 8.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62451171875, -0.6078262329101562, -0.5911407470703125, -0.5744552612304688, -0.557769775390625, -0.5410842895507812, -0.5243988037109375, -0.5077133178710938, -0.49102783203125, -0.47434234619140625, -0.4576568603515625, -0.44097137451171875, -0.424285888671875, -0.40760040283203125, -0.3909149169921875, -0.37422943115234375, -0.3575439453125, -0.34085845947265625, -0.3241729736328125, -0.30748748779296875, -0.290802001953125, -0.27411651611328125, -0.2574310302734375, -0.24074554443359375, -0.22406005859375, -0.20737457275390625, -0.1906890869140625, -0.17400360107421875, -0.157318115234375, -0.14063262939453125, -0.1239471435546875, -0.10726165771484375, -0.090576171875, -0.07389068603515625, -0.0572052001953125, -0.04051971435546875, -0.023834228515625, -0.00714874267578125, 0.0095367431640625, 0.02622222900390625, 0.04290771484375, 0.05959320068359375, 0.0762786865234375, 0.09296417236328125, 0.109649658203125, 0.12633514404296875, 0.1430206298828125, 0.15970611572265625, 0.1763916015625, 0.19307708740234375, 0.2097625732421875, 0.22644805908203125, 0.243133544921875, 0.25981903076171875, 0.2765045166015625, 0.29319000244140625, 0.30987548828125, 0.32656097412109375, 0.3432464599609375, 0.35993194580078125, 0.376617431640625, 0.39330291748046875, 0.4099884033203125, 0.42667388916015625, 0.443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 13.0, 15.0, 15.0, 19.0, 39.0, 49.0, 119.0, 169.0, 335.0, 697.0, 1479.0, 3756.0, 13766.0, 82554.0, 664613.0, 239263.0, 30762.0, 6659.0, 2238.0, 918.0, 472.0, 262.0, 111.0, 86.0, 55.0, 27.0, 16.0, 10.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.132080078125, -0.12838459014892578, -0.12468910217285156, -0.12099361419677734, -0.11729812622070312, -0.1136026382446289, -0.10990715026855469, -0.10621166229248047, -0.10251617431640625, -0.09882068634033203, -0.09512519836425781, -0.0914297103881836, -0.08773422241210938, -0.08403873443603516, -0.08034324645996094, -0.07664775848388672, -0.0729522705078125, -0.06925678253173828, -0.06556129455566406, -0.061865806579589844, -0.058170318603515625, -0.054474830627441406, -0.05077934265136719, -0.04708385467529297, -0.04338836669921875, -0.03969287872314453, -0.03599739074707031, -0.032301902770996094, -0.028606414794921875, -0.024910926818847656, -0.021215438842773438, -0.01751995086669922, -0.013824462890625, -0.010128974914550781, -0.0064334869384765625, -0.0027379989624023438, 0.000957489013671875, 0.004652976989746094, 0.008348464965820312, 0.012043952941894531, 0.01573944091796875, 0.01943492889404297, 0.023130416870117188, 0.026825904846191406, 0.030521392822265625, 0.034216880798339844, 0.03791236877441406, 0.04160785675048828, 0.0453033447265625, 0.04899883270263672, 0.05269432067871094, 0.056389808654785156, 0.060085296630859375, 0.0637807846069336, 0.06747627258300781, 0.07117176055908203, 0.07486724853515625, 0.07856273651123047, 0.08225822448730469, 0.0859537124633789, 0.08964920043945312, 0.09334468841552734, 0.09704017639160156, 0.10073566436767578, 0.10443115234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 7.0, 11.0, 6.0, 18.0, 12.0, 20.0, 23.0, 42.0, 33.0, 52.0, 63.0, 79.0, 91.0, 112.0, 87.0, 70.0, 58.0, 53.0, 38.0, 21.0, 15.0, 19.0, 11.0, 14.0, 7.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4727935194969177e-05, -1.4256685972213745e-05, -1.3785436749458313e-05, -1.3314187526702881e-05, -1.2842938303947449e-05, -1.2371689081192017e-05, -1.1900439858436584e-05, -1.1429190635681152e-05, -1.095794141292572e-05, -1.0486692190170288e-05, -1.0015442967414856e-05, -9.544193744659424e-06, -9.072944521903992e-06, -8.60169529914856e-06, -8.130446076393127e-06, -7.659196853637695e-06, -7.187947630882263e-06, -6.716698408126831e-06, -6.245449185371399e-06, -5.774199962615967e-06, -5.302950739860535e-06, -4.8317015171051025e-06, -4.36045229434967e-06, -3.889203071594238e-06, -3.417953848838806e-06, -2.946704626083374e-06, -2.475455403327942e-06, -2.0042061805725098e-06, -1.5329569578170776e-06, -1.0617077350616455e-06, -5.904585123062134e-07, -1.1920928955078125e-07, 3.520399332046509e-07, 8.23289155960083e-07, 1.2945383787155151e-06, 1.7657876014709473e-06, 2.2370368242263794e-06, 2.7082860469818115e-06, 3.1795352697372437e-06, 3.6507844924926758e-06, 4.122033715248108e-06, 4.59328293800354e-06, 5.064532160758972e-06, 5.535781383514404e-06, 6.0070306062698364e-06, 6.4782798290252686e-06, 6.949529051780701e-06, 7.420778274536133e-06, 7.892027497291565e-06, 8.363276720046997e-06, 8.83452594280243e-06, 9.305775165557861e-06, 9.777024388313293e-06, 1.0248273611068726e-05, 1.0719522833824158e-05, 1.119077205657959e-05, 1.1662021279335022e-05, 1.2133270502090454e-05, 1.2604519724845886e-05, 1.3075768947601318e-05, 1.354701817035675e-05, 1.4018267393112183e-05, 1.4489516615867615e-05, 1.4960765838623047e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 8.0, 10.0, 23.0, 36.0, 65.0, 106.0, 212.0, 467.0, 1049.0, 2643.0, 9233.0, 65880.0, 723375.0, 217917.0, 20194.0, 4427.0, 1592.0, 669.0, 293.0, 173.0, 83.0, 32.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16492080688476562, -0.15955352783203125, -0.15418624877929688, -0.1488189697265625, -0.14345169067382812, -0.13808441162109375, -0.13271713256835938, -0.127349853515625, -0.12198257446289062, -0.11661529541015625, -0.11124801635742188, -0.1058807373046875, -0.10051345825195312, -0.09514617919921875, -0.08977890014648438, -0.08441162109375, -0.07904434204101562, -0.07367706298828125, -0.06830978393554688, -0.0629425048828125, -0.057575225830078125, -0.05220794677734375, -0.046840667724609375, -0.041473388671875, -0.036106109619140625, -0.03073883056640625, -0.025371551513671875, -0.0200042724609375, -0.014636993408203125, -0.00926971435546875, -0.003902435302734375, 0.00146484375, 0.006832122802734375, 0.01219940185546875, 0.017566680908203125, 0.0229339599609375, 0.028301239013671875, 0.03366851806640625, 0.039035797119140625, 0.044403076171875, 0.049770355224609375, 0.05513763427734375, 0.060504913330078125, 0.0658721923828125, 0.07123947143554688, 0.07660675048828125, 0.08197402954101562, 0.08734130859375, 0.09270858764648438, 0.09807586669921875, 0.10344314575195312, 0.1088104248046875, 0.11417770385742188, 0.11954498291015625, 0.12491226196289062, 0.130279541015625, 0.13564682006835938, 0.14101409912109375, 0.14638137817382812, 0.1517486572265625, 0.15711593627929688, 0.16248321533203125, 0.16785049438476562, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 16.0, 18.0, 21.0, 29.0, 60.0, 86.0, 136.0, 145.0, 148.0, 93.0, 68.0, 41.0, 40.0, 26.0, 16.0, 14.0, 3.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0670166015625, -0.06490612030029297, -0.06279563903808594, -0.060685157775878906, -0.058574676513671875, -0.056464195251464844, -0.05435371398925781, -0.05224323272705078, -0.05013275146484375, -0.04802227020263672, -0.04591178894042969, -0.043801307678222656, -0.041690826416015625, -0.039580345153808594, -0.03746986389160156, -0.03535938262939453, -0.0332489013671875, -0.03113842010498047, -0.029027938842773438, -0.026917457580566406, -0.024806976318359375, -0.022696495056152344, -0.020586013793945312, -0.01847553253173828, -0.01636505126953125, -0.014254570007324219, -0.012144088745117188, -0.010033607482910156, -0.007923126220703125, -0.005812644958496094, -0.0037021636962890625, -0.0015916824340820312, 0.000518798828125, 0.0026292800903320312, 0.0047397613525390625, 0.006850242614746094, 0.008960723876953125, 0.011071205139160156, 0.013181686401367188, 0.015292167663574219, 0.01740264892578125, 0.01951313018798828, 0.021623611450195312, 0.023734092712402344, 0.025844573974609375, 0.027955055236816406, 0.030065536499023438, 0.03217601776123047, 0.0342864990234375, 0.03639698028564453, 0.03850746154785156, 0.040617942810058594, 0.042728424072265625, 0.044838905334472656, 0.04694938659667969, 0.04905986785888672, 0.05117034912109375, 0.05328083038330078, 0.05539131164550781, 0.057501792907714844, 0.059612274169921875, 0.061722755432128906, 0.06383323669433594, 0.06594371795654297, 0.06805419921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 32.0, 87.0, 176.0, 280.0, 248.0, 116.0, 54.0, 11.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8445942997932434, -0.7835565805435181, -0.7225189208984375, -0.6614812016487122, -0.6004435420036316, -0.5394058227539062, -0.4783681333065033, -0.41733044385910034, -0.3562927544116974, -0.29525506496429443, -0.23421737551689148, -0.17317967116832733, -0.11214198172092438, -0.05110427737236023, 0.009933412075042725, 0.07097110152244568, 0.13200879096984863, 0.1930464804172516, 0.25408416986465454, 0.3151218891143799, 0.37615954875946045, 0.4371972680091858, 0.49823495745658875, 0.5592726469039917, 0.6203103065490723, 0.6813480257987976, 0.7423856854438782, 0.8034234046936035, 0.8644610643386841, 0.9254987835884094, 0.9865365028381348, 1.0475741624832153, 1.1086119413375854, 1.169649600982666, 1.2306873798370361, 1.2917250394821167, 1.3527626991271973, 1.4138004779815674, 1.474838137626648, 1.5358757972717285, 1.596913456916809, 1.6579511165618896, 1.7189888954162598, 1.7800265550613403, 1.841064214706421, 1.902101993560791, 1.9631396532058716, 2.024177312850952, 2.0852150917053223, 2.1462528705596924, 2.2072904109954834, 2.2683281898498535, 2.3293659687042236, 2.3904035091400146, 2.4514412879943848, 2.512478828430176, 2.573516607284546, 2.634554386138916, 2.695591926574707, 2.756629705429077, 2.8176674842834473, 2.8787050247192383, 2.9397428035736084, 3.0007805824279785, 3.0618181228637695]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 9.0, 19.0, 10.0, 13.0, 21.0, 24.0, 24.0, 23.0, 27.0, 31.0, 29.0, 42.0, 39.0, 37.0, 38.0, 42.0, 51.0, 51.0, 48.0, 55.0, 41.0, 38.0, 44.0, 43.0, 32.0, 19.0, 29.0, 17.0, 20.0, 11.0, 15.0, 12.0, 12.0, 6.0, 3.0, 10.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6871644258499146, -0.6649504899978638, -0.6427364945411682, -0.6205225586891174, -0.5983086228370667, -0.5760946869850159, -0.5538806915283203, -0.5316667556762695, -0.5094528198242188, -0.4872388541698456, -0.4650249183177948, -0.44281095266342163, -0.42059701681137085, -0.3983830511569977, -0.3761690855026245, -0.35395514965057373, -0.33174118399620056, -0.3095272183418274, -0.2873132824897766, -0.26509931683540344, -0.24288538098335266, -0.2206714153289795, -0.19845746457576752, -0.17624351382255554, -0.15402956306934357, -0.1318156123161316, -0.10960166156291962, -0.08738770335912704, -0.06517375260591507, -0.042959801852703094, -0.020745843648910522, 0.0014681071043014526, 0.023682057857513428, 0.0458960086107254, 0.06810995936393738, 0.09032391756772995, 0.11253786832094193, 0.1347518265247345, 0.15696577727794647, 0.17917972803115845, 0.20139367878437042, 0.2236076295375824, 0.24582158029079437, 0.26803553104400635, 0.2902494966983795, 0.3124634325504303, 0.33467739820480347, 0.35689133405685425, 0.3791052997112274, 0.4013192653656006, 0.42353320121765137, 0.44574716687202454, 0.4679611027240753, 0.4901750683784485, 0.5123890042304993, 0.5346029996871948, 0.5568169355392456, 0.5790308713912964, 0.6012448668479919, 0.6234588027000427, 0.6456727385520935, 0.6678866744041443, 0.6901006698608398, 0.7123146057128906, 0.7345285415649414]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 10.0, 13.0, 12.0, 15.0, 19.0, 25.0, 40.0, 67.0, 105.0, 167.0, 346.0, 710.0, 1585.0, 3491.0, 9441.0, 34293.0, 377416.0, 3245929.0, 466798.0, 37175.0, 9898.0, 3630.0, 1558.0, 723.0, 342.0, 162.0, 98.0, 46.0, 42.0, 25.0, 21.0, 13.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5044822692871094, -0.48943328857421875, -0.4743843078613281, -0.4593353271484375, -0.4442863464355469, -0.42923736572265625, -0.4141883850097656, -0.399139404296875, -0.3840904235839844, -0.36904144287109375, -0.3539924621582031, -0.3389434814453125, -0.3238945007324219, -0.30884552001953125, -0.2937965393066406, -0.27874755859375, -0.2636985778808594, -0.24864959716796875, -0.23360061645507812, -0.2185516357421875, -0.20350265502929688, -0.18845367431640625, -0.17340469360351562, -0.158355712890625, -0.14330673217773438, -0.12825775146484375, -0.11320877075195312, -0.0981597900390625, -0.08311080932617188, -0.06806182861328125, -0.053012847900390625, -0.0379638671875, -0.022914886474609375, -0.00786590576171875, 0.007183074951171875, 0.0222320556640625, 0.037281036376953125, 0.05233001708984375, 0.06737899780273438, 0.082427978515625, 0.09747695922851562, 0.11252593994140625, 0.12757492065429688, 0.1426239013671875, 0.15767288208007812, 0.17272186279296875, 0.18777084350585938, 0.20281982421875, 0.21786880493164062, 0.23291778564453125, 0.24796676635742188, 0.2630157470703125, 0.2780647277832031, 0.29311370849609375, 0.3081626892089844, 0.323211669921875, 0.3382606506347656, 0.35330963134765625, 0.3683586120605469, 0.3834075927734375, 0.3984565734863281, 0.41350555419921875, 0.4285545349121094, 0.443603515625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 11.0, 8.0, 16.0, 16.0, 10.0, 15.0, 21.0, 29.0, 25.0, 34.0, 32.0, 29.0, 27.0, 45.0, 40.0, 48.0, 37.0, 51.0, 41.0, 56.0, 50.0, 51.0, 41.0, 41.0, 44.0, 33.0, 22.0, 21.0, 13.0, 10.0, 13.0, 18.0, 9.0, 8.0, 2.0, 6.0, 3.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.222412109375, -0.21626853942871094, -0.21012496948242188, -0.2039813995361328, -0.19783782958984375, -0.1916942596435547, -0.18555068969726562, -0.17940711975097656, -0.1732635498046875, -0.16711997985839844, -0.16097640991210938, -0.1548328399658203, -0.14868927001953125, -0.1425457000732422, -0.13640213012695312, -0.13025856018066406, -0.124114990234375, -0.11797142028808594, -0.11182785034179688, -0.10568428039550781, -0.09954071044921875, -0.09339714050292969, -0.08725357055664062, -0.08111000061035156, -0.0749664306640625, -0.06882286071777344, -0.06267929077148438, -0.05653572082519531, -0.05039215087890625, -0.04424858093261719, -0.038105010986328125, -0.03196144104003906, -0.02581787109375, -0.019674301147460938, -0.013530731201171875, -0.0073871612548828125, -0.00124359130859375, 0.0048999786376953125, 0.011043548583984375, 0.017187118530273438, 0.0233306884765625, 0.029474258422851562, 0.035617828369140625, 0.04176139831542969, 0.04790496826171875, 0.05404853820800781, 0.060192108154296875, 0.06633567810058594, 0.072479248046875, 0.07862281799316406, 0.08476638793945312, 0.09090995788574219, 0.09705352783203125, 0.10319709777832031, 0.10934066772460938, 0.11548423767089844, 0.1216278076171875, 0.12777137756347656, 0.13391494750976562, 0.1400585174560547, 0.14620208740234375, 0.1523456573486328, 0.15848922729492188, 0.16463279724121094, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 12.0, 12.0, 19.0, 40.0, 70.0, 141.0, 317.0, 989.0, 5383.0, 119756.0, 4015424.0, 47472.0, 3407.0, 726.0, 244.0, 120.0, 64.0, 42.0, 16.0, 11.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3781814575195312, -1.3413238525390625, -1.3044662475585938, -1.267608642578125, -1.2307510375976562, -1.1938934326171875, -1.1570358276367188, -1.12017822265625, -1.0833206176757812, -1.0464630126953125, -1.0096054077148438, -0.972747802734375, -0.9358901977539062, -0.8990325927734375, -0.8621749877929688, -0.8253173828125, -0.7884597778320312, -0.7516021728515625, -0.7147445678710938, -0.677886962890625, -0.6410293579101562, -0.6041717529296875, -0.5673141479492188, -0.53045654296875, -0.49359893798828125, -0.4567413330078125, -0.41988372802734375, -0.383026123046875, -0.34616851806640625, -0.3093109130859375, -0.27245330810546875, -0.235595703125, -0.19873809814453125, -0.1618804931640625, -0.12502288818359375, -0.088165283203125, -0.05130767822265625, -0.0144500732421875, 0.02240753173828125, 0.05926513671875, 0.09612274169921875, 0.1329803466796875, 0.16983795166015625, 0.206695556640625, 0.24355316162109375, 0.2804107666015625, 0.31726837158203125, 0.3541259765625, 0.39098358154296875, 0.4278411865234375, 0.46469879150390625, 0.501556396484375, 0.5384140014648438, 0.5752716064453125, 0.6121292114257812, 0.64898681640625, 0.6858444213867188, 0.7227020263671875, 0.7595596313476562, 0.796417236328125, 0.8332748413085938, 0.8701324462890625, 0.9069900512695312, 0.94384765625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 18.0, 19.0, 33.0, 67.0, 110.0, 251.0, 638.0, 1180.0, 930.0, 432.0, 170.0, 96.0, 46.0, 34.0, 19.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20533180236816406, -0.19765090942382812, -0.1899700164794922, -0.18228912353515625, -0.1746082305908203, -0.16692733764648438, -0.15924644470214844, -0.1515655517578125, -0.14388465881347656, -0.13620376586914062, -0.1285228729248047, -0.12084197998046875, -0.11316108703613281, -0.10548019409179688, -0.09779930114746094, -0.090118408203125, -0.08243751525878906, -0.07475662231445312, -0.06707572937011719, -0.05939483642578125, -0.05171394348144531, -0.044033050537109375, -0.03635215759277344, -0.0286712646484375, -0.020990371704101562, -0.013309478759765625, -0.0056285858154296875, 0.00205230712890625, 0.009733200073242188, 0.017414093017578125, 0.025094985961914062, 0.03277587890625, 0.04045677185058594, 0.048137664794921875, 0.05581855773925781, 0.06349945068359375, 0.07118034362792969, 0.07886123657226562, 0.08654212951660156, 0.0942230224609375, 0.10190391540527344, 0.10958480834960938, 0.11726570129394531, 0.12494659423828125, 0.1326274871826172, 0.14030838012695312, 0.14798927307128906, 0.155670166015625, 0.16335105895996094, 0.17103195190429688, 0.1787128448486328, 0.18639373779296875, 0.1940746307373047, 0.20175552368164062, 0.20943641662597656, 0.2171173095703125, 0.22479820251464844, 0.23247909545898438, 0.2401599884033203, 0.24784088134765625, 0.2555217742919922, 0.2632026672363281, 0.27088356018066406, 0.278564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 13.0, 16.0, 21.0, 28.0, 36.0, 47.0, 55.0, 70.0, 56.0, 77.0, 69.0, 73.0, 71.0, 49.0, 56.0, 56.0, 42.0, 34.0, 28.0, 19.0, 21.0, 10.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5387060642242432, -0.5260964632034302, -0.5134868621826172, -0.5008772611618042, -0.4882676601409912, -0.4756580591201782, -0.46304845809936523, -0.45043885707855225, -0.43782925605773926, -0.42521965503692627, -0.4126100540161133, -0.4000004529953003, -0.3873908519744873, -0.3747812509536743, -0.36217164993286133, -0.34956204891204834, -0.33695247769355774, -0.32434287667274475, -0.31173327565193176, -0.2991236746311188, -0.2865140736103058, -0.2739044725894928, -0.2612949013710022, -0.24868528544902802, -0.23607568442821503, -0.22346608340740204, -0.21085648238658905, -0.19824689626693726, -0.18563729524612427, -0.17302769422531128, -0.1604180932044983, -0.1478084921836853, -0.1351989209651947, -0.12258931994438171, -0.10997971892356873, -0.09737012535333633, -0.08476052433252335, -0.07215092331171036, -0.059541329741477966, -0.04693172872066498, -0.03432212769985199, -0.02171252854168415, -0.009102929383516312, 0.003506667912006378, 0.016116268932819366, 0.028725869953632355, 0.041335463523864746, 0.053945064544677734, 0.06655466556549072, 0.07916426658630371, 0.0917738676071167, 0.10438346117734909, 0.11699306219816208, 0.12960267066955566, 0.14221225678920746, 0.15482185781002045, 0.16743145883083344, 0.18004105985164642, 0.1926506608724594, 0.2052602469921112, 0.2178698480129242, 0.23047944903373718, 0.24308905005455017, 0.25569865107536316, 0.26830825209617615]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 10.0, 15.0, 9.0, 15.0, 14.0, 19.0, 18.0, 19.0, 33.0, 24.0, 43.0, 43.0, 42.0, 31.0, 40.0, 42.0, 55.0, 46.0, 37.0, 38.0, 29.0, 29.0, 46.0, 32.0, 35.0, 34.0, 28.0, 29.0, 19.0, 14.0, 14.0, 12.0, 12.0, 16.0, 9.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.28750863671302795, -0.27930018305778503, -0.2710916996002197, -0.2628832459449768, -0.2546747624874115, -0.24646630883216858, -0.23825784027576447, -0.23004937171936035, -0.22184090316295624, -0.21363243460655212, -0.205423966050148, -0.1972154974937439, -0.18900704383850098, -0.18079856038093567, -0.17259010672569275, -0.16438163816928864, -0.15617316961288452, -0.1479647010564804, -0.1397562325000763, -0.13154776394367218, -0.12333930283784866, -0.11513083428144455, -0.10692237317562103, -0.09871390461921692, -0.0905054360628128, -0.08229696750640869, -0.07408849895000458, -0.06588003784418106, -0.05767156928777695, -0.04946310073137283, -0.04125463590025902, -0.0330461710691452, -0.02483770251274109, -0.016629235818982124, -0.00842076912522316, -0.00021230243146419525, 0.00799616426229477, 0.016204632818698883, 0.0244130976498127, 0.032621562480926514, 0.04083003103733063, 0.04903849959373474, 0.057246964424848557, 0.06545542925596237, 0.07366389781236649, 0.0818723663687706, 0.09008082747459412, 0.09828929603099823, 0.10649776458740234, 0.11470623314380646, 0.12291470170021057, 0.13112317025661469, 0.1393316388130188, 0.14754009246826172, 0.15574856102466583, 0.16395702958106995, 0.17216549813747406, 0.18037396669387817, 0.1885824352502823, 0.1967909038066864, 0.20499935746192932, 0.21320784091949463, 0.22141629457473755, 0.22962476313114166, 0.23783323168754578]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 6.0, 15.0, 15.0, 25.0, 35.0, 43.0, 63.0, 78.0, 127.0, 169.0, 275.0, 446.0, 748.0, 1351.0, 2614.0, 4878.0, 9645.0, 22662.0, 80507.0, 429180.0, 384246.0, 71049.0, 20718.0, 9354.0, 4667.0, 2422.0, 1283.0, 695.0, 386.0, 250.0, 163.0, 126.0, 75.0, 50.0, 41.0, 28.0, 29.0, 13.0, 14.0, 14.0, 3.0, 8.0, 13.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.10528564453125, -0.10218524932861328, -0.09908485412597656, -0.09598445892333984, -0.09288406372070312, -0.0897836685180664, -0.08668327331542969, -0.08358287811279297, -0.08048248291015625, -0.07738208770751953, -0.07428169250488281, -0.0711812973022461, -0.06808090209960938, -0.06498050689697266, -0.06188011169433594, -0.05877971649169922, -0.0556793212890625, -0.05257892608642578, -0.04947853088378906, -0.046378135681152344, -0.043277740478515625, -0.040177345275878906, -0.03707695007324219, -0.03397655487060547, -0.03087615966796875, -0.02777576446533203, -0.024675369262695312, -0.021574974060058594, -0.018474578857421875, -0.015374183654785156, -0.012273788452148438, -0.009173393249511719, -0.006072998046875, -0.0029726028442382812, 0.0001277923583984375, 0.0032281875610351562, 0.006328582763671875, 0.009428977966308594, 0.012529373168945312, 0.01562976837158203, 0.01873016357421875, 0.02183055877685547, 0.024930953979492188, 0.028031349182128906, 0.031131744384765625, 0.034232139587402344, 0.03733253479003906, 0.04043292999267578, 0.0435333251953125, 0.04663372039794922, 0.04973411560058594, 0.052834510803222656, 0.055934906005859375, 0.059035301208496094, 0.06213569641113281, 0.06523609161376953, 0.06833648681640625, 0.07143688201904297, 0.07453727722167969, 0.0776376724243164, 0.08073806762695312, 0.08383846282958984, 0.08693885803222656, 0.09003925323486328, 0.0931396484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 10.0, 12.0, 12.0, 11.0, 14.0, 17.0, 23.0, 18.0, 26.0, 25.0, 37.0, 27.0, 54.0, 40.0, 35.0, 62.0, 50.0, 45.0, 47.0, 38.0, 41.0, 31.0, 42.0, 36.0, 25.0, 33.0, 27.0, 32.0, 16.0, 16.0, 19.0, 19.0, 9.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16146469116210938, -0.15581512451171875, -0.15016555786132812, -0.1445159912109375, -0.13886642456054688, -0.13321685791015625, -0.12756729125976562, -0.121917724609375, -0.11626815795898438, -0.11061859130859375, -0.10496902465820312, -0.0993194580078125, -0.09366989135742188, -0.08802032470703125, -0.08237075805664062, -0.07672119140625, -0.07107162475585938, -0.06542205810546875, -0.059772491455078125, -0.0541229248046875, -0.048473358154296875, -0.04282379150390625, -0.037174224853515625, -0.031524658203125, -0.025875091552734375, -0.02022552490234375, -0.014575958251953125, -0.0089263916015625, -0.003276824951171875, 0.00237274169921875, 0.008022308349609375, 0.013671875, 0.019321441650390625, 0.02497100830078125, 0.030620574951171875, 0.0362701416015625, 0.041919708251953125, 0.04756927490234375, 0.053218841552734375, 0.058868408203125, 0.06451797485351562, 0.07016754150390625, 0.07581710815429688, 0.0814666748046875, 0.08711624145507812, 0.09276580810546875, 0.09841537475585938, 0.10406494140625, 0.10971450805664062, 0.11536407470703125, 0.12101364135742188, 0.1266632080078125, 0.13231277465820312, 0.13796234130859375, 0.14361190795898438, 0.149261474609375, 0.15491104125976562, 0.16056060791015625, 0.16621017456054688, 0.1718597412109375, 0.17750930786132812, 0.18315887451171875, 0.18880844116210938, 0.1944580078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 11.0, 9.0, 22.0, 23.0, 29.0, 43.0, 56.0, 100.0, 122.0, 188.0, 263.0, 446.0, 741.0, 1186.0, 2126.0, 4014.0, 8343.0, 19397.0, 54304.0, 191389.0, 441353.0, 219992.0, 62742.0, 22341.0, 9155.0, 4450.0, 2317.0, 1234.0, 766.0, 485.0, 309.0, 168.0, 122.0, 85.0, 49.0, 46.0, 33.0, 20.0, 21.0, 11.0, 9.0, 3.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06194019317626953, -0.06003761291503906, -0.058135032653808594, -0.056232452392578125, -0.054329872131347656, -0.05242729187011719, -0.05052471160888672, -0.04862213134765625, -0.04671955108642578, -0.04481697082519531, -0.042914390563964844, -0.041011810302734375, -0.039109230041503906, -0.03720664978027344, -0.03530406951904297, -0.0334014892578125, -0.03149890899658203, -0.029596328735351562, -0.027693748474121094, -0.025791168212890625, -0.023888587951660156, -0.021986007690429688, -0.02008342742919922, -0.01818084716796875, -0.01627826690673828, -0.014375686645507812, -0.012473106384277344, -0.010570526123046875, -0.008667945861816406, -0.0067653656005859375, -0.004862785339355469, -0.002960205078125, -0.0010576248168945312, 0.0008449554443359375, 0.0027475357055664062, 0.004650115966796875, 0.006552696228027344, 0.008455276489257812, 0.010357856750488281, 0.01226043701171875, 0.014163017272949219, 0.016065597534179688, 0.017968177795410156, 0.019870758056640625, 0.021773338317871094, 0.023675918579101562, 0.02557849884033203, 0.0274810791015625, 0.02938365936279297, 0.03128623962402344, 0.033188819885253906, 0.035091400146484375, 0.036993980407714844, 0.03889656066894531, 0.04079914093017578, 0.04270172119140625, 0.04460430145263672, 0.04650688171386719, 0.048409461975097656, 0.050312042236328125, 0.052214622497558594, 0.05411720275878906, 0.05601978302001953, 0.05792236328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 12.0, 11.0, 12.0, 15.0, 19.0, 13.0, 23.0, 21.0, 22.0, 31.0, 28.0, 31.0, 41.0, 38.0, 51.0, 40.0, 34.0, 38.0, 30.0, 33.0, 41.0, 31.0, 29.0, 38.0, 32.0, 34.0, 33.0, 30.0, 29.0, 23.0, 23.0, 19.0, 13.0, 8.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.4091796875, -0.3971672058105469, -0.38515472412109375, -0.3731422424316406, -0.3611297607421875, -0.3491172790527344, -0.33710479736328125, -0.3250923156738281, -0.313079833984375, -0.3010673522949219, -0.28905487060546875, -0.2770423889160156, -0.2650299072265625, -0.2530174255371094, -0.24100494384765625, -0.22899246215820312, -0.21697998046875, -0.20496749877929688, -0.19295501708984375, -0.18094253540039062, -0.1689300537109375, -0.15691757202148438, -0.14490509033203125, -0.13289260864257812, -0.120880126953125, -0.10886764526367188, -0.09685516357421875, -0.08484268188476562, -0.0728302001953125, -0.060817718505859375, -0.04880523681640625, -0.036792755126953125, -0.0247802734375, -0.012767791748046875, -0.00075531005859375, 0.011257171630859375, 0.0232696533203125, 0.035282135009765625, 0.04729461669921875, 0.059307098388671875, 0.071319580078125, 0.08333206176757812, 0.09534454345703125, 0.10735702514648438, 0.1193695068359375, 0.13138198852539062, 0.14339447021484375, 0.15540695190429688, 0.16741943359375, 0.17943191528320312, 0.19144439697265625, 0.20345687866210938, 0.2154693603515625, 0.22748184204101562, 0.23949432373046875, 0.2515068054199219, 0.263519287109375, 0.2755317687988281, 0.28754425048828125, 0.2995567321777344, 0.3115692138671875, 0.3235816955566406, 0.33559417724609375, 0.3476066589355469, 0.359619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 11.0, 7.0, 12.0, 7.0, 20.0, 14.0, 19.0, 43.0, 76.0, 137.0, 191.0, 373.0, 867.0, 1689.0, 3908.0, 10736.0, 40895.0, 383763.0, 527420.0, 56922.0, 12972.0, 4544.0, 1959.0, 912.0, 463.0, 231.0, 152.0, 64.0, 44.0, 32.0, 21.0, 12.0, 14.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.047332763671875, -0.04598379135131836, -0.04463481903076172, -0.04328584671020508, -0.04193687438964844, -0.0405879020690918, -0.039238929748535156, -0.037889957427978516, -0.036540985107421875, -0.035192012786865234, -0.033843040466308594, -0.03249406814575195, -0.031145095825195312, -0.029796123504638672, -0.02844715118408203, -0.02709817886352539, -0.02574920654296875, -0.02440023422241211, -0.02305126190185547, -0.021702289581298828, -0.020353317260742188, -0.019004344940185547, -0.017655372619628906, -0.016306400299072266, -0.014957427978515625, -0.013608455657958984, -0.012259483337402344, -0.010910511016845703, -0.009561538696289062, -0.008212566375732422, -0.006863594055175781, -0.005514621734619141, -0.0041656494140625, -0.0028166770935058594, -0.0014677047729492188, -0.00011873245239257812, 0.0012302398681640625, 0.002579212188720703, 0.003928184509277344, 0.005277156829833984, 0.006626129150390625, 0.007975101470947266, 0.009324073791503906, 0.010673046112060547, 0.012022018432617188, 0.013370990753173828, 0.014719963073730469, 0.01606893539428711, 0.01741790771484375, 0.01876688003540039, 0.02011585235595703, 0.021464824676513672, 0.022813796997070312, 0.024162769317626953, 0.025511741638183594, 0.026860713958740234, 0.028209686279296875, 0.029558658599853516, 0.030907630920410156, 0.0322566032409668, 0.03360557556152344, 0.03495454788208008, 0.03630352020263672, 0.03765249252319336, 0.03900146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 6.0, 13.0, 24.0, 51.0, 71.0, 149.0, 182.0, 183.0, 132.0, 65.0, 38.0, 19.0, 9.0, 9.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8133392333984375e-05, -2.7156434953212738e-05, -2.61794775724411e-05, -2.5202520191669464e-05, -2.4225562810897827e-05, -2.324860543012619e-05, -2.2271648049354553e-05, -2.1294690668582916e-05, -2.031773328781128e-05, -1.9340775907039642e-05, -1.8363818526268005e-05, -1.738686114549637e-05, -1.640990376472473e-05, -1.5432946383953094e-05, -1.4455989003181458e-05, -1.347903162240982e-05, -1.2502074241638184e-05, -1.1525116860866547e-05, -1.054815948009491e-05, -9.571202099323273e-06, -8.594244718551636e-06, -7.617287337779999e-06, -6.640329957008362e-06, -5.663372576236725e-06, -4.686415195465088e-06, -3.709457814693451e-06, -2.732500433921814e-06, -1.755543053150177e-06, -7.7858567237854e-07, 1.9837170839309692e-07, 1.1753290891647339e-06, 2.152286469936371e-06, 3.129243850708008e-06, 4.106201231479645e-06, 5.083158612251282e-06, 6.060115993022919e-06, 7.037073373794556e-06, 8.014030754566193e-06, 8.99098813533783e-06, 9.967945516109467e-06, 1.0944902896881104e-05, 1.192186027765274e-05, 1.2898817658424377e-05, 1.3875775039196014e-05, 1.4852732419967651e-05, 1.582968980073929e-05, 1.6806647181510925e-05, 1.7783604562282562e-05, 1.87605619430542e-05, 1.9737519323825836e-05, 2.0714476704597473e-05, 2.169143408536911e-05, 2.2668391466140747e-05, 2.3645348846912384e-05, 2.462230622768402e-05, 2.5599263608455658e-05, 2.6576220989227295e-05, 2.7553178369998932e-05, 2.853013575077057e-05, 2.9507093131542206e-05, 3.0484050512313843e-05, 3.146100789308548e-05, 3.243796527385712e-05, 3.3414922654628754e-05, 3.439188003540039e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 19.0, 23.0, 39.0, 40.0, 79.0, 96.0, 189.0, 251.0, 417.0, 644.0, 1087.0, 1834.0, 3132.0, 6124.0, 12462.0, 30140.0, 93762.0, 303068.0, 381388.0, 138189.0, 42257.0, 16342.0, 7531.0, 4019.0, 2129.0, 1260.0, 694.0, 466.0, 284.0, 176.0, 126.0, 84.0, 63.0, 34.0, 23.0, 17.0, 13.0, 8.0, 15.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02618408203125, -0.02531576156616211, -0.02444744110107422, -0.023579120635986328, -0.022710800170898438, -0.021842479705810547, -0.020974159240722656, -0.020105838775634766, -0.019237518310546875, -0.018369197845458984, -0.017500877380371094, -0.016632556915283203, -0.015764236450195312, -0.014895915985107422, -0.014027595520019531, -0.01315927505493164, -0.01229095458984375, -0.01142263412475586, -0.010554313659667969, -0.009685993194580078, -0.008817672729492188, -0.007949352264404297, -0.007081031799316406, -0.006212711334228516, -0.005344390869140625, -0.004476070404052734, -0.0036077499389648438, -0.002739429473876953, -0.0018711090087890625, -0.0010027885437011719, -0.00013446807861328125, 0.0007338523864746094, 0.0016021728515625, 0.0024704933166503906, 0.0033388137817382812, 0.004207134246826172, 0.0050754547119140625, 0.005943775177001953, 0.006812095642089844, 0.007680416107177734, 0.008548736572265625, 0.009417057037353516, 0.010285377502441406, 0.011153697967529297, 0.012022018432617188, 0.012890338897705078, 0.013758659362792969, 0.01462697982788086, 0.01549530029296875, 0.01636362075805664, 0.01723194122314453, 0.018100261688232422, 0.018968582153320312, 0.019836902618408203, 0.020705223083496094, 0.021573543548583984, 0.022441864013671875, 0.023310184478759766, 0.024178504943847656, 0.025046825408935547, 0.025915145874023438, 0.026783466339111328, 0.02765178680419922, 0.02852010726928711, 0.029388427734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 9.0, 16.0, 20.0, 17.0, 38.0, 48.0, 77.0, 90.0, 83.0, 107.0, 92.0, 76.0, 85.0, 50.0, 39.0, 28.0, 21.0, 11.0, 19.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01061248779296875, -0.0102766752243042, -0.009940862655639648, -0.009605050086975098, -0.009269237518310547, -0.008933424949645996, -0.008597612380981445, -0.008261799812316895, -0.007925987243652344, -0.007590174674987793, -0.007254362106323242, -0.006918549537658691, -0.006582736968994141, -0.00624692440032959, -0.005911111831665039, -0.005575299263000488, -0.0052394866943359375, -0.004903674125671387, -0.004567861557006836, -0.004232048988342285, -0.0038962364196777344, -0.0035604238510131836, -0.003224611282348633, -0.002888798713684082, -0.0025529861450195312, -0.0022171735763549805, -0.0018813610076904297, -0.001545548439025879, -0.0012097358703613281, -0.0008739233016967773, -0.0005381107330322266, -0.00020229816436767578, 0.000133514404296875, 0.0004693269729614258, 0.0008051395416259766, 0.0011409521102905273, 0.0014767646789550781, 0.001812577247619629, 0.0021483898162841797, 0.0024842023849487305, 0.0028200149536132812, 0.003155827522277832, 0.003491640090942383, 0.0038274526596069336, 0.004163265228271484, 0.004499077796936035, 0.004834890365600586, 0.005170702934265137, 0.0055065155029296875, 0.005842328071594238, 0.006178140640258789, 0.00651395320892334, 0.006849765777587891, 0.007185578346252441, 0.007521390914916992, 0.007857203483581543, 0.008193016052246094, 0.008528828620910645, 0.008864641189575195, 0.009200453758239746, 0.009536266326904297, 0.009872078895568848, 0.010207891464233398, 0.01054370403289795, 0.0108795166015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 13.0, 13.0, 9.0, 13.0, 13.0, 24.0, 19.0, 46.0, 57.0, 48.0, 47.0, 52.0, 62.0, 56.0, 61.0, 61.0, 52.0, 52.0, 48.0, 55.0, 40.0, 27.0, 26.0, 15.0, 23.0, 12.0, 11.0, 6.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21121995151042938, -0.2046094834804535, -0.1979990005493164, -0.19138853251934052, -0.18477806448936462, -0.17816759645938873, -0.17155712842941284, -0.16494664549827576, -0.15833617746829987, -0.15172570943832397, -0.1451152265071869, -0.138504758477211, -0.1318942904472351, -0.12528382241725922, -0.11867334693670273, -0.11206287145614624, -0.10545240342617035, -0.09884193539619446, -0.09223145991563797, -0.08562098443508148, -0.07901051640510559, -0.0724000483751297, -0.06578957289457321, -0.05917910113930702, -0.05256862938404083, -0.04595815762877464, -0.03934768587350845, -0.032737214118242264, -0.026126742362976074, -0.019516270607709885, -0.012905798852443695, -0.0062953270971775055, 0.00031515955924987793, 0.0069256313145160675, 0.013536103069782257, 0.020146574825048447, 0.026757046580314636, 0.033367518335580826, 0.039977990090847015, 0.046588461846113205, 0.053198933601379395, 0.059809405356645584, 0.06641987711191177, 0.07303035259246826, 0.07964082062244415, 0.08625128865242004, 0.09286176413297653, 0.09947223961353302, 0.10608270764350891, 0.1126931756734848, 0.11930365115404129, 0.12591412663459778, 0.13252459466457367, 0.13913506269454956, 0.14574554562568665, 0.15235601365566254, 0.15896648168563843, 0.16557694971561432, 0.1721874177455902, 0.1787979006767273, 0.18540836870670319, 0.19201883673667908, 0.19862931966781616, 0.20523978769779205, 0.21185025572776794]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 13.0, 17.0, 17.0, 13.0, 17.0, 21.0, 24.0, 23.0, 31.0, 44.0, 40.0, 46.0, 42.0, 40.0, 47.0, 46.0, 38.0, 43.0, 31.0, 43.0, 31.0, 32.0, 31.0, 32.0, 30.0, 36.0, 29.0, 16.0, 16.0, 15.0, 14.0, 10.0, 17.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.18202324211597443, -0.17685925960540771, -0.1716952919960022, -0.16653130948543549, -0.16136732697486877, -0.15620335936546326, -0.15103937685489655, -0.14587539434432983, -0.14071142673492432, -0.1355474442243576, -0.1303834766149521, -0.12521949410438538, -0.12005551159381866, -0.11489153653383255, -0.10972756147384644, -0.10456357896327972, -0.09939959645271301, -0.0942356213927269, -0.08907163888216019, -0.08390766382217407, -0.07874368131160736, -0.07357970625162125, -0.06841573119163513, -0.06325174868106842, -0.058087773621082306, -0.05292379483580589, -0.04775981605052948, -0.042595840990543365, -0.03743186220526695, -0.03226788341999054, -0.027103906497359276, -0.021939929574728012, -0.016775965690612793, -0.011611987836658955, -0.006448009982705116, -0.001284032128751278, 0.0038799457252025604, 0.009043924510478973, 0.014207901433110237, 0.0193718783557415, 0.024535857141017914, 0.029699835926294327, 0.03486381471157074, 0.040027789771556854, 0.04519176855683327, 0.05035574734210968, 0.055519722402095795, 0.06068370118737221, 0.06584767997264862, 0.07101165503263474, 0.07617563754320145, 0.08133961260318756, 0.08650359511375427, 0.09166757017374039, 0.0968315452337265, 0.10199552774429321, 0.10715950280427933, 0.11232347786426544, 0.11748746037483215, 0.12265143543481827, 0.12781541049480438, 0.1329793930053711, 0.1381433755159378, 0.14330734312534332, 0.14847132563591003]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 7.0, 14.0, 16.0, 39.0, 47.0, 73.0, 125.0, 147.0, 255.0, 415.0, 691.0, 1233.0, 2344.0, 4395.0, 8518.0, 18313.0, 43889.0, 120770.0, 321582.0, 323463.0, 121380.0, 44037.0, 18364.0, 8592.0, 4276.0, 2375.0, 1272.0, 700.0, 420.0, 282.0, 170.0, 99.0, 70.0, 51.0, 41.0, 25.0, 12.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.313232421875, -0.303741455078125, -0.29425048828125, -0.284759521484375, -0.2752685546875, -0.265777587890625, -0.25628662109375, -0.246795654296875, -0.2373046875, -0.227813720703125, -0.21832275390625, -0.208831787109375, -0.1993408203125, -0.189849853515625, -0.18035888671875, -0.170867919921875, -0.161376953125, -0.151885986328125, -0.14239501953125, -0.132904052734375, -0.1234130859375, -0.113922119140625, -0.10443115234375, -0.094940185546875, -0.08544921875, -0.075958251953125, -0.06646728515625, -0.056976318359375, -0.0474853515625, -0.037994384765625, -0.02850341796875, -0.019012451171875, -0.009521484375, -3.0517578125e-05, 0.00946044921875, 0.018951416015625, 0.0284423828125, 0.037933349609375, 0.04742431640625, 0.056915283203125, 0.06640625, 0.075897216796875, 0.08538818359375, 0.094879150390625, 0.1043701171875, 0.113861083984375, 0.12335205078125, 0.132843017578125, 0.142333984375, 0.151824951171875, 0.16131591796875, 0.170806884765625, 0.1802978515625, 0.189788818359375, 0.19927978515625, 0.208770751953125, 0.21826171875, 0.227752685546875, 0.23724365234375, 0.246734619140625, 0.2562255859375, 0.265716552734375, 0.27520751953125, 0.284698486328125, 0.294189453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 12.0, 18.0, 12.0, 14.0, 23.0, 33.0, 29.0, 28.0, 34.0, 54.0, 46.0, 44.0, 45.0, 58.0, 48.0, 45.0, 31.0, 43.0, 43.0, 43.0, 30.0, 41.0, 38.0, 20.0, 23.0, 24.0, 14.0, 16.0, 10.0, 13.0, 10.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.320068359375, -0.310882568359375, -0.30169677734375, -0.292510986328125, -0.2833251953125, -0.274139404296875, -0.26495361328125, -0.255767822265625, -0.24658203125, -0.237396240234375, -0.22821044921875, -0.219024658203125, -0.2098388671875, -0.200653076171875, -0.19146728515625, -0.182281494140625, -0.173095703125, -0.163909912109375, -0.15472412109375, -0.145538330078125, -0.1363525390625, -0.127166748046875, -0.11798095703125, -0.108795166015625, -0.099609375, -0.090423583984375, -0.08123779296875, -0.072052001953125, -0.0628662109375, -0.053680419921875, -0.04449462890625, -0.035308837890625, -0.026123046875, -0.016937255859375, -0.00775146484375, 0.001434326171875, 0.0106201171875, 0.019805908203125, 0.02899169921875, 0.038177490234375, 0.04736328125, 0.056549072265625, 0.06573486328125, 0.074920654296875, 0.0841064453125, 0.093292236328125, 0.10247802734375, 0.111663818359375, 0.120849609375, 0.130035400390625, 0.13922119140625, 0.148406982421875, 0.1575927734375, 0.166778564453125, 0.17596435546875, 0.185150146484375, 0.1943359375, 0.203521728515625, 0.21270751953125, 0.221893310546875, 0.2310791015625, 0.240264892578125, 0.24945068359375, 0.258636474609375, 0.267822265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 4.0, 12.0, 13.0, 19.0, 32.0, 53.0, 72.0, 143.0, 206.0, 345.0, 632.0, 1248.0, 2414.0, 5123.0, 12081.0, 32206.0, 103575.0, 352478.0, 369565.0, 110855.0, 33900.0, 12887.0, 5369.0, 2510.0, 1214.0, 662.0, 350.0, 205.0, 132.0, 72.0, 52.0, 38.0, 23.0, 9.0, 12.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34912109375, -0.3370933532714844, -0.32506561279296875, -0.3130378723144531, -0.3010101318359375, -0.2889823913574219, -0.27695465087890625, -0.2649269104003906, -0.252899169921875, -0.24087142944335938, -0.22884368896484375, -0.21681594848632812, -0.2047882080078125, -0.19276046752929688, -0.18073272705078125, -0.16870498657226562, -0.15667724609375, -0.14464950561523438, -0.13262176513671875, -0.12059402465820312, -0.1085662841796875, -0.09653854370117188, -0.08451080322265625, -0.07248306274414062, -0.060455322265625, -0.048427581787109375, -0.03639984130859375, -0.024372100830078125, -0.0123443603515625, -0.000316619873046875, 0.01171112060546875, 0.023738861083984375, 0.0357666015625, 0.047794342041015625, 0.05982208251953125, 0.07184982299804688, 0.0838775634765625, 0.09590530395507812, 0.10793304443359375, 0.11996078491210938, 0.131988525390625, 0.14401626586914062, 0.15604400634765625, 0.16807174682617188, 0.1800994873046875, 0.19212722778320312, 0.20415496826171875, 0.21618270874023438, 0.22821044921875, 0.24023818969726562, 0.25226593017578125, 0.2642936706542969, 0.2763214111328125, 0.2883491516113281, 0.30037689208984375, 0.3124046325683594, 0.324432373046875, 0.3364601135253906, 0.34848785400390625, 0.3605155944824219, 0.3725433349609375, 0.3845710754394531, 0.39659881591796875, 0.4086265563964844, 0.420654296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 11.0, 12.0, 8.0, 22.0, 24.0, 27.0, 28.0, 29.0, 40.0, 50.0, 44.0, 64.0, 69.0, 56.0, 55.0, 62.0, 58.0, 46.0, 48.0, 38.0, 44.0, 31.0, 23.0, 19.0, 21.0, 15.0, 14.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3403472900390625, -0.326690673828125, -0.3130340576171875, -0.29937744140625, -0.2857208251953125, -0.272064208984375, -0.2584075927734375, -0.2447509765625, -0.2310943603515625, -0.217437744140625, -0.2037811279296875, -0.19012451171875, -0.1764678955078125, -0.162811279296875, -0.1491546630859375, -0.135498046875, -0.1218414306640625, -0.108184814453125, -0.0945281982421875, -0.08087158203125, -0.0672149658203125, -0.053558349609375, -0.0399017333984375, -0.0262451171875, -0.0125885009765625, 0.001068115234375, 0.0147247314453125, 0.02838134765625, 0.0420379638671875, 0.055694580078125, 0.0693511962890625, 0.0830078125, 0.0966644287109375, 0.110321044921875, 0.1239776611328125, 0.13763427734375, 0.1512908935546875, 0.164947509765625, 0.1786041259765625, 0.1922607421875, 0.2059173583984375, 0.219573974609375, 0.2332305908203125, 0.24688720703125, 0.2605438232421875, 0.274200439453125, 0.2878570556640625, 0.301513671875, 0.3151702880859375, 0.328826904296875, 0.3424835205078125, 0.35614013671875, 0.3697967529296875, 0.383453369140625, 0.3971099853515625, 0.4107666015625, 0.4244232177734375, 0.438079833984375, 0.4517364501953125, 0.46539306640625, 0.4790496826171875, 0.492706298828125, 0.5063629150390625, 0.52001953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 10.0, 16.0, 22.0, 28.0, 50.0, 83.0, 149.0, 242.0, 368.0, 589.0, 950.0, 1699.0, 2945.0, 5148.0, 9861.0, 19688.0, 42038.0, 95770.0, 201597.0, 337507.0, 177032.0, 80781.0, 35898.0, 16738.0, 8540.0, 4492.0, 2576.0, 1409.0, 912.0, 531.0, 329.0, 194.0, 139.0, 76.0, 49.0, 28.0, 16.0, 22.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04888916015625, -0.04737997055053711, -0.04587078094482422, -0.04436159133911133, -0.04285240173339844, -0.04134321212768555, -0.039834022521972656, -0.038324832916259766, -0.036815643310546875, -0.035306453704833984, -0.033797264099121094, -0.0322880744934082, -0.030778884887695312, -0.029269695281982422, -0.02776050567626953, -0.02625131607055664, -0.02474212646484375, -0.02323293685913086, -0.02172374725341797, -0.020214557647705078, -0.018705368041992188, -0.017196178436279297, -0.015686988830566406, -0.014177799224853516, -0.012668609619140625, -0.011159420013427734, -0.009650230407714844, -0.008141040802001953, -0.0066318511962890625, -0.005122661590576172, -0.0036134719848632812, -0.0021042823791503906, -0.0005950927734375, 0.0009140968322753906, 0.0024232864379882812, 0.003932476043701172, 0.0054416656494140625, 0.006950855255126953, 0.008460044860839844, 0.009969234466552734, 0.011478424072265625, 0.012987613677978516, 0.014496803283691406, 0.016005992889404297, 0.017515182495117188, 0.019024372100830078, 0.02053356170654297, 0.02204275131225586, 0.02355194091796875, 0.02506113052368164, 0.02657032012939453, 0.028079509735107422, 0.029588699340820312, 0.031097888946533203, 0.032607078552246094, 0.034116268157958984, 0.035625457763671875, 0.037134647369384766, 0.038643836975097656, 0.04015302658081055, 0.04166221618652344, 0.04317140579223633, 0.04468059539794922, 0.04618978500366211, 0.047698974609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 10.0, 7.0, 9.0, 5.0, 18.0, 17.0, 17.0, 27.0, 32.0, 48.0, 54.0, 48.0, 79.0, 101.0, 106.0, 59.0, 63.0, 62.0, 46.0, 36.0, 21.0, 29.0, 11.0, 14.0, 15.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3947486877441406e-05, -1.3538636267185211e-05, -1.3129785656929016e-05, -1.2720935046672821e-05, -1.2312084436416626e-05, -1.1903233826160431e-05, -1.1494383215904236e-05, -1.108553260564804e-05, -1.0676681995391846e-05, -1.026783138513565e-05, -9.858980774879456e-06, -9.45013016462326e-06, -9.041279554367065e-06, -8.63242894411087e-06, -8.223578333854675e-06, -7.81472772359848e-06, -7.405877113342285e-06, -6.99702650308609e-06, -6.588175892829895e-06, -6.1793252825737e-06, -5.770474672317505e-06, -5.36162406206131e-06, -4.952773451805115e-06, -4.54392284154892e-06, -4.135072231292725e-06, -3.7262216210365295e-06, -3.3173710107803345e-06, -2.9085204005241394e-06, -2.4996697902679443e-06, -2.0908191800117493e-06, -1.6819685697555542e-06, -1.2731179594993591e-06, -8.642673492431641e-07, -4.55416738986969e-07, -4.6566128730773926e-08, 3.6228448152542114e-07, 7.711350917816162e-07, 1.1799857020378113e-06, 1.5888363122940063e-06, 1.9976869225502014e-06, 2.4065375328063965e-06, 2.8153881430625916e-06, 3.2242387533187866e-06, 3.6330893635749817e-06, 4.041939973831177e-06, 4.450790584087372e-06, 4.859641194343567e-06, 5.268491804599762e-06, 5.677342414855957e-06, 6.086193025112152e-06, 6.495043635368347e-06, 6.903894245624542e-06, 7.312744855880737e-06, 7.721595466136932e-06, 8.130446076393127e-06, 8.539296686649323e-06, 8.948147296905518e-06, 9.356997907161713e-06, 9.765848517417908e-06, 1.0174699127674103e-05, 1.0583549737930298e-05, 1.0992400348186493e-05, 1.1401250958442688e-05, 1.1810101568698883e-05, 1.2218952178955078e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 14.0, 11.0, 18.0, 16.0, 25.0, 49.0, 55.0, 83.0, 99.0, 156.0, 245.0, 304.0, 402.0, 630.0, 977.0, 1780.0, 3246.0, 6305.0, 13750.0, 33486.0, 99604.0, 332824.0, 386416.0, 104243.0, 34855.0, 14110.0, 6433.0, 3367.0, 1786.0, 1089.0, 695.0, 483.0, 293.0, 171.0, 138.0, 99.0, 59.0, 50.0, 53.0, 31.0, 19.0, 17.0, 12.0, 14.0, 12.0, 6.0, 5.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.08127689361572266, -0.07856941223144531, -0.07586193084716797, -0.07315444946289062, -0.07044696807861328, -0.06773948669433594, -0.0650320053100586, -0.06232452392578125, -0.059617042541503906, -0.05690956115722656, -0.05420207977294922, -0.051494598388671875, -0.04878711700439453, -0.04607963562011719, -0.043372154235839844, -0.0406646728515625, -0.037957191467285156, -0.03524971008300781, -0.03254222869873047, -0.029834747314453125, -0.02712726593017578, -0.024419784545898438, -0.021712303161621094, -0.01900482177734375, -0.016297340393066406, -0.013589859008789062, -0.010882377624511719, -0.008174896240234375, -0.005467414855957031, -0.0027599334716796875, -5.245208740234375e-05, 0.002655029296875, 0.005362510681152344, 0.008069992065429688, 0.010777473449707031, 0.013484954833984375, 0.01619243621826172, 0.018899917602539062, 0.021607398986816406, 0.02431488037109375, 0.027022361755371094, 0.029729843139648438, 0.03243732452392578, 0.035144805908203125, 0.03785228729248047, 0.04055976867675781, 0.043267250061035156, 0.0459747314453125, 0.048682212829589844, 0.05138969421386719, 0.05409717559814453, 0.056804656982421875, 0.05951213836669922, 0.06221961975097656, 0.0649271011352539, 0.06763458251953125, 0.0703420639038086, 0.07304954528808594, 0.07575702667236328, 0.07846450805664062, 0.08117198944091797, 0.08387947082519531, 0.08658695220947266, 0.08929443359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 14.0, 20.0, 18.0, 25.0, 39.0, 40.0, 67.0, 56.0, 80.0, 124.0, 105.0, 87.0, 73.0, 50.0, 26.0, 31.0, 22.0, 21.0, 11.0, 5.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04836320877075195, -0.046799659729003906, -0.04523611068725586, -0.04367256164550781, -0.042109012603759766, -0.04054546356201172, -0.03898191452026367, -0.037418365478515625, -0.03585481643676758, -0.03429126739501953, -0.032727718353271484, -0.031164169311523438, -0.02960062026977539, -0.028037071228027344, -0.026473522186279297, -0.02490997314453125, -0.023346424102783203, -0.021782875061035156, -0.02021932601928711, -0.018655776977539062, -0.017092227935791016, -0.015528678894042969, -0.013965129852294922, -0.012401580810546875, -0.010838031768798828, -0.009274482727050781, -0.007710933685302734, -0.0061473846435546875, -0.004583835601806641, -0.0030202865600585938, -0.0014567375183105469, 0.0001068115234375, 0.0016703605651855469, 0.0032339096069335938, 0.004797458648681641, 0.0063610076904296875, 0.007924556732177734, 0.009488105773925781, 0.011051654815673828, 0.012615203857421875, 0.014178752899169922, 0.01574230194091797, 0.017305850982666016, 0.018869400024414062, 0.02043294906616211, 0.021996498107910156, 0.023560047149658203, 0.02512359619140625, 0.026687145233154297, 0.028250694274902344, 0.02981424331665039, 0.03137779235839844, 0.032941341400146484, 0.03450489044189453, 0.03606843948364258, 0.037631988525390625, 0.03919553756713867, 0.04075908660888672, 0.042322635650634766, 0.04388618469238281, 0.04544973373413086, 0.047013282775878906, 0.04857683181762695, 0.050140380859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 16.0, 31.0, 74.0, 119.0, 200.0, 192.0, 148.0, 96.0, 61.0, 34.0, 10.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0467673540115356, -1.007058024406433, -0.9673486351966858, -0.9276392459869385, -0.8879299163818359, -0.8482205271720886, -0.8085111379623413, -0.7688018083572388, -0.7290924191474915, -0.6893830299377441, -0.6496737003326416, -0.6099643111228943, -0.570254921913147, -0.5305455923080444, -0.4908362030982971, -0.4511268436908722, -0.41141748428344727, -0.37170812487602234, -0.3319987654685974, -0.2922893762588501, -0.25258001685142517, -0.21287065744400024, -0.17316128313541412, -0.133451908826828, -0.09374254941940308, -0.05403318256139755, -0.014323815703392029, 0.025385551154613495, 0.06509491801261902, 0.10480427742004395, 0.14451365172863007, 0.1842230260372162, 0.22393250465393066, 0.2636418640613556, 0.3033512234687805, 0.34306061267852783, 0.38276997208595276, 0.4224793314933777, 0.462188720703125, 0.5018980503082275, 0.5416074395179749, 0.5813168287277222, 0.6210261583328247, 0.660735547542572, 0.7004449367523193, 0.7401542663574219, 0.7798636555671692, 0.8195730447769165, 0.859282374382019, 0.8989917635917664, 0.9387010931968689, 0.9784104824066162, 1.0181198120117188, 1.0578291416168213, 1.0975385904312134, 1.137247920036316, 1.176957368850708, 1.2166666984558105, 1.2563761472702026, 1.2960854768753052, 1.3357948064804077, 1.3755042552947998, 1.4152135848999023, 1.4549229145050049, 1.4946322441101074]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 6.0, 6.0, 17.0, 17.0, 18.0, 17.0, 26.0, 22.0, 28.0, 40.0, 24.0, 35.0, 52.0, 41.0, 36.0, 55.0, 50.0, 50.0, 35.0, 40.0, 47.0, 31.0, 34.0, 26.0, 36.0, 30.0, 26.0, 24.0, 14.0, 21.0, 16.0, 13.0, 16.0, 7.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6149052381515503, -0.5975620746612549, -0.5802189111709595, -0.5628758072853088, -0.5455326437950134, -0.528189480304718, -0.5108463168144226, -0.4935031533241272, -0.4761600196361542, -0.45881685614585876, -0.44147372245788574, -0.42413055896759033, -0.4067873954772949, -0.3894442617893219, -0.3721010982990265, -0.35475796461105347, -0.33741480112075806, -0.32007163763046265, -0.3027285039424896, -0.2853853404521942, -0.2680422067642212, -0.2506990432739258, -0.23335587978363037, -0.21601273119449615, -0.19866958260536194, -0.18132643401622772, -0.1639832854270935, -0.1466401219367981, -0.12929697334766388, -0.11195382475852966, -0.09461066871881485, -0.07726751267910004, -0.05992436408996582, -0.042581211775541306, -0.02523805946111679, -0.007894907146692276, 0.009448245167732239, 0.026791393756866455, 0.04413454979658127, 0.06147770583629608, 0.0788208544254303, 0.09616400301456451, 0.11350715905427933, 0.13085031509399414, 0.14819346368312836, 0.16553661227226257, 0.18287977576255798, 0.2002229243516922, 0.21756607294082642, 0.23490922152996063, 0.25225237011909485, 0.26959553360939026, 0.2869386672973633, 0.3042818307876587, 0.3216249942779541, 0.3389681577682495, 0.35631129145622253, 0.37365445494651794, 0.39099758863449097, 0.4083407521247864, 0.4256839156150818, 0.4430270493030548, 0.4603702127933502, 0.47771334648132324, 0.49505650997161865]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 17.0, 18.0, 20.0, 23.0, 41.0, 43.0, 52.0, 61.0, 94.0, 150.0, 178.0, 255.0, 320.0, 482.0, 841.0, 1347.0, 2506.0, 4625.0, 1021404.0, 8392.0, 4050.0, 2072.0, 1191.0, 787.0, 469.0, 280.0, 203.0, 162.0, 98.0, 101.0, 72.0, 47.0, 38.0, 35.0, 29.0, 18.0, 25.0, 9.0, 9.0, 5.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.598320722579956, -0.5776081085205078, -0.5568954944610596, -0.5361828804016113, -0.5154702663421631, -0.49475765228271484, -0.474045068025589, -0.45333245396614075, -0.4326198399066925, -0.41190722584724426, -0.391194611787796, -0.3704819977283478, -0.3497694134712219, -0.3290567994117737, -0.30834418535232544, -0.2876315712928772, -0.26691895723342896, -0.2462063431739807, -0.22549372911453247, -0.20478112995624542, -0.18406851589679718, -0.16335590183734894, -0.1426433026790619, -0.12193068861961365, -0.1012180745601654, -0.08050546050071716, -0.05979285389184952, -0.039080243557691574, -0.01836763322353363, 0.002344980835914612, 0.023057587444782257, 0.0437701940536499, 0.06448280811309814, 0.08519542217254639, 0.10590802878141403, 0.12662063539028168, 0.14733324944972992, 0.16804586350917816, 0.1887584626674652, 0.20947107672691345, 0.2301836907863617, 0.25089630484580994, 0.2716089189052582, 0.2923215329647064, 0.3130341172218323, 0.3337467312812805, 0.35445934534072876, 0.375171959400177, 0.39588457345962524, 0.4165971875190735, 0.43730980157852173, 0.45802241563796997, 0.4787350296974182, 0.49944764375686646, 0.5201602578163147, 0.5408728122711182, 0.5615854263305664, 0.5822980403900146, 0.6030106544494629, 0.6237232685089111, 0.6444358825683594, 0.6651484966278076, 0.6858611106872559, 0.7065737247467041, 0.7272863388061523]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 8.0, 8.0, 17.0, 49.0, 110.0, 287.0, 835.0, 2415.0, 51457048.0, 7208.0, 1436.0, 539.0, 218.0, 74.0, 32.0, 19.0, 2.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.43700122833252, -13.050508499145508, -12.664015769958496, -12.277523040771484, -11.891031265258789, -11.504538536071777, -11.118045806884766, -10.731553077697754, -10.345060348510742, -9.95856761932373, -9.572074890136719, -9.185583114624023, -8.799090385437012, -8.41259765625, -8.026104927062988, -7.639612197875977, -7.253120422363281, -6.8666276931762695, -6.480135440826416, -6.093642711639404, -5.707150459289551, -5.320657730102539, -4.934165000915527, -4.547672271728516, -4.161180019378662, -3.7746875286102295, -3.388195037841797, -3.001702308654785, -2.6152098178863525, -2.22871732711792, -1.8422245979309082, -1.4557321071624756, -1.069239616394043, -0.6827470660209656, -0.2962545156478882, 0.09023809432983398, 0.4767305850982666, 0.8632230758666992, 1.249715805053711, 1.6362082958221436, 2.022700786590576, 2.409193277359009, 2.7956857681274414, 3.182178497314453, 3.5686709880828857, 3.9551634788513184, 4.34165620803833, 4.728148460388184, 5.114641189575195, 5.501133918762207, 5.8876261711120605, 6.274118900299072, 6.660611152648926, 7.0471038818359375, 7.433596611022949, 7.820089340209961, 8.206581115722656, 8.593073844909668, 8.97956657409668, 9.366058349609375, 9.752551078796387, 10.139043807983398, 10.52553653717041, 10.912029266357422, 11.298521995544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 26.0, 31.0, 40.0, 80.0, 113.0, 169.0, 290.0, 456.0, 789.0, 1298.0, 2087.0, 3590.0, 5904.0, 9991.0, 17003.0, 28016.0, 46827.0, 75334.0, 119186.0, 182364.0, 260300.0, 349174.0, 981586.0, 2930900.0, 400247.0, 292167.0, 210462.0, 142143.0, 90403.0, 55916.0, 33896.0, 20592.0, 12346.0, 7159.0, 4241.0, 2559.0, 1474.0, 899.0, 537.0, 319.0, 198.0, 112.0, 74.0, 53.0, 19.0, 21.0, 15.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.27587890625, -0.2675666809082031, -0.25925445556640625, -0.2509422302246094, -0.2426300048828125, -0.23431777954101562, -0.22600555419921875, -0.21769332885742188, -0.209381103515625, -0.20106887817382812, -0.19275665283203125, -0.18444442749023438, -0.1761322021484375, -0.16781997680664062, -0.15950775146484375, -0.15119552612304688, -0.14288330078125, -0.13457107543945312, -0.12625885009765625, -0.11794662475585938, -0.1096343994140625, -0.10132217407226562, -0.09300994873046875, -0.08469772338867188, -0.076385498046875, -0.06807327270507812, -0.05976104736328125, -0.051448822021484375, -0.0431365966796875, -0.034824371337890625, -0.02651214599609375, -0.018199920654296875, -0.0098876953125, -0.001575469970703125, 0.00673675537109375, 0.015048980712890625, 0.0233612060546875, 0.031673431396484375, 0.03998565673828125, 0.048297882080078125, 0.056610107421875, 0.06492233276367188, 0.07323455810546875, 0.08154678344726562, 0.0898590087890625, 0.09817123413085938, 0.10648345947265625, 0.11479568481445312, 0.12310791015625, 0.13142013549804688, 0.13973236083984375, 0.14804458618164062, 0.1563568115234375, 0.16466903686523438, 0.17298126220703125, 0.18129348754882812, 0.189605712890625, 0.19791793823242188, 0.20623016357421875, 0.21454238891601562, 0.2228546142578125, 0.23116683959960938, 0.23947906494140625, 0.24779129028320312, 0.256103515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 8.0, 5.0, 9.0, 11.0, 17.0, 14.0, 20.0, 21.0, 31.0, 16.0, 22.0, 41.0, 24.0, 37.0, 43.0, 46.0, 56.0, 83.0, 560.0, 502.0, 58.0, 42.0, 48.0, 30.0, 36.0, 32.0, 30.0, 29.0, 35.0, 15.0, 17.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.619140625, -2.537261962890625, -2.45538330078125, -2.373504638671875, -2.2916259765625, -2.209747314453125, -2.12786865234375, -2.045989990234375, -1.964111328125, -1.882232666015625, -1.80035400390625, -1.718475341796875, -1.6365966796875, -1.554718017578125, -1.47283935546875, -1.390960693359375, -1.30908203125, -1.227203369140625, -1.14532470703125, -1.063446044921875, -0.9815673828125, -0.899688720703125, -0.81781005859375, -0.735931396484375, -0.654052734375, -0.572174072265625, -0.49029541015625, -0.408416748046875, -0.3265380859375, -0.244659423828125, -0.16278076171875, -0.080902099609375, 0.0009765625, 0.082855224609375, 0.16473388671875, 0.246612548828125, 0.3284912109375, 0.410369873046875, 0.49224853515625, 0.574127197265625, 0.656005859375, 0.737884521484375, 0.81976318359375, 0.901641845703125, 0.9835205078125, 1.065399169921875, 1.14727783203125, 1.229156494140625, 1.31103515625, 1.392913818359375, 1.47479248046875, 1.556671142578125, 1.6385498046875, 1.720428466796875, 1.80230712890625, 1.884185791015625, 1.966064453125, 2.047943115234375, 2.12982177734375, 2.211700439453125, 2.2935791015625, 2.375457763671875, 2.45733642578125, 2.539215087890625, 2.62109375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 9.0, 8.0, 8.0, 23.0, 41.0, 69.0, 105.0, 126.0, 207.0, 404.0, 626.0, 1020.0, 1639.0, 2763.0, 4350.0, 7211.0, 11875.0, 18737.0, 29771.0, 46302.0, 69195.0, 102150.0, 142590.0, 193614.0, 244099.0, 290772.0, 721321.0, 3048997.0, 330798.0, 269988.0, 219103.0, 168145.0, 122947.0, 85462.0, 57096.0, 37135.0, 23672.0, 15004.0, 9398.0, 5662.0, 3393.0, 2095.0, 1357.0, 837.0, 501.0, 319.0, 196.0, 137.0, 62.0, 36.0, 14.0, 18.0, 10.0, 7.0, 5.0, 3.0, 7.0], "bins": [-0.184814453125, -0.17942047119140625, -0.1740264892578125, -0.16863250732421875, -0.163238525390625, -0.15784454345703125, -0.1524505615234375, -0.14705657958984375, -0.14166259765625, -0.13626861572265625, -0.1308746337890625, -0.12548065185546875, -0.120086669921875, -0.11469268798828125, -0.1092987060546875, -0.10390472412109375, -0.0985107421875, -0.09311676025390625, -0.0877227783203125, -0.08232879638671875, -0.076934814453125, -0.07154083251953125, -0.0661468505859375, -0.06075286865234375, -0.05535888671875, -0.04996490478515625, -0.0445709228515625, -0.03917694091796875, -0.033782958984375, -0.02838897705078125, -0.0229949951171875, -0.01760101318359375, -0.01220703125, -0.00681304931640625, -0.0014190673828125, 0.00397491455078125, 0.009368896484375, 0.01476287841796875, 0.0201568603515625, 0.02555084228515625, 0.03094482421875, 0.03633880615234375, 0.0417327880859375, 0.04712677001953125, 0.052520751953125, 0.05791473388671875, 0.0633087158203125, 0.06870269775390625, 0.0740966796875, 0.07949066162109375, 0.0848846435546875, 0.09027862548828125, 0.095672607421875, 0.10106658935546875, 0.1064605712890625, 0.11185455322265625, 0.11724853515625, 0.12264251708984375, 0.1280364990234375, 0.13343048095703125, 0.138824462890625, 0.14421844482421875, 0.1496124267578125, 0.15500640869140625, 0.160400390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 2.0, 4.0, 9.0, 16.0, 9.0, 16.0, 16.0, 20.0, 21.0, 18.0, 17.0, 30.0, 31.0, 38.0, 29.0, 44.0, 31.0, 30.0, 53.0, 484.0, 595.0, 61.0, 48.0, 40.0, 41.0, 36.0, 38.0, 28.0, 33.0, 27.0, 21.0, 19.0, 11.0, 21.0, 24.0, 15.0, 10.0, 3.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98968505859375, -1.9188232421875, -1.84796142578125, -1.777099609375, -1.70623779296875, -1.6353759765625, -1.56451416015625, -1.49365234375, -1.42279052734375, -1.3519287109375, -1.28106689453125, -1.210205078125, -1.13934326171875, -1.0684814453125, -0.99761962890625, -0.9267578125, -0.85589599609375, -0.7850341796875, -0.71417236328125, -0.643310546875, -0.57244873046875, -0.5015869140625, -0.43072509765625, -0.35986328125, -0.28900146484375, -0.2181396484375, -0.14727783203125, -0.076416015625, -0.00555419921875, 0.0653076171875, 0.13616943359375, 0.20703125, 0.27789306640625, 0.3487548828125, 0.41961669921875, 0.490478515625, 0.56134033203125, 0.6322021484375, 0.70306396484375, 0.77392578125, 0.84478759765625, 0.9156494140625, 0.98651123046875, 1.057373046875, 1.12823486328125, 1.1990966796875, 1.26995849609375, 1.3408203125, 1.41168212890625, 1.4825439453125, 1.55340576171875, 1.624267578125, 1.69512939453125, 1.7659912109375, 1.83685302734375, 1.90771484375, 1.97857666015625, 2.0494384765625, 2.12030029296875, 2.191162109375, 2.26202392578125, 2.3328857421875, 2.40374755859375, 2.474609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 17.0, 18.0, 41.0, 55.0, 65.0, 91.0, 136.0, 143.0, 218.0, 301.0, 404.0, 527.0, 759.0, 1052.0, 1574.0, 2616.0, 4539.0, 8963.0, 17606.0, 35698.0, 72037.0, 145264.0, 5531812.0, 276233.0, 93245.0, 47226.0, 23388.0, 11646.0, 6079.0, 3302.0, 2035.0, 1286.0, 855.0, 596.0, 424.0, 285.0, 226.0, 168.0, 125.0, 95.0, 57.0, 51.0, 44.0, 32.0, 19.0, 12.0, 14.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.72900390625, -0.7067108154296875, -0.684417724609375, -0.6621246337890625, -0.63983154296875, -0.6175384521484375, -0.595245361328125, -0.5729522705078125, -0.5506591796875, -0.5283660888671875, -0.506072998046875, -0.4837799072265625, -0.46148681640625, -0.4391937255859375, -0.416900634765625, -0.3946075439453125, -0.372314453125, -0.3500213623046875, -0.327728271484375, -0.3054351806640625, -0.28314208984375, -0.2608489990234375, -0.238555908203125, -0.2162628173828125, -0.1939697265625, -0.1716766357421875, -0.149383544921875, -0.1270904541015625, -0.10479736328125, -0.0825042724609375, -0.060211181640625, -0.0379180908203125, -0.015625, 0.0066680908203125, 0.028961181640625, 0.0512542724609375, 0.07354736328125, 0.0958404541015625, 0.118133544921875, 0.1404266357421875, 0.1627197265625, 0.1850128173828125, 0.207305908203125, 0.2295989990234375, 0.25189208984375, 0.2741851806640625, 0.296478271484375, 0.3187713623046875, 0.341064453125, 0.3633575439453125, 0.385650634765625, 0.4079437255859375, 0.43023681640625, 0.4525299072265625, 0.474822998046875, 0.4971160888671875, 0.5194091796875, 0.5417022705078125, 0.563995361328125, 0.5862884521484375, 0.60858154296875, 0.6308746337890625, 0.653167724609375, 0.6754608154296875, 0.69775390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 13.0, 9.0, 13.0, 25.0, 36.0, 39.0, 38.0, 37.0, 44.0, 42.0, 39.0, 42.0, 98.0, 1012.0, 62.0, 58.0, 44.0, 48.0, 49.0, 40.0, 30.0, 25.0, 19.0, 29.0, 24.0, 21.0, 16.0, 7.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -3.0069580078125, -2.914306640625, -2.8216552734375, -2.72900390625, -2.6363525390625, -2.543701171875, -2.4510498046875, -2.3583984375, -2.2657470703125, -2.173095703125, -2.0804443359375, -1.98779296875, -1.8951416015625, -1.802490234375, -1.7098388671875, -1.6171875, -1.5245361328125, -1.431884765625, -1.3392333984375, -1.24658203125, -1.1539306640625, -1.061279296875, -0.9686279296875, -0.8759765625, -0.7833251953125, -0.690673828125, -0.5980224609375, -0.50537109375, -0.4127197265625, -0.320068359375, -0.2274169921875, -0.134765625, -0.0421142578125, 0.050537109375, 0.1431884765625, 0.23583984375, 0.3284912109375, 0.421142578125, 0.5137939453125, 0.6064453125, 0.6990966796875, 0.791748046875, 0.8843994140625, 0.97705078125, 1.0697021484375, 1.162353515625, 1.2550048828125, 1.34765625, 1.4403076171875, 1.532958984375, 1.6256103515625, 1.71826171875, 1.8109130859375, 1.903564453125, 1.9962158203125, 2.0888671875, 2.1815185546875, 2.274169921875, 2.3668212890625, 2.45947265625, 2.5521240234375, 2.644775390625, 2.7374267578125, 2.830078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 15.0, 19.0, 35.0, 80.0, 170.0, 284.0, 210.0, 100.0, 49.0, 23.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.863334655761719, -15.454010009765625, -15.044686317443848, -14.635361671447754, -14.22603702545166, -13.816713333129883, -13.407388687133789, -12.998064041137695, -12.588739395141602, -12.179414749145508, -11.77009105682373, -11.360766410827637, -10.951441764831543, -10.542118072509766, -10.132793426513672, -9.723468780517578, -9.3141450881958, -8.904820442199707, -8.49549674987793, -8.086172103881836, -7.676847457885742, -7.267523288726807, -6.858199119567871, -6.448874473571777, -6.039550304412842, -5.630226135253906, -5.2209014892578125, -4.811577320098877, -4.402253150939941, -3.9929285049438477, -3.583604335784912, -3.1742799282073975, -2.764955520629883, -2.355631113052368, -1.946306824684143, -1.536982536315918, -1.1276581287384033, -0.7183337211608887, -0.3090095520019531, 0.10031485557556152, 0.5096392631530762, 0.918963611125946, 1.328287959098816, 1.737612247467041, 2.1469366550445557, 2.5562610626220703, 2.965585231781006, 3.3749096393585205, 3.784234046936035, 4.193558216094971, 4.6028828620910645, 5.01220703125, 5.421531677246094, 5.830855846405029, 6.240180015563965, 6.649504661560059, 7.058828830718994, 7.46815299987793, 7.877477645874023, 8.286802291870117, 8.696125984191895, 9.105450630187988, 9.514774322509766, 9.92409896850586, 10.333423614501953]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 0.0, 4.0, 6.0, 7.0, 12.0, 8.0, 11.0, 12.0, 20.0, 20.0, 33.0, 28.0, 33.0, 34.0, 43.0, 53.0, 60.0, 68.0, 85.0, 49.0, 65.0, 58.0, 52.0, 37.0, 26.0, 27.0, 22.0, 22.0, 15.0, 14.0, 9.0, 12.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0], "bins": [-10.555952072143555, -10.27237606048584, -9.988801002502441, -9.705224990844727, -9.421649932861328, -9.138073921203613, -8.854498863220215, -8.5709228515625, -8.287347793579102, -8.003771781921387, -7.720196723937988, -7.436621189117432, -7.153045654296875, -6.86946964263916, -6.5858941078186035, -6.302318572998047, -6.018742561340332, -5.735167026519775, -5.451591491699219, -5.168015956878662, -4.8844404220581055, -4.600864410400391, -4.317288875579834, -4.033713340759277, -3.7501378059387207, -3.466562271118164, -3.1829867362976074, -2.8994109630584717, -2.615835428237915, -2.3322598934173584, -2.0486841201782227, -1.765108585357666, -1.4815325736999512, -1.1979570388793945, -0.9143813848495483, -0.6308057904243469, -0.3472301959991455, -0.06365466117858887, 0.21992099285125732, 0.5034966468811035, 0.7870721817016602, 1.0706477165222168, 1.354223370552063, 1.6377990245819092, 1.9213745594024658, 2.2049500942230225, 2.488525867462158, 2.772101402282715, 3.0556769371032715, 3.339252471923828, 3.6228280067443848, 3.9064037799835205, 4.189979553222656, 4.473554611206055, 4.7571306228637695, 5.040706157684326, 5.324281692504883, 5.6078572273254395, 5.891432762145996, 6.175008296966553, 6.458583831787109, 6.742159843444824, 7.025735378265381, 7.3093109130859375, 7.592886447906494]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 3.0, 12.0, 6.0, 16.0, 10.0, 28.0, 50.0, 53.0, 93.0, 107.0, 169.0, 271.0, 530.0, 845.0, 1435.0, 2789.0, 5394.0, 12519.0, 39522.0, 3574427.0, 498296.0, 34967.0, 11670.0, 5179.0, 2553.0, 1339.0, 762.0, 444.0, 289.0, 173.0, 94.0, 73.0, 41.0, 41.0, 21.0, 15.0, 12.0, 7.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07900810241699219, -0.07653427124023438, -0.07406044006347656, -0.07158660888671875, -0.06911277770996094, -0.06663894653320312, -0.06416511535644531, -0.0616912841796875, -0.05921745300292969, -0.056743621826171875, -0.05426979064941406, -0.05179595947265625, -0.04932212829589844, -0.046848297119140625, -0.04437446594238281, -0.041900634765625, -0.03942680358886719, -0.036952972412109375, -0.03447914123535156, -0.03200531005859375, -0.029531478881835938, -0.027057647705078125, -0.024583816528320312, -0.0221099853515625, -0.019636154174804688, -0.017162322998046875, -0.014688491821289062, -0.01221466064453125, -0.009740829467773438, -0.007266998291015625, -0.0047931671142578125, -0.0023193359375, 0.0001544952392578125, 0.002628326416015625, 0.0051021575927734375, 0.00757598876953125, 0.010049819946289062, 0.012523651123046875, 0.014997482299804688, 0.0174713134765625, 0.019945144653320312, 0.022418975830078125, 0.024892807006835938, 0.02736663818359375, 0.029840469360351562, 0.032314300537109375, 0.03478813171386719, 0.037261962890625, 0.03973579406738281, 0.042209625244140625, 0.04468345642089844, 0.04715728759765625, 0.04963111877441406, 0.052104949951171875, 0.05457878112792969, 0.0570526123046875, 0.05952644348144531, 0.062000274658203125, 0.06447410583496094, 0.06694793701171875, 0.06942176818847656, 0.07189559936523438, 0.07436943054199219, 0.07684326171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 5.0, 5.0, 9.0, 4.0, 7.0, 9.0, 11.0, 18.0, 19.0, 30.0, 63.0, 439.0, 168.0, 52.0, 30.0, 17.0, 8.0, 10.0, 13.0, 12.0, 6.0, 3.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0225067138671875, -0.021802902221679688, -0.021099090576171875, -0.020395278930664062, -0.01969146728515625, -0.018987655639648438, -0.018283843994140625, -0.017580032348632812, -0.016876220703125, -0.016172409057617188, -0.015468597412109375, -0.014764785766601562, -0.01406097412109375, -0.013357162475585938, -0.012653350830078125, -0.011949539184570312, -0.0112457275390625, -0.010541915893554688, -0.009838104248046875, -0.009134292602539062, -0.00843048095703125, -0.0077266693115234375, -0.007022857666015625, -0.0063190460205078125, -0.005615234375, -0.0049114227294921875, -0.004207611083984375, -0.0035037994384765625, -0.00279998779296875, -0.0020961761474609375, -0.001392364501953125, -0.0006885528564453125, 1.52587890625e-05, 0.0007190704345703125, 0.001422882080078125, 0.0021266937255859375, 0.00283050537109375, 0.0035343170166015625, 0.004238128662109375, 0.0049419403076171875, 0.005645751953125, 0.0063495635986328125, 0.007053375244140625, 0.0077571868896484375, 0.00846099853515625, 0.009164810180664062, 0.009868621826171875, 0.010572433471679688, 0.0112762451171875, 0.011980056762695312, 0.012683868408203125, 0.013387680053710938, 0.01409149169921875, 0.014795303344726562, 0.015499114990234375, 0.016202926635742188, 0.01690673828125, 0.017610549926757812, 0.018314361572265625, 0.019018173217773438, 0.01972198486328125, 0.020425796508789062, 0.021129608154296875, 0.021833419799804688, 0.0225372314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 15.0, 15.0, 19.0, 36.0, 63.0, 72.0, 158.0, 327.0, 636.0, 1399.0, 3245.0, 8679.0, 25848.0, 100798.0, 696303.0, 3055694.0, 229680.0, 48530.0, 14202.0, 4795.0, 1952.0, 867.0, 400.0, 219.0, 93.0, 61.0, 38.0, 28.0, 14.0, 16.0, 8.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.055891990661621094, -0.05404472351074219, -0.05219745635986328, -0.050350189208984375, -0.04850292205810547, -0.04665565490722656, -0.044808387756347656, -0.04296112060546875, -0.041113853454589844, -0.03926658630371094, -0.03741931915283203, -0.035572052001953125, -0.03372478485107422, -0.03187751770019531, -0.030030250549316406, -0.0281829833984375, -0.026335716247558594, -0.024488449096679688, -0.02264118194580078, -0.020793914794921875, -0.01894664764404297, -0.017099380493164062, -0.015252113342285156, -0.01340484619140625, -0.011557579040527344, -0.009710311889648438, -0.007863044738769531, -0.006015777587890625, -0.004168510437011719, -0.0023212432861328125, -0.00047397613525390625, 0.001373291015625, 0.0032205581665039062, 0.0050678253173828125, 0.006915092468261719, 0.008762359619140625, 0.010609626770019531, 0.012456893920898438, 0.014304161071777344, 0.01615142822265625, 0.017998695373535156, 0.019845962524414062, 0.02169322967529297, 0.023540496826171875, 0.02538776397705078, 0.027235031127929688, 0.029082298278808594, 0.0309295654296875, 0.032776832580566406, 0.03462409973144531, 0.03647136688232422, 0.038318634033203125, 0.04016590118408203, 0.04201316833496094, 0.043860435485839844, 0.04570770263671875, 0.047554969787597656, 0.04940223693847656, 0.05124950408935547, 0.053096771240234375, 0.05494403839111328, 0.05679130554199219, 0.058638572692871094, 0.06048583984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 10.0, 6.0, 6.0, 19.0, 16.0, 24.0, 16.0, 22.0, 33.0, 48.0, 68.0, 91.0, 91.0, 174.0, 253.0, 498.0, 1151.0, 672.0, 266.0, 148.0, 104.0, 76.0, 56.0, 45.0, 38.0, 24.0, 25.0, 18.0, 13.0, 12.0, 7.0, 5.0, 2.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.0283660888671875, -0.02761244773864746, -0.026858806610107422, -0.026105165481567383, -0.025351524353027344, -0.024597883224487305, -0.023844242095947266, -0.023090600967407227, -0.022336959838867188, -0.02158331871032715, -0.02082967758178711, -0.02007603645324707, -0.01932239532470703, -0.018568754196166992, -0.017815113067626953, -0.017061471939086914, -0.016307830810546875, -0.015554189682006836, -0.014800548553466797, -0.014046907424926758, -0.013293266296386719, -0.01253962516784668, -0.01178598403930664, -0.011032342910766602, -0.010278701782226562, -0.009525060653686523, -0.008771419525146484, -0.008017778396606445, -0.007264137268066406, -0.006510496139526367, -0.005756855010986328, -0.005003213882446289, -0.00424957275390625, -0.003495931625366211, -0.002742290496826172, -0.001988649368286133, -0.0012350082397460938, -0.0004813671112060547, 0.0002722740173339844, 0.0010259151458740234, 0.0017795562744140625, 0.0025331974029541016, 0.0032868385314941406, 0.00404047966003418, 0.004794120788574219, 0.005547761917114258, 0.006301403045654297, 0.007055044174194336, 0.007808685302734375, 0.008562326431274414, 0.009315967559814453, 0.010069608688354492, 0.010823249816894531, 0.01157689094543457, 0.01233053207397461, 0.013084173202514648, 0.013837814331054688, 0.014591455459594727, 0.015345096588134766, 0.016098737716674805, 0.016852378845214844, 0.017606019973754883, 0.018359661102294922, 0.01911330223083496, 0.019866943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 14.0, 47.0, 151.0, 350.0, 310.0, 100.0, 22.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3096752166748047, -0.2989852726459503, -0.28829532861709595, -0.27760541439056396, -0.2669154703617096, -0.2562255263328552, -0.24553558230400085, -0.23484563827514648, -0.2241557091474533, -0.21346576511859894, -0.20277583599090576, -0.1920858919620514, -0.18139594793319702, -0.17070601880550385, -0.16001607477664948, -0.1493261456489563, -0.13863620162010193, -0.12794625759124756, -0.11725632846355438, -0.10656638443470001, -0.09587644785642624, -0.08518651127815247, -0.0744965672492981, -0.06380663067102432, -0.05311669409275055, -0.042426757514476776, -0.031736817210912704, -0.021046876907348633, -0.01035694032907486, 0.0003329962491989136, 0.011022940278053284, 0.021712876856327057, 0.03240281343460083, 0.0430927500128746, 0.053782690316438675, 0.06447263062000275, 0.07516256719827652, 0.08585250377655029, 0.09654244780540466, 0.10723238438367844, 0.11792232096195221, 0.12861226499080658, 0.13930219411849976, 0.14999213814735413, 0.1606820821762085, 0.17137201130390167, 0.18206195533275604, 0.19275188446044922, 0.2034418284893036, 0.21413177251815796, 0.22482170164585114, 0.2355116456747055, 0.24620157480239868, 0.25689151883125305, 0.2675814628601074, 0.2782714068889618, 0.28896135091781616, 0.29965129494667053, 0.3103412389755249, 0.3210311532020569, 0.33172109723091125, 0.3424110412597656, 0.35310098528862, 0.36379092931747437, 0.37448084354400635]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 12.0, 22.0, 30.0, 30.0, 32.0, 37.0, 36.0, 37.0, 61.0, 77.0, 62.0, 86.0, 66.0, 65.0, 63.0, 45.0, 51.0, 41.0, 28.0, 21.0, 21.0, 18.0, 7.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12411165237426758, -0.11969789862632751, -0.11528414487838745, -0.11087039113044739, -0.10645663738250732, -0.10204288363456726, -0.0976291373372078, -0.09321538358926773, -0.08880162984132767, -0.0843878760933876, -0.07997412234544754, -0.07556036859750748, -0.07114662230014801, -0.06673286855220795, -0.06231911480426788, -0.05790536105632782, -0.053491607308387756, -0.04907785356044769, -0.04466409981250763, -0.040250349789857864, -0.0358365960419178, -0.03142284229397774, -0.027009090408682823, -0.02259533852338791, -0.018181584775447845, -0.013767831958830357, -0.009354079142212868, -0.004940326325595379, -0.00052657350897789, 0.0038871802389621735, 0.008300932124257088, 0.012714684009552002, 0.017128437757492065, 0.02154219150543213, 0.025955943390727043, 0.030369695276021957, 0.03478344902396202, 0.039197202771902084, 0.04361095279455185, 0.04802470654249191, 0.052438460290431976, 0.05685221403837204, 0.0612659677863121, 0.06567972153425217, 0.07009346783161163, 0.0745072215795517, 0.07892097532749176, 0.08333472907543182, 0.08774848282337189, 0.09216223657131195, 0.09657599031925201, 0.10098974406719208, 0.10540349781513214, 0.1098172515630722, 0.11423099786043167, 0.11864475160837173, 0.1230585053563118, 0.12747225165367126, 0.13188600540161133, 0.1362997591495514, 0.14071351289749146, 0.14512726664543152, 0.14954102039337158, 0.15395477414131165, 0.1583685278892517]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 10.0, 17.0, 23.0, 43.0, 38.0, 65.0, 78.0, 114.0, 181.0, 222.0, 352.0, 509.0, 640.0, 958.0, 1420.0, 2085.0, 3103.0, 4908.0, 7685.0, 13055.0, 23888.0, 56305.0, 718165.0, 134916.0, 34425.0, 17270.0, 9911.0, 6130.0, 3800.0, 2560.0, 1687.0, 1258.0, 808.0, 541.0, 386.0, 278.0, 217.0, 146.0, 104.0, 70.0, 50.0, 30.0, 24.0, 24.0, 17.0, 11.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0806884765625, -0.07822418212890625, -0.0757598876953125, -0.07329559326171875, -0.070831298828125, -0.06836700439453125, -0.0659027099609375, -0.06343841552734375, -0.06097412109375, -0.05850982666015625, -0.0560455322265625, -0.05358123779296875, -0.051116943359375, -0.04865264892578125, -0.0461883544921875, -0.04372406005859375, -0.041259765625, -0.03879547119140625, -0.0363311767578125, -0.03386688232421875, -0.031402587890625, -0.02893829345703125, -0.0264739990234375, -0.02400970458984375, -0.02154541015625, -0.01908111572265625, -0.0166168212890625, -0.01415252685546875, -0.011688232421875, -0.00922393798828125, -0.0067596435546875, -0.00429534912109375, -0.0018310546875, 0.00063323974609375, 0.0030975341796875, 0.00556182861328125, 0.008026123046875, 0.01049041748046875, 0.0129547119140625, 0.01541900634765625, 0.01788330078125, 0.02034759521484375, 0.0228118896484375, 0.02527618408203125, 0.027740478515625, 0.03020477294921875, 0.0326690673828125, 0.03513336181640625, 0.03759765625, 0.04006195068359375, 0.0425262451171875, 0.04499053955078125, 0.047454833984375, 0.04991912841796875, 0.0523834228515625, 0.05484771728515625, 0.05731201171875, 0.05977630615234375, 0.0622406005859375, 0.06470489501953125, 0.067169189453125, 0.06963348388671875, 0.0720977783203125, 0.07456207275390625, 0.0770263671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 14.0, 8.0, 21.0, 27.0, 49.0, 179.0, 395.0, 88.0, 35.0, 27.0, 17.0, 8.0, 10.0, 12.0, 7.0, 8.0, 4.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.023895263671875, -0.023179292678833008, -0.022463321685791016, -0.021747350692749023, -0.02103137969970703, -0.02031540870666504, -0.019599437713623047, -0.018883466720581055, -0.018167495727539062, -0.01745152473449707, -0.016735553741455078, -0.016019582748413086, -0.015303611755371094, -0.014587640762329102, -0.01387166976928711, -0.013155698776245117, -0.012439727783203125, -0.011723756790161133, -0.01100778579711914, -0.010291814804077148, -0.009575843811035156, -0.008859872817993164, -0.008143901824951172, -0.00742793083190918, -0.0067119598388671875, -0.005995988845825195, -0.005280017852783203, -0.004564046859741211, -0.0038480758666992188, -0.0031321048736572266, -0.0024161338806152344, -0.0017001628875732422, -0.00098419189453125, -0.0002682209014892578, 0.0004477500915527344, 0.0011637210845947266, 0.0018796920776367188, 0.002595663070678711, 0.003311634063720703, 0.004027605056762695, 0.0047435760498046875, 0.00545954704284668, 0.006175518035888672, 0.006891489028930664, 0.007607460021972656, 0.008323431015014648, 0.00903940200805664, 0.009755373001098633, 0.010471343994140625, 0.011187314987182617, 0.01190328598022461, 0.012619256973266602, 0.013335227966308594, 0.014051198959350586, 0.014767169952392578, 0.01548314094543457, 0.016199111938476562, 0.016915082931518555, 0.017631053924560547, 0.01834702491760254, 0.01906299591064453, 0.019778966903686523, 0.020494937896728516, 0.021210908889770508, 0.0219268798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 10.0, 6.0, 15.0, 13.0, 32.0, 41.0, 53.0, 74.0, 127.0, 166.0, 299.0, 566.0, 1166.0, 2743.0, 6846.0, 19184.0, 62834.0, 245335.0, 491939.0, 152666.0, 41298.0, 13608.0, 5198.0, 2133.0, 978.0, 484.0, 251.0, 138.0, 107.0, 69.0, 48.0, 40.0, 23.0, 18.0, 18.0, 7.0, 13.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06565380096435547, -0.06355857849121094, -0.061463356018066406, -0.059368133544921875, -0.057272911071777344, -0.05517768859863281, -0.05308246612548828, -0.05098724365234375, -0.04889202117919922, -0.04679679870605469, -0.044701576232910156, -0.042606353759765625, -0.040511131286621094, -0.03841590881347656, -0.03632068634033203, -0.0342254638671875, -0.03213024139404297, -0.030035018920898438, -0.027939796447753906, -0.025844573974609375, -0.023749351501464844, -0.021654129028320312, -0.01955890655517578, -0.01746368408203125, -0.015368461608886719, -0.013273239135742188, -0.011178016662597656, -0.009082794189453125, -0.006987571716308594, -0.0048923492431640625, -0.0027971267700195312, -0.000701904296875, 0.0013933181762695312, 0.0034885406494140625, 0.005583763122558594, 0.007678985595703125, 0.009774208068847656, 0.011869430541992188, 0.013964653015136719, 0.01605987548828125, 0.01815509796142578, 0.020250320434570312, 0.022345542907714844, 0.024440765380859375, 0.026535987854003906, 0.028631210327148438, 0.03072643280029297, 0.0328216552734375, 0.03491687774658203, 0.03701210021972656, 0.039107322692871094, 0.041202545166015625, 0.043297767639160156, 0.04539299011230469, 0.04748821258544922, 0.04958343505859375, 0.05167865753173828, 0.05377388000488281, 0.055869102478027344, 0.057964324951171875, 0.060059547424316406, 0.06215476989746094, 0.06424999237060547, 0.06634521484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 7.0, 9.0, 14.0, 20.0, 19.0, 31.0, 28.0, 43.0, 41.0, 36.0, 43.0, 51.0, 44.0, 48.0, 52.0, 58.0, 52.0, 41.0, 40.0, 39.0, 29.0, 39.0, 32.0, 19.0, 26.0, 20.0, 20.0, 19.0, 11.0, 13.0, 11.0, 6.0, 10.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10394287109375, -0.1006765365600586, -0.09741020202636719, -0.09414386749267578, -0.09087753295898438, -0.08761119842529297, -0.08434486389160156, -0.08107852935791016, -0.07781219482421875, -0.07454586029052734, -0.07127952575683594, -0.06801319122314453, -0.06474685668945312, -0.06148052215576172, -0.05821418762207031, -0.054947853088378906, -0.0516815185546875, -0.048415184020996094, -0.04514884948730469, -0.04188251495361328, -0.038616180419921875, -0.03534984588623047, -0.03208351135253906, -0.028817176818847656, -0.02555084228515625, -0.022284507751464844, -0.019018173217773438, -0.01575183868408203, -0.012485504150390625, -0.009219169616699219, -0.0059528350830078125, -0.0026865005493164062, 0.000579833984375, 0.0038461685180664062, 0.0071125030517578125, 0.010378837585449219, 0.013645172119140625, 0.01691150665283203, 0.020177841186523438, 0.023444175720214844, 0.02671051025390625, 0.029976844787597656, 0.03324317932128906, 0.03650951385498047, 0.039775848388671875, 0.04304218292236328, 0.04630851745605469, 0.049574851989746094, 0.0528411865234375, 0.056107521057128906, 0.05937385559082031, 0.06264019012451172, 0.06590652465820312, 0.06917285919189453, 0.07243919372558594, 0.07570552825927734, 0.07897186279296875, 0.08223819732666016, 0.08550453186035156, 0.08877086639404297, 0.09203720092773438, 0.09530353546142578, 0.09856986999511719, 0.1018362045288086, 0.1051025390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 10.0, 13.0, 14.0, 28.0, 30.0, 38.0, 59.0, 82.0, 119.0, 188.0, 274.0, 412.0, 659.0, 1197.0, 2343.0, 5048.0, 13056.0, 49009.0, 410631.0, 483938.0, 55844.0, 14437.0, 5299.0, 2516.0, 1275.0, 732.0, 462.0, 275.0, 171.0, 111.0, 76.0, 71.0, 33.0, 37.0, 7.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06402587890625, -0.062198638916015625, -0.06037139892578125, -0.058544158935546875, -0.0567169189453125, -0.054889678955078125, -0.05306243896484375, -0.051235198974609375, -0.049407958984375, -0.047580718994140625, -0.04575347900390625, -0.043926239013671875, -0.0420989990234375, -0.040271759033203125, -0.03844451904296875, -0.036617279052734375, -0.0347900390625, -0.032962799072265625, -0.03113555908203125, -0.029308319091796875, -0.0274810791015625, -0.025653839111328125, -0.02382659912109375, -0.021999359130859375, -0.020172119140625, -0.018344879150390625, -0.01651763916015625, -0.014690399169921875, -0.0128631591796875, -0.011035919189453125, -0.00920867919921875, -0.007381439208984375, -0.00555419921875, -0.003726959228515625, -0.00189971923828125, -7.2479248046875e-05, 0.0017547607421875, 0.003582000732421875, 0.00540924072265625, 0.007236480712890625, 0.009063720703125, 0.010890960693359375, 0.01271820068359375, 0.014545440673828125, 0.0163726806640625, 0.018199920654296875, 0.02002716064453125, 0.021854400634765625, 0.023681640625, 0.025508880615234375, 0.02733612060546875, 0.029163360595703125, 0.0309906005859375, 0.032817840576171875, 0.03464508056640625, 0.036472320556640625, 0.038299560546875, 0.040126800537109375, 0.04195404052734375, 0.043781280517578125, 0.0456085205078125, 0.047435760498046875, 0.04926300048828125, 0.051090240478515625, 0.05291748046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 2.0, 8.0, 9.0, 17.0, 12.0, 20.0, 30.0, 17.0, 30.0, 40.0, 47.0, 58.0, 69.0, 64.0, 69.0, 66.0, 78.0, 76.0, 53.0, 27.0, 34.0, 34.0, 21.0, 21.0, 19.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6716461181640625e-05, -3.569386899471283e-05, -3.4671276807785034e-05, -3.364868462085724e-05, -3.262609243392944e-05, -3.160350024700165e-05, -3.058090806007385e-05, -2.9558315873146057e-05, -2.8535723686218262e-05, -2.7513131499290466e-05, -2.649053931236267e-05, -2.5467947125434875e-05, -2.444535493850708e-05, -2.3422762751579285e-05, -2.240017056465149e-05, -2.1377578377723694e-05, -2.03549861907959e-05, -1.9332394003868103e-05, -1.8309801816940308e-05, -1.7287209630012512e-05, -1.6264617443084717e-05, -1.5242025256156921e-05, -1.4219433069229126e-05, -1.319684088230133e-05, -1.2174248695373535e-05, -1.115165650844574e-05, -1.0129064321517944e-05, -9.106472134590149e-06, -8.083879947662354e-06, -7.061287760734558e-06, -6.038695573806763e-06, -5.016103386878967e-06, -3.993511199951172e-06, -2.9709190130233765e-06, -1.948326826095581e-06, -9.257346391677856e-07, 9.685754776000977e-08, 1.1194497346878052e-06, 2.1420419216156006e-06, 3.164634108543396e-06, 4.187226295471191e-06, 5.209818482398987e-06, 6.232410669326782e-06, 7.255002856254578e-06, 8.277595043182373e-06, 9.300187230110168e-06, 1.0322779417037964e-05, 1.134537160396576e-05, 1.2367963790893555e-05, 1.339055597782135e-05, 1.4413148164749146e-05, 1.543574035167694e-05, 1.6458332538604736e-05, 1.7480924725532532e-05, 1.8503516912460327e-05, 1.9526109099388123e-05, 2.0548701286315918e-05, 2.1571293473243713e-05, 2.259388566017151e-05, 2.3616477847099304e-05, 2.46390700340271e-05, 2.5661662220954895e-05, 2.668425440788269e-05, 2.7706846594810486e-05, 2.872943878173828e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 26.0, 29.0, 44.0, 64.0, 112.0, 222.0, 371.0, 803.0, 1736.0, 4696.0, 17187.0, 112636.0, 727424.0, 152853.0, 20949.0, 5502.0, 2009.0, 856.0, 412.0, 210.0, 123.0, 83.0, 52.0, 41.0, 16.0, 15.0, 15.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055389404296875, -0.053304195404052734, -0.05121898651123047, -0.0491337776184082, -0.04704856872558594, -0.04496335983276367, -0.042878150939941406, -0.04079294204711914, -0.038707733154296875, -0.03662252426147461, -0.034537315368652344, -0.03245210647583008, -0.030366897583007812, -0.028281688690185547, -0.02619647979736328, -0.024111270904541016, -0.02202606201171875, -0.019940853118896484, -0.01785564422607422, -0.015770435333251953, -0.013685226440429688, -0.011600017547607422, -0.009514808654785156, -0.007429599761962891, -0.005344390869140625, -0.0032591819763183594, -0.0011739730834960938, 0.0009112358093261719, 0.0029964447021484375, 0.005081653594970703, 0.007166862487792969, 0.009252071380615234, 0.0113372802734375, 0.013422489166259766, 0.015507698059082031, 0.017592906951904297, 0.019678115844726562, 0.021763324737548828, 0.023848533630371094, 0.02593374252319336, 0.028018951416015625, 0.03010416030883789, 0.032189369201660156, 0.03427457809448242, 0.03635978698730469, 0.03844499588012695, 0.04053020477294922, 0.042615413665771484, 0.04470062255859375, 0.046785831451416016, 0.04887104034423828, 0.05095624923706055, 0.05304145812988281, 0.05512666702270508, 0.057211875915527344, 0.05929708480834961, 0.061382293701171875, 0.06346750259399414, 0.0655527114868164, 0.06763792037963867, 0.06972312927246094, 0.0718083381652832, 0.07389354705810547, 0.07597875595092773, 0.07806396484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 10.0, 6.0, 7.0, 21.0, 20.0, 22.0, 32.0, 40.0, 48.0, 50.0, 56.0, 77.0, 66.0, 79.0, 77.0, 66.0, 65.0, 42.0, 44.0, 31.0, 24.0, 23.0, 17.0, 12.0, 3.0, 7.0, 12.0, 5.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032379150390625, -0.031101703643798828, -0.029824256896972656, -0.028546810150146484, -0.027269363403320312, -0.02599191665649414, -0.02471446990966797, -0.023437023162841797, -0.022159576416015625, -0.020882129669189453, -0.01960468292236328, -0.01832723617553711, -0.017049789428710938, -0.015772342681884766, -0.014494895935058594, -0.013217449188232422, -0.01194000244140625, -0.010662555694580078, -0.009385108947753906, -0.008107662200927734, -0.0068302154541015625, -0.005552768707275391, -0.004275321960449219, -0.002997875213623047, -0.001720428466796875, -0.0004429817199707031, 0.0008344650268554688, 0.0021119117736816406, 0.0033893585205078125, 0.004666805267333984, 0.005944252014160156, 0.007221698760986328, 0.0084991455078125, 0.009776592254638672, 0.011054039001464844, 0.012331485748291016, 0.013608932495117188, 0.01488637924194336, 0.01616382598876953, 0.017441272735595703, 0.018718719482421875, 0.019996166229248047, 0.02127361297607422, 0.02255105972290039, 0.023828506469726562, 0.025105953216552734, 0.026383399963378906, 0.027660846710205078, 0.02893829345703125, 0.030215740203857422, 0.031493186950683594, 0.032770633697509766, 0.03404808044433594, 0.03532552719116211, 0.03660297393798828, 0.03788042068481445, 0.039157867431640625, 0.0404353141784668, 0.04171276092529297, 0.04299020767211914, 0.04426765441894531, 0.045545101165771484, 0.046822547912597656, 0.04809999465942383, 0.04937744140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 16.0, 15.0, 30.0, 75.0, 153.0, 248.0, 213.0, 124.0, 55.0, 28.0, 15.0, 11.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48074230551719666, -0.4563523232936859, -0.4319623112678528, -0.40757232904434204, -0.3831823468208313, -0.35879236459732056, -0.3344023525714874, -0.3100123703479767, -0.28562235832214355, -0.2612323760986328, -0.23684237897396088, -0.21245238184928894, -0.1880623996257782, -0.16367240250110626, -0.13928240537643433, -0.11489242315292358, -0.09050244092941284, -0.0661124512553215, -0.041722457855939865, -0.017332464456558228, 0.007057525217533112, 0.03144751489162445, 0.05583751201629639, 0.08022749423980713, 0.10461749136447906, 0.129007488489151, 0.15339747071266174, 0.17778746783733368, 0.20217746496200562, 0.22656744718551636, 0.2509574294090271, 0.27534741163253784, 0.2997373938560486, 0.3241273760795593, 0.34851738810539246, 0.3729073703289032, 0.39729735255241394, 0.42168736457824707, 0.4460773468017578, 0.47046732902526855, 0.4948573112487793, 0.51924729347229, 0.5436372756958008, 0.5680272579193115, 0.592417299747467, 0.6168072819709778, 0.6411972641944885, 0.6655872464179993, 0.6899772882461548, 0.7143672704696655, 0.7387572526931763, 0.763147234916687, 0.7875372767448425, 0.8119272589683533, 0.836317241191864, 0.8607072234153748, 0.8850972056388855, 0.9094871878623962, 0.933877170085907, 0.9582672119140625, 0.9826571941375732, 1.007047176361084, 1.0314371585845947, 1.0558271408081055, 1.0802171230316162]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 14.0, 24.0, 33.0, 49.0, 76.0, 135.0, 184.0, 145.0, 103.0, 75.0, 39.0, 16.0, 12.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.504492998123169, -1.4502655267715454, -1.3960381746292114, -1.341810703277588, -1.287583351135254, -1.2333558797836304, -1.1791284084320068, -1.1249010562896729, -1.0706737041473389, -1.0164462327957153, -0.9622188806533813, -0.9079914093017578, -0.8537640571594238, -0.7995365858078003, -0.7453091740608215, -0.6910817623138428, -0.6368542909622192, -0.5826268792152405, -0.5283994674682617, -0.47417202591896057, -0.4199446141719818, -0.36571720242500305, -0.3114897608757019, -0.25726234912872314, -0.20303493738174438, -0.14880752563476562, -0.09458009898662567, -0.04035267233848572, 0.013874739408493042, 0.0681021511554718, 0.12232959270477295, 0.1765570044517517, 0.23078429698944092, 0.2850117087364197, 0.33923912048339844, 0.3934665620326996, 0.44769397377967834, 0.5019214153289795, 0.5561488270759583, 0.610376238822937, 0.6646036505699158, 0.7188310623168945, 0.7730584740638733, 0.827285885810852, 0.8815133571624756, 0.9357407093048096, 0.9899681806564331, 1.0441956520080566, 1.0984230041503906, 1.1526504755020142, 1.2068778276443481, 1.2611052989959717, 1.3153326511383057, 1.3695601224899292, 1.4237875938415527, 1.4780149459838867, 1.5322422981262207, 1.5864697694778442, 1.6406971216201782, 1.6949245929718018, 1.7491519451141357, 1.8033794164657593, 1.8576068878173828, 1.9118342399597168, 1.9660617113113403]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 1.0, 11.0, 21.0, 24.0, 27.0, 37.0, 56.0, 91.0, 115.0, 191.0, 275.0, 419.0, 726.0, 1367.0, 2560.0, 5466.0, 14162.0, 56692.0, 3786349.0, 270691.0, 33308.0, 11213.0, 4703.0, 2427.0, 1362.0, 768.0, 410.0, 280.0, 170.0, 120.0, 58.0, 46.0, 30.0, 23.0, 20.0, 22.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2022705078125, -0.1964588165283203, -0.19064712524414062, -0.18483543395996094, -0.17902374267578125, -0.17321205139160156, -0.16740036010742188, -0.1615886688232422, -0.1557769775390625, -0.1499652862548828, -0.14415359497070312, -0.13834190368652344, -0.13253021240234375, -0.12671852111816406, -0.12090682983398438, -0.11509513854980469, -0.109283447265625, -0.10347175598144531, -0.09766006469726562, -0.09184837341308594, -0.08603668212890625, -0.08022499084472656, -0.07441329956054688, -0.06860160827636719, -0.0627899169921875, -0.05697822570800781, -0.051166534423828125, -0.04535484313964844, -0.03954315185546875, -0.03373146057128906, -0.027919769287109375, -0.022108078002929688, -0.01629638671875, -0.010484695434570312, -0.004673004150390625, 0.0011386871337890625, 0.00695037841796875, 0.012762069702148438, 0.018573760986328125, 0.024385452270507812, 0.0301971435546875, 0.03600883483886719, 0.041820526123046875, 0.04763221740722656, 0.05344390869140625, 0.05925559997558594, 0.06506729125976562, 0.07087898254394531, 0.076690673828125, 0.08250236511230469, 0.08831405639648438, 0.09412574768066406, 0.09993743896484375, 0.10574913024902344, 0.11156082153320312, 0.11737251281738281, 0.1231842041015625, 0.1289958953857422, 0.13480758666992188, 0.14061927795410156, 0.14643096923828125, 0.15224266052246094, 0.15805435180664062, 0.1638660430908203, 0.169677734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 7.0, 2.0, 6.0, 7.0, 8.0, 20.0, 15.0, 26.0, 49.0, 127.0, 237.0, 203.0, 108.0, 45.0, 33.0, 21.0, 15.0, 3.0, 12.0, 6.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023956298828125, -0.023235797882080078, -0.022515296936035156, -0.021794795989990234, -0.021074295043945312, -0.02035379409790039, -0.01963329315185547, -0.018912792205810547, -0.018192291259765625, -0.017471790313720703, -0.01675128936767578, -0.01603078842163086, -0.015310287475585938, -0.014589786529541016, -0.013869285583496094, -0.013148784637451172, -0.01242828369140625, -0.011707782745361328, -0.010987281799316406, -0.010266780853271484, -0.009546279907226562, -0.00882577896118164, -0.008105278015136719, -0.007384777069091797, -0.006664276123046875, -0.005943775177001953, -0.005223274230957031, -0.004502773284912109, -0.0037822723388671875, -0.0030617713928222656, -0.0023412704467773438, -0.0016207695007324219, -0.0009002685546875, -0.00017976760864257812, 0.0005407333374023438, 0.0012612342834472656, 0.0019817352294921875, 0.0027022361755371094, 0.0034227371215820312, 0.004143238067626953, 0.004863739013671875, 0.005584239959716797, 0.006304740905761719, 0.007025241851806641, 0.0077457427978515625, 0.008466243743896484, 0.009186744689941406, 0.009907245635986328, 0.01062774658203125, 0.011348247528076172, 0.012068748474121094, 0.012789249420166016, 0.013509750366210938, 0.01423025131225586, 0.014950752258300781, 0.015671253204345703, 0.016391754150390625, 0.017112255096435547, 0.01783275604248047, 0.01855325698852539, 0.019273757934570312, 0.019994258880615234, 0.020714759826660156, 0.021435260772705078, 0.02215576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 10.0, 3.0, 19.0, 22.0, 44.0, 44.0, 81.0, 135.0, 186.0, 357.0, 721.0, 1593.0, 4453.0, 14727.0, 71676.0, 1194717.0, 2791547.0, 88040.0, 16903.0, 5187.0, 1929.0, 819.0, 432.0, 227.0, 139.0, 77.0, 49.0, 52.0, 25.0, 20.0, 12.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.14980125427246094, -0.14481735229492188, -0.1398334503173828, -0.13484954833984375, -0.1298656463623047, -0.12488174438476562, -0.11989784240722656, -0.1149139404296875, -0.10993003845214844, -0.10494613647460938, -0.09996223449707031, -0.09497833251953125, -0.08999443054199219, -0.08501052856445312, -0.08002662658691406, -0.075042724609375, -0.07005882263183594, -0.06507492065429688, -0.06009101867675781, -0.05510711669921875, -0.05012321472167969, -0.045139312744140625, -0.04015541076660156, -0.0351715087890625, -0.030187606811523438, -0.025203704833984375, -0.020219802856445312, -0.01523590087890625, -0.010251998901367188, -0.005268096923828125, -0.0002841949462890625, 0.00469970703125, 0.009683609008789062, 0.014667510986328125, 0.019651412963867188, 0.02463531494140625, 0.029619216918945312, 0.034603118896484375, 0.03958702087402344, 0.0445709228515625, 0.04955482482910156, 0.054538726806640625, 0.05952262878417969, 0.06450653076171875, 0.06949043273925781, 0.07447433471679688, 0.07945823669433594, 0.084442138671875, 0.08942604064941406, 0.09440994262695312, 0.09939384460449219, 0.10437774658203125, 0.10936164855957031, 0.11434555053710938, 0.11932945251464844, 0.1243133544921875, 0.12929725646972656, 0.13428115844726562, 0.1392650604248047, 0.14424896240234375, 0.1492328643798828, 0.15421676635742188, 0.15920066833496094, 0.1641845703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 12.0, 16.0, 31.0, 28.0, 59.0, 83.0, 151.0, 274.0, 654.0, 1814.0, 453.0, 165.0, 103.0, 55.0, 34.0, 19.0, 20.0, 21.0, 6.0, 8.0, 10.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02874755859375, -0.02780008316040039, -0.02685260772705078, -0.025905132293701172, -0.024957656860351562, -0.024010181427001953, -0.023062705993652344, -0.022115230560302734, -0.021167755126953125, -0.020220279693603516, -0.019272804260253906, -0.018325328826904297, -0.017377853393554688, -0.016430377960205078, -0.015482902526855469, -0.01453542709350586, -0.01358795166015625, -0.01264047622680664, -0.011693000793457031, -0.010745525360107422, -0.009798049926757812, -0.008850574493408203, -0.007903099060058594, -0.006955623626708984, -0.006008148193359375, -0.005060672760009766, -0.004113197326660156, -0.003165721893310547, -0.0022182464599609375, -0.0012707710266113281, -0.00032329559326171875, 0.0006241798400878906, 0.0015716552734375, 0.0025191307067871094, 0.0034666061401367188, 0.004414081573486328, 0.0053615570068359375, 0.006309032440185547, 0.007256507873535156, 0.008203983306884766, 0.009151458740234375, 0.010098934173583984, 0.011046409606933594, 0.011993885040283203, 0.012941360473632812, 0.013888835906982422, 0.014836311340332031, 0.01578378677368164, 0.01673126220703125, 0.01767873764038086, 0.01862621307373047, 0.019573688507080078, 0.020521163940429688, 0.021468639373779297, 0.022416114807128906, 0.023363590240478516, 0.024311065673828125, 0.025258541107177734, 0.026206016540527344, 0.027153491973876953, 0.028100967407226562, 0.029048442840576172, 0.02999591827392578, 0.03094339370727539, 0.031890869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 9.0, 19.0, 70.0, 206.0, 328.0, 238.0, 72.0, 34.0, 18.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16206994652748108, -0.15288899838924408, -0.1437080353498459, -0.1345270872116089, -0.1253461241722107, -0.1161651760339737, -0.1069842278957367, -0.0978032723069191, -0.0886223167181015, -0.0794413611292839, -0.07026040554046631, -0.06107945740222931, -0.05189850181341171, -0.042717546224594116, -0.03353659436106682, -0.02435564249753952, -0.015174686908721924, -0.005993733182549477, 0.0031872205436229706, 0.012368174269795418, 0.021549127995967865, 0.03073008358478546, 0.03991103544831276, 0.04909198731184006, 0.058272942900657654, 0.06745389848947525, 0.07663485407829285, 0.08581580221652985, 0.09499675780534744, 0.10417771339416504, 0.11335866153240204, 0.12253961712121964, 0.13172060251235962, 0.14090155065059662, 0.1500825136899948, 0.1592634618282318, 0.16844442486763, 0.177625373005867, 0.186806321144104, 0.1959872841835022, 0.2051682323217392, 0.2143491804599762, 0.2235301434993744, 0.2327110916376114, 0.2418920397758484, 0.2510730028152466, 0.2602539658546448, 0.2694348990917206, 0.2786158621311188, 0.28779682517051697, 0.2969777584075928, 0.30615872144699097, 0.31533968448638916, 0.32452064752578735, 0.33370158076286316, 0.34288254380226135, 0.35206347703933716, 0.36124444007873535, 0.37042537331581116, 0.37960633635520935, 0.38878729939460754, 0.39796823263168335, 0.40714919567108154, 0.41633015871047974, 0.42551112174987793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 17.0, 15.0, 26.0, 39.0, 34.0, 64.0, 42.0, 53.0, 42.0, 66.0, 59.0, 63.0, 59.0, 66.0, 52.0, 55.0, 44.0, 19.0, 29.0, 18.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099323034286499, -0.10628964006900787, -0.10264697670936584, -0.09900431334972382, -0.09536164999008179, -0.09171898663043976, -0.08807633072137833, -0.0844336673617363, -0.08079100400209427, -0.07714834064245224, -0.07350567728281021, -0.06986301392316818, -0.06622035801410675, -0.06257769465446472, -0.05893503129482269, -0.055292367935180664, -0.051649704575538635, -0.048007041215896606, -0.04436437785625458, -0.04072171822190285, -0.03707905486226082, -0.03343639150261879, -0.02979373000562191, -0.02615106850862503, -0.022508405148983, -0.018865741789340973, -0.015223080292344093, -0.011580417864024639, -0.007937755435705185, -0.004295092076063156, -0.0006524305790662766, 0.002990230917930603, 0.006632894277572632, 0.010275556705892086, 0.01391821913421154, 0.01756088063120842, 0.02120354399085045, 0.024846207350492477, 0.028488868847489357, 0.03213153034448624, 0.035774193704128265, 0.039416857063770294, 0.04305952042341232, 0.04670218005776405, 0.05034484341740608, 0.05398750677704811, 0.05763016641139984, 0.06127282977104187, 0.0649154931306839, 0.06855815649032593, 0.07220081984996796, 0.07584348320960999, 0.07948614656925201, 0.08312880992889404, 0.08677146583795547, 0.0904141291975975, 0.09405679255723953, 0.09769945591688156, 0.10134211927652359, 0.10498478263616562, 0.10862743854522705, 0.11227010190486908, 0.11591276526451111, 0.11955542862415314, 0.12319809198379517]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 9.0, 7.0, 13.0, 7.0, 20.0, 24.0, 40.0, 44.0, 67.0, 68.0, 102.0, 141.0, 232.0, 327.0, 454.0, 664.0, 989.0, 1458.0, 2444.0, 4106.0, 6912.0, 13391.0, 28538.0, 84743.0, 525136.0, 278415.0, 53481.0, 21099.0, 10471.0, 5726.0, 3341.0, 1983.0, 1304.0, 831.0, 605.0, 441.0, 249.0, 164.0, 126.0, 115.0, 75.0, 52.0, 39.0, 27.0, 20.0, 13.0, 13.0, 10.0, 3.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08332633972167969, -0.08053207397460938, -0.07773780822753906, -0.07494354248046875, -0.07214927673339844, -0.06935501098632812, -0.06656074523925781, -0.0637664794921875, -0.06097221374511719, -0.058177947998046875, -0.05538368225097656, -0.05258941650390625, -0.04979515075683594, -0.047000885009765625, -0.04420661926269531, -0.041412353515625, -0.03861808776855469, -0.035823822021484375, -0.03302955627441406, -0.03023529052734375, -0.027441024780273438, -0.024646759033203125, -0.021852493286132812, -0.0190582275390625, -0.016263961791992188, -0.013469696044921875, -0.010675430297851562, -0.00788116455078125, -0.0050868988037109375, -0.002292633056640625, 0.0005016326904296875, 0.0032958984375, 0.0060901641845703125, 0.008884429931640625, 0.011678695678710938, 0.01447296142578125, 0.017267227172851562, 0.020061492919921875, 0.022855758666992188, 0.0256500244140625, 0.028444290161132812, 0.031238555908203125, 0.03403282165527344, 0.03682708740234375, 0.03962135314941406, 0.042415618896484375, 0.04520988464355469, 0.048004150390625, 0.05079841613769531, 0.053592681884765625, 0.05638694763183594, 0.05918121337890625, 0.06197547912597656, 0.06476974487304688, 0.06756401062011719, 0.0703582763671875, 0.07315254211425781, 0.07594680786132812, 0.07874107360839844, 0.08153533935546875, 0.08432960510253906, 0.08712387084960938, 0.08991813659667969, 0.09271240234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 12.0, 16.0, 15.0, 30.0, 37.0, 71.0, 132.0, 224.0, 169.0, 106.0, 52.0, 27.0, 21.0, 10.0, 12.0, 10.0, 7.0, 9.0, 3.0, 6.0, 1.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.02212667465209961, -0.02141094207763672, -0.020695209503173828, -0.019979476928710938, -0.019263744354248047, -0.018548011779785156, -0.017832279205322266, -0.017116546630859375, -0.016400814056396484, -0.015685081481933594, -0.014969348907470703, -0.014253616333007812, -0.013537883758544922, -0.012822151184082031, -0.01210641860961914, -0.01139068603515625, -0.01067495346069336, -0.009959220886230469, -0.009243488311767578, -0.008527755737304688, -0.007812023162841797, -0.007096290588378906, -0.006380558013916016, -0.005664825439453125, -0.004949092864990234, -0.004233360290527344, -0.003517627716064453, -0.0028018951416015625, -0.002086162567138672, -0.0013704299926757812, -0.0006546974182128906, 6.103515625e-05, 0.0007767677307128906, 0.0014925003051757812, 0.002208232879638672, 0.0029239654541015625, 0.003639698028564453, 0.004355430603027344, 0.005071163177490234, 0.005786895751953125, 0.006502628326416016, 0.007218360900878906, 0.007934093475341797, 0.008649826049804688, 0.009365558624267578, 0.010081291198730469, 0.01079702377319336, 0.01151275634765625, 0.01222848892211914, 0.012944221496582031, 0.013659954071044922, 0.014375686645507812, 0.015091419219970703, 0.015807151794433594, 0.016522884368896484, 0.017238616943359375, 0.017954349517822266, 0.018670082092285156, 0.019385814666748047, 0.020101547241210938, 0.020817279815673828, 0.02153301239013672, 0.02224874496459961, 0.0229644775390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 11.0, 9.0, 22.0, 24.0, 37.0, 46.0, 65.0, 85.0, 142.0, 254.0, 422.0, 765.0, 1273.0, 2724.0, 5852.0, 15100.0, 46549.0, 179485.0, 480183.0, 225930.0, 58014.0, 18188.0, 6823.0, 2950.0, 1506.0, 811.0, 420.0, 268.0, 165.0, 132.0, 63.0, 60.0, 34.0, 34.0, 24.0, 18.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.060211181640625, -0.05817556381225586, -0.05613994598388672, -0.05410432815551758, -0.05206871032714844, -0.0500330924987793, -0.047997474670410156, -0.045961856842041016, -0.043926239013671875, -0.041890621185302734, -0.039855003356933594, -0.03781938552856445, -0.03578376770019531, -0.03374814987182617, -0.03171253204345703, -0.02967691421508789, -0.02764129638671875, -0.02560567855834961, -0.02357006072998047, -0.021534442901611328, -0.019498825073242188, -0.017463207244873047, -0.015427589416503906, -0.013391971588134766, -0.011356353759765625, -0.009320735931396484, -0.007285118103027344, -0.005249500274658203, -0.0032138824462890625, -0.0011782646179199219, 0.0008573532104492188, 0.0028929710388183594, 0.0049285888671875, 0.006964206695556641, 0.008999824523925781, 0.011035442352294922, 0.013071060180664062, 0.015106678009033203, 0.017142295837402344, 0.019177913665771484, 0.021213531494140625, 0.023249149322509766, 0.025284767150878906, 0.027320384979248047, 0.029356002807617188, 0.03139162063598633, 0.03342723846435547, 0.03546285629272461, 0.03749847412109375, 0.03953409194946289, 0.04156970977783203, 0.04360532760620117, 0.04564094543457031, 0.04767656326293945, 0.049712181091308594, 0.051747798919677734, 0.053783416748046875, 0.055819034576416016, 0.057854652404785156, 0.0598902702331543, 0.06192588806152344, 0.06396150588989258, 0.06599712371826172, 0.06803274154663086, 0.070068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 6.0, 12.0, 9.0, 16.0, 17.0, 17.0, 24.0, 23.0, 33.0, 31.0, 31.0, 45.0, 32.0, 42.0, 45.0, 52.0, 52.0, 39.0, 48.0, 43.0, 38.0, 39.0, 39.0, 51.0, 36.0, 20.0, 29.0, 27.0, 13.0, 20.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 8.0, 4.0, 7.0, 6.0, 17.0, 29.0, 31.0, 51.0, 83.0, 157.0, 403.0, 1145.0, 4900.0, 36008.0, 757701.0, 230296.0, 13914.0, 2484.0, 666.0, 295.0, 136.0, 81.0, 43.0, 32.0, 20.0, 7.0, 4.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12114906311035156, -0.11583328247070312, -0.11051750183105469, -0.10520172119140625, -0.09988594055175781, -0.09457015991210938, -0.08925437927246094, -0.0839385986328125, -0.07862281799316406, -0.07330703735351562, -0.06799125671386719, -0.06267547607421875, -0.05735969543457031, -0.052043914794921875, -0.04672813415527344, -0.041412353515625, -0.03609657287597656, -0.030780792236328125, -0.025465011596679688, -0.02014923095703125, -0.014833450317382812, -0.009517669677734375, -0.0042018890380859375, 0.0011138916015625, 0.0064296722412109375, 0.011745452880859375, 0.017061233520507812, 0.02237701416015625, 0.027692794799804688, 0.033008575439453125, 0.03832435607910156, 0.04364013671875, 0.04895591735839844, 0.054271697998046875, 0.05958747863769531, 0.06490325927734375, 0.07021903991699219, 0.07553482055664062, 0.08085060119628906, 0.0861663818359375, 0.09148216247558594, 0.09679794311523438, 0.10211372375488281, 0.10742950439453125, 0.11274528503417969, 0.11806106567382812, 0.12337684631347656, 0.128692626953125, 0.13400840759277344, 0.13932418823242188, 0.1446399688720703, 0.14995574951171875, 0.1552715301513672, 0.16058731079101562, 0.16590309143066406, 0.1712188720703125, 0.17653465270996094, 0.18185043334960938, 0.1871662139892578, 0.19248199462890625, 0.1977977752685547, 0.20311355590820312, 0.20842933654785156, 0.2137451171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 14.0, 16.0, 13.0, 22.0, 26.0, 32.0, 45.0, 48.0, 66.0, 85.0, 99.0, 89.0, 86.0, 74.0, 65.0, 37.0, 37.0, 31.0, 27.0, 20.0, 16.0, 8.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.561113357543945e-05, -5.383603274822235e-05, -5.206093192100525e-05, -5.028583109378815e-05, -4.8510730266571045e-05, -4.673562943935394e-05, -4.496052861213684e-05, -4.318542778491974e-05, -4.141032695770264e-05, -3.9635226130485535e-05, -3.786012530326843e-05, -3.608502447605133e-05, -3.430992364883423e-05, -3.2534822821617126e-05, -3.0759721994400024e-05, -2.8984621167182922e-05, -2.720952033996582e-05, -2.5434419512748718e-05, -2.3659318685531616e-05, -2.1884217858314514e-05, -2.0109117031097412e-05, -1.833401620388031e-05, -1.6558915376663208e-05, -1.4783814549446106e-05, -1.3008713722229004e-05, -1.1233612895011902e-05, -9.4585120677948e-06, -7.683411240577698e-06, -5.908310413360596e-06, -4.133209586143494e-06, -2.3581087589263916e-06, -5.830079317092896e-07, 1.1920928955078125e-06, 2.9671937227249146e-06, 4.742294549942017e-06, 6.517395377159119e-06, 8.29249620437622e-06, 1.0067597031593323e-05, 1.1842697858810425e-05, 1.3617798686027527e-05, 1.539289951324463e-05, 1.716800034046173e-05, 1.8943101167678833e-05, 2.0718201994895935e-05, 2.2493302822113037e-05, 2.426840364933014e-05, 2.604350447654724e-05, 2.7818605303764343e-05, 2.9593706130981445e-05, 3.136880695819855e-05, 3.314390778541565e-05, 3.491900861263275e-05, 3.6694109439849854e-05, 3.8469210267066956e-05, 4.024431109428406e-05, 4.201941192150116e-05, 4.379451274871826e-05, 4.5569613575935364e-05, 4.7344714403152466e-05, 4.911981523036957e-05, 5.089491605758667e-05, 5.267001688480377e-05, 5.4445117712020874e-05, 5.6220218539237976e-05, 5.799531936645508e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 17.0, 20.0, 40.0, 58.0, 85.0, 213.0, 371.0, 868.0, 2138.0, 6459.0, 27412.0, 198763.0, 658308.0, 125903.0, 19544.0, 5062.0, 1780.0, 744.0, 354.0, 161.0, 97.0, 49.0, 34.0, 18.0, 17.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1051025390625, -0.10221481323242188, -0.09932708740234375, -0.09643936157226562, -0.0935516357421875, -0.09066390991210938, -0.08777618408203125, -0.08488845825195312, -0.082000732421875, -0.07911300659179688, -0.07622528076171875, -0.07333755493164062, -0.0704498291015625, -0.06756210327148438, -0.06467437744140625, -0.061786651611328125, -0.05889892578125, -0.056011199951171875, -0.05312347412109375, -0.050235748291015625, -0.0473480224609375, -0.044460296630859375, -0.04157257080078125, -0.038684844970703125, -0.035797119140625, -0.032909393310546875, -0.03002166748046875, -0.027133941650390625, -0.0242462158203125, -0.021358489990234375, -0.01847076416015625, -0.015583038330078125, -0.0126953125, -0.009807586669921875, -0.00691986083984375, -0.004032135009765625, -0.0011444091796875, 0.001743316650390625, 0.00463104248046875, 0.007518768310546875, 0.010406494140625, 0.013294219970703125, 0.01618194580078125, 0.019069671630859375, 0.0219573974609375, 0.024845123291015625, 0.02773284912109375, 0.030620574951171875, 0.03350830078125, 0.036396026611328125, 0.03928375244140625, 0.042171478271484375, 0.0450592041015625, 0.047946929931640625, 0.05083465576171875, 0.053722381591796875, 0.056610107421875, 0.059497833251953125, 0.06238555908203125, 0.06527328491210938, 0.0681610107421875, 0.07104873657226562, 0.07393646240234375, 0.07682418823242188, 0.0797119140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 7.0, 11.0, 16.0, 27.0, 35.0, 50.0, 76.0, 117.0, 120.0, 163.0, 124.0, 78.0, 51.0, 38.0, 26.0, 21.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09039306640625, -0.08788681030273438, -0.08538055419921875, -0.08287429809570312, -0.0803680419921875, -0.07786178588867188, -0.07535552978515625, -0.07284927368164062, -0.070343017578125, -0.06783676147460938, -0.06533050537109375, -0.06282424926757812, -0.0603179931640625, -0.057811737060546875, -0.05530548095703125, -0.052799224853515625, -0.05029296875, -0.047786712646484375, -0.04528045654296875, -0.042774200439453125, -0.0402679443359375, -0.037761688232421875, -0.03525543212890625, -0.032749176025390625, -0.030242919921875, -0.027736663818359375, -0.02523040771484375, -0.022724151611328125, -0.0202178955078125, -0.017711639404296875, -0.01520538330078125, -0.012699127197265625, -0.01019287109375, -0.007686614990234375, -0.00518035888671875, -0.002674102783203125, -0.0001678466796875, 0.002338409423828125, 0.00484466552734375, 0.007350921630859375, 0.009857177734375, 0.012363433837890625, 0.01486968994140625, 0.017375946044921875, 0.0198822021484375, 0.022388458251953125, 0.02489471435546875, 0.027400970458984375, 0.0299072265625, 0.032413482666015625, 0.03491973876953125, 0.037425994873046875, 0.0399322509765625, 0.042438507080078125, 0.04494476318359375, 0.047451019287109375, 0.049957275390625, 0.052463531494140625, 0.05496978759765625, 0.057476043701171875, 0.0599822998046875, 0.062488555908203125, 0.06499481201171875, 0.06750106811523438, 0.07000732421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 45.0, 344.0, 462.0, 107.0, 23.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4232504367828369, -0.3711588382720947, -0.3190672695636749, -0.26697567105293274, -0.21488408744335175, -0.16279250383377075, -0.11070090532302856, -0.058609336614608765, -0.006517738103866577, 0.045573849231004715, 0.09766543656587601, 0.1497570276260376, 0.2018486112356186, 0.2539401948451996, 0.3060317933559418, 0.3581233620643616, 0.41021496057510376, 0.46230655908584595, 0.5143981575965881, 0.5664896965026855, 0.6185812950134277, 0.6706728935241699, 0.7227644920349121, 0.7748560905456543, 0.8269476890563965, 0.8790392875671387, 0.9311308860778809, 0.983222484588623, 1.0353140830993652, 1.0874056816101074, 1.1394972801208496, 1.1915887594223022, 1.2436803579330444, 1.2957719564437866, 1.3478635549545288, 1.399955153465271, 1.4520467519760132, 1.5041382312774658, 1.556229829788208, 1.6083214282989502, 1.6604130268096924, 1.7125046253204346, 1.7645962238311768, 1.816687822341919, 1.8687794208526611, 1.9208710193634033, 1.9729626178741455, 2.0250542163848877, 2.07714581489563, 2.129237413406372, 2.1813290119171143, 2.2334206104278564, 2.2855122089385986, 2.337603807449341, 2.389695405960083, 2.441787004470825, 2.4938783645629883, 2.5459699630737305, 2.5980615615844727, 2.650153160095215, 2.702244758605957, 2.754336357116699, 2.8064279556274414, 2.8585195541381836, 2.910611152648926]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 15.0, 11.0, 23.0, 35.0, 44.0, 60.0, 69.0, 97.0, 75.0, 104.0, 85.0, 89.0, 59.0, 55.0, 41.0, 25.0, 22.0, 16.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7189944386482239, -0.696451723575592, -0.6739090085029602, -0.6513662338256836, -0.6288235187530518, -0.6062808036804199, -0.5837380886077881, -0.5611953735351562, -0.5386526584625244, -0.5161099433898926, -0.49356719851493835, -0.4710244834423065, -0.4484817385673523, -0.42593902349472046, -0.4033963084220886, -0.3808535933494568, -0.3583108186721802, -0.33576810359954834, -0.3132253587245941, -0.2906826436519623, -0.26813989877700806, -0.24559718370437622, -0.22305446863174438, -0.20051173865795135, -0.17796900868415833, -0.1554262787103653, -0.13288354873657227, -0.11034083366394043, -0.0877981036901474, -0.06525537371635437, -0.042712658643722534, -0.020169928669929504, 0.0023728609085083008, 0.024915587157011032, 0.04745831340551376, 0.0700010359287262, 0.09254376590251923, 0.11508649587631226, 0.1376292109489441, 0.16017194092273712, 0.18271467089653015, 0.20525740087032318, 0.2278001308441162, 0.25034284591674805, 0.2728855609893799, 0.2954283058643341, 0.31797102093696594, 0.34051376581192017, 0.363056480884552, 0.38559919595718384, 0.40814194083213806, 0.4306846559047699, 0.4532274007797241, 0.47577011585235596, 0.4983128309249878, 0.5208555459976196, 0.5433982610702515, 0.5659409761428833, 0.5884836912155151, 0.611026406288147, 0.6335691809654236, 0.6561118960380554, 0.6786546111106873, 0.7011973261833191, 0.7237401008605957]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 3.0, 13.0, 11.0, 15.0, 25.0, 22.0, 38.0, 37.0, 62.0, 73.0, 101.0, 107.0, 160.0, 235.0, 322.0, 506.0, 829.0, 1438.0, 2797.0, 5954.0, 16258.0, 70799.0, 3752701.0, 287989.0, 32747.0, 10082.0, 4424.0, 2343.0, 1405.0, 887.0, 614.0, 397.0, 293.0, 182.0, 111.0, 101.0, 69.0, 44.0, 29.0, 20.0, 16.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.25048828125, -0.2434844970703125, -0.236480712890625, -0.2294769287109375, -0.22247314453125, -0.2154693603515625, -0.208465576171875, -0.2014617919921875, -0.1944580078125, -0.1874542236328125, -0.180450439453125, -0.1734466552734375, -0.16644287109375, -0.1594390869140625, -0.152435302734375, -0.1454315185546875, -0.138427734375, -0.1314239501953125, -0.124420166015625, -0.1174163818359375, -0.11041259765625, -0.1034088134765625, -0.096405029296875, -0.0894012451171875, -0.0823974609375, -0.0753936767578125, -0.068389892578125, -0.0613861083984375, -0.05438232421875, -0.0473785400390625, -0.040374755859375, -0.0333709716796875, -0.0263671875, -0.0193634033203125, -0.012359619140625, -0.0053558349609375, 0.00164794921875, 0.0086517333984375, 0.015655517578125, 0.0226593017578125, 0.0296630859375, 0.0366668701171875, 0.043670654296875, 0.0506744384765625, 0.05767822265625, 0.0646820068359375, 0.071685791015625, 0.0786895751953125, 0.085693359375, 0.0926971435546875, 0.099700927734375, 0.1067047119140625, 0.11370849609375, 0.1207122802734375, 0.127716064453125, 0.1347198486328125, 0.1417236328125, 0.1487274169921875, 0.155731201171875, 0.1627349853515625, 0.16973876953125, 0.1767425537109375, 0.183746337890625, 0.1907501220703125, 0.19775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 11.0, 18.0, 33.0, 61.0, 101.0, 118.0, 187.0, 170.0, 93.0, 61.0, 29.0, 20.0, 13.0, 7.0, 6.0, 17.0, 4.0, 6.0, 2.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02457261085510254, -0.023846149444580078, -0.023119688034057617, -0.022393226623535156, -0.021666765213012695, -0.020940303802490234, -0.020213842391967773, -0.019487380981445312, -0.01876091957092285, -0.01803445816040039, -0.01730799674987793, -0.01658153533935547, -0.015855073928833008, -0.015128612518310547, -0.014402151107788086, -0.013675689697265625, -0.012949228286743164, -0.012222766876220703, -0.011496305465698242, -0.010769844055175781, -0.01004338264465332, -0.00931692123413086, -0.008590459823608398, -0.007863998413085938, -0.0071375370025634766, -0.006411075592041016, -0.005684614181518555, -0.004958152770996094, -0.004231691360473633, -0.003505229949951172, -0.002778768539428711, -0.00205230712890625, -0.001325845718383789, -0.0005993843078613281, 0.0001270771026611328, 0.0008535385131835938, 0.0015799999237060547, 0.0023064613342285156, 0.0030329227447509766, 0.0037593841552734375, 0.0044858455657958984, 0.005212306976318359, 0.00593876838684082, 0.006665229797363281, 0.007391691207885742, 0.008118152618408203, 0.008844614028930664, 0.009571075439453125, 0.010297536849975586, 0.011023998260498047, 0.011750459671020508, 0.012476921081542969, 0.01320338249206543, 0.01392984390258789, 0.014656305313110352, 0.015382766723632812, 0.016109228134155273, 0.016835689544677734, 0.017562150955200195, 0.018288612365722656, 0.019015073776245117, 0.019741535186767578, 0.02046799659729004, 0.0211944580078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 13.0, 16.0, 26.0, 25.0, 71.0, 117.0, 223.0, 537.0, 1433.0, 5316.0, 26481.0, 338320.0, 3699938.0, 103256.0, 13556.0, 3121.0, 989.0, 368.0, 185.0, 115.0, 56.0, 39.0, 18.0, 9.0, 16.0, 11.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.270263671875, -0.26260948181152344, -0.2549552917480469, -0.2473011016845703, -0.23964691162109375, -0.2319927215576172, -0.22433853149414062, -0.21668434143066406, -0.2090301513671875, -0.20137596130371094, -0.19372177124023438, -0.1860675811767578, -0.17841339111328125, -0.1707592010498047, -0.16310501098632812, -0.15545082092285156, -0.147796630859375, -0.14014244079589844, -0.13248825073242188, -0.12483406066894531, -0.11717987060546875, -0.10952568054199219, -0.10187149047851562, -0.09421730041503906, -0.0865631103515625, -0.07890892028808594, -0.07125473022460938, -0.06360054016113281, -0.05594635009765625, -0.04829216003417969, -0.040637969970703125, -0.03298377990722656, -0.02532958984375, -0.017675399780273438, -0.010021209716796875, -0.0023670196533203125, 0.00528717041015625, 0.012941360473632812, 0.020595550537109375, 0.028249740600585938, 0.0359039306640625, 0.04355812072753906, 0.051212310791015625, 0.05886650085449219, 0.06652069091796875, 0.07417488098144531, 0.08182907104492188, 0.08948326110839844, 0.097137451171875, 0.10479164123535156, 0.11244583129882812, 0.12010002136230469, 0.12775421142578125, 0.1354084014892578, 0.14306259155273438, 0.15071678161621094, 0.1583709716796875, 0.16602516174316406, 0.17367935180664062, 0.1813335418701172, 0.18898773193359375, 0.1966419219970703, 0.20429611206054688, 0.21195030212402344, 0.2196044921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 1.0, 9.0, 5.0, 23.0, 29.0, 23.0, 41.0, 70.0, 73.0, 136.0, 205.0, 395.0, 1474.0, 721.0, 322.0, 170.0, 113.0, 71.0, 35.0, 34.0, 28.0, 8.0, 14.0, 12.0, 13.0, 9.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222320556640625, -0.02136969566345215, -0.020507335662841797, -0.019644975662231445, -0.018782615661621094, -0.017920255661010742, -0.01705789566040039, -0.01619553565979004, -0.015333175659179688, -0.014470815658569336, -0.013608455657958984, -0.012746095657348633, -0.011883735656738281, -0.01102137565612793, -0.010159015655517578, -0.009296655654907227, -0.008434295654296875, -0.0075719356536865234, -0.006709575653076172, -0.00584721565246582, -0.004984855651855469, -0.004122495651245117, -0.0032601356506347656, -0.002397775650024414, -0.0015354156494140625, -0.0006730556488037109, 0.00018930435180664062, 0.0010516643524169922, 0.0019140243530273438, 0.0027763843536376953, 0.003638744354248047, 0.0045011043548583984, 0.00536346435546875, 0.0062258243560791016, 0.007088184356689453, 0.007950544357299805, 0.008812904357910156, 0.009675264358520508, 0.01053762435913086, 0.011399984359741211, 0.012262344360351562, 0.013124704360961914, 0.013987064361572266, 0.014849424362182617, 0.01571178436279297, 0.01657414436340332, 0.017436504364013672, 0.018298864364624023, 0.019161224365234375, 0.020023584365844727, 0.020885944366455078, 0.02174830436706543, 0.02261066436767578, 0.023473024368286133, 0.024335384368896484, 0.025197744369506836, 0.026060104370117188, 0.02692246437072754, 0.02778482437133789, 0.028647184371948242, 0.029509544372558594, 0.030371904373168945, 0.031234264373779297, 0.03209662437438965, 0.032958984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 72.0, 242.0, 314.0, 204.0, 89.0, 30.0, 10.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09958233684301376, -0.08903111517429352, -0.07847990095615387, -0.06792868673801422, -0.057377465069293976, -0.04682624712586403, -0.03627502918243408, -0.025723807513713837, -0.015172593295574188, -0.004621375352144241, 0.005929842591285706, 0.016481060534715652, 0.0270322784781456, 0.037583496421575546, 0.04813471436500549, 0.05868593603372574, 0.06923715025186539, 0.07978837192058563, 0.09033958613872528, 0.10089080035686493, 0.11144202202558517, 0.12199324369430542, 0.13254445791244507, 0.14309567213058472, 0.15364688634872437, 0.164198100566864, 0.17474931478500366, 0.1853005439043045, 0.19585175812244415, 0.2064029723405838, 0.21695420145988464, 0.2275054156780243, 0.23805665969848633, 0.24860787391662598, 0.2591590881347656, 0.2697103023529053, 0.2802615165710449, 0.29081276059150696, 0.3013639748096466, 0.31191518902778625, 0.3224664032459259, 0.33301761746406555, 0.3435688316822052, 0.35412004590034485, 0.3646712899208069, 0.37522250413894653, 0.3857737183570862, 0.39632493257522583, 0.4068761467933655, 0.4174273610115051, 0.4279785752296448, 0.4385297894477844, 0.4490810036659241, 0.4596322476863861, 0.47018346190452576, 0.4807346761226654, 0.49128589034080505, 0.5018371343612671, 0.5123883485794067, 0.5229395627975464, 0.533490777015686, 0.5440419912338257, 0.5545932054519653, 0.565144419670105, 0.5756956338882446]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 0.0, 8.0, 5.0, 6.0, 10.0, 11.0, 14.0, 26.0, 28.0, 33.0, 50.0, 43.0, 52.0, 53.0, 55.0, 64.0, 88.0, 54.0, 64.0, 53.0, 45.0, 50.0, 39.0, 32.0, 27.0, 19.0, 15.0, 10.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.12629568576812744, -0.12237454950809479, -0.11845341324806213, -0.11453226953744888, -0.11061113327741623, -0.10668999701738358, -0.10276885330677032, -0.09884771704673767, -0.09492658078670502, -0.09100544452667236, -0.08708430826663971, -0.08316316455602646, -0.0792420282959938, -0.07532089203596115, -0.0713997483253479, -0.06747861206531525, -0.06355747580528259, -0.05963633954524994, -0.05571519955992699, -0.051794059574604034, -0.04787292331457138, -0.04395178705453873, -0.040030647069215775, -0.03610950708389282, -0.03218837082386017, -0.028267232701182365, -0.024346094578504562, -0.02042495645582676, -0.016503818333148956, -0.012582680210471153, -0.00866154208779335, -0.004740403965115547, -0.0008192658424377441, 0.003101872280240059, 0.007023010402917862, 0.010944148525595665, 0.014865286648273468, 0.01878642477095127, 0.022707562893629074, 0.026628701016306877, 0.03054983913898468, 0.034470975399017334, 0.038392115384340286, 0.04231325536966324, 0.04623439162969589, 0.050155527889728546, 0.0540766678750515, 0.05799780786037445, 0.061918944120407104, 0.06584008038043976, 0.06976121664047241, 0.07368236035108566, 0.07760349661111832, 0.08152463287115097, 0.08544577658176422, 0.08936691284179688, 0.09328804910182953, 0.09720918536186218, 0.10113032162189484, 0.10505146533250809, 0.10897260159254074, 0.1128937378525734, 0.11681488156318665, 0.1207360178232193, 0.12465715408325195]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 10.0, 16.0, 17.0, 39.0, 50.0, 78.0, 85.0, 159.0, 249.0, 388.0, 704.0, 1138.0, 2099.0, 4163.0, 9525.0, 27606.0, 127409.0, 635826.0, 182371.0, 34853.0, 11550.0, 4773.0, 2284.0, 1227.0, 722.0, 423.0, 267.0, 169.0, 107.0, 74.0, 48.0, 34.0, 25.0, 14.0, 8.0, 12.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14125633239746094, -0.13663864135742188, -0.1320209503173828, -0.12740325927734375, -0.12278556823730469, -0.11816787719726562, -0.11355018615722656, -0.1089324951171875, -0.10431480407714844, -0.09969711303710938, -0.09507942199707031, -0.09046173095703125, -0.08584403991699219, -0.08122634887695312, -0.07660865783691406, -0.071990966796875, -0.06737327575683594, -0.06275558471679688, -0.05813789367675781, -0.05352020263671875, -0.04890251159667969, -0.044284820556640625, -0.03966712951660156, -0.0350494384765625, -0.030431747436523438, -0.025814056396484375, -0.021196365356445312, -0.01657867431640625, -0.011960983276367188, -0.007343292236328125, -0.0027256011962890625, 0.00189208984375, 0.0065097808837890625, 0.011127471923828125, 0.015745162963867188, 0.02036285400390625, 0.024980545043945312, 0.029598236083984375, 0.03421592712402344, 0.0388336181640625, 0.04345130920410156, 0.048069000244140625, 0.05268669128417969, 0.05730438232421875, 0.06192207336425781, 0.06653976440429688, 0.07115745544433594, 0.075775146484375, 0.08039283752441406, 0.08501052856445312, 0.08962821960449219, 0.09424591064453125, 0.09886360168457031, 0.10348129272460938, 0.10809898376464844, 0.1127166748046875, 0.11733436584472656, 0.12195205688476562, 0.1265697479248047, 0.13118743896484375, 0.1358051300048828, 0.14042282104492188, 0.14504051208496094, 0.149658203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 7.0, 17.0, 25.0, 34.0, 51.0, 102.0, 126.0, 188.0, 131.0, 103.0, 75.0, 35.0, 27.0, 10.0, 13.0, 11.0, 11.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023699283599853516, -0.02299976348876953, -0.022300243377685547, -0.021600723266601562, -0.020901203155517578, -0.020201683044433594, -0.01950216293334961, -0.018802642822265625, -0.01810312271118164, -0.017403602600097656, -0.016704082489013672, -0.016004562377929688, -0.015305042266845703, -0.014605522155761719, -0.013906002044677734, -0.01320648193359375, -0.012506961822509766, -0.011807441711425781, -0.011107921600341797, -0.010408401489257812, -0.009708881378173828, -0.009009361267089844, -0.00830984115600586, -0.007610321044921875, -0.006910800933837891, -0.006211280822753906, -0.005511760711669922, -0.0048122406005859375, -0.004112720489501953, -0.0034132003784179688, -0.0027136802673339844, -0.00201416015625, -0.0013146400451660156, -0.0006151199340820312, 8.440017700195312e-05, 0.0007839202880859375, 0.0014834403991699219, 0.0021829605102539062, 0.0028824806213378906, 0.003582000732421875, 0.004281520843505859, 0.004981040954589844, 0.005680561065673828, 0.0063800811767578125, 0.007079601287841797, 0.007779121398925781, 0.008478641510009766, 0.00917816162109375, 0.009877681732177734, 0.010577201843261719, 0.011276721954345703, 0.011976242065429688, 0.012675762176513672, 0.013375282287597656, 0.01407480239868164, 0.014774322509765625, 0.01547384262084961, 0.016173362731933594, 0.016872882843017578, 0.017572402954101562, 0.018271923065185547, 0.01897144317626953, 0.019670963287353516, 0.0203704833984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 8.0, 21.0, 29.0, 23.0, 39.0, 57.0, 98.0, 121.0, 179.0, 260.0, 405.0, 647.0, 1173.0, 2587.0, 7146.0, 24591.0, 109258.0, 455568.0, 345090.0, 73038.0, 17991.0, 5412.0, 2035.0, 1041.0, 546.0, 340.0, 243.0, 160.0, 112.0, 75.0, 71.0, 45.0, 30.0, 25.0, 21.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1275634765625, -0.12368202209472656, -0.11980056762695312, -0.11591911315917969, -0.11203765869140625, -0.10815620422363281, -0.10427474975585938, -0.10039329528808594, -0.0965118408203125, -0.09263038635253906, -0.08874893188476562, -0.08486747741699219, -0.08098602294921875, -0.07710456848144531, -0.07322311401367188, -0.06934165954589844, -0.065460205078125, -0.06157875061035156, -0.057697296142578125, -0.05381584167480469, -0.04993438720703125, -0.04605293273925781, -0.042171478271484375, -0.03829002380371094, -0.0344085693359375, -0.030527114868164062, -0.026645660400390625, -0.022764205932617188, -0.01888275146484375, -0.015001296997070312, -0.011119842529296875, -0.0072383880615234375, -0.00335693359375, 0.0005245208740234375, 0.004405975341796875, 0.008287429809570312, 0.01216888427734375, 0.016050338745117188, 0.019931793212890625, 0.023813247680664062, 0.0276947021484375, 0.03157615661621094, 0.035457611083984375, 0.03933906555175781, 0.04322052001953125, 0.04710197448730469, 0.050983428955078125, 0.05486488342285156, 0.058746337890625, 0.06262779235839844, 0.06650924682617188, 0.07039070129394531, 0.07427215576171875, 0.07815361022949219, 0.08203506469726562, 0.08591651916503906, 0.0897979736328125, 0.09367942810058594, 0.09756088256835938, 0.10144233703613281, 0.10532379150390625, 0.10920524597167969, 0.11308670043945312, 0.11696815490722656, 0.120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 7.0, 13.0, 13.0, 14.0, 24.0, 26.0, 24.0, 26.0, 34.0, 37.0, 38.0, 36.0, 40.0, 38.0, 38.0, 43.0, 45.0, 45.0, 44.0, 35.0, 34.0, 41.0, 37.0, 28.0, 26.0, 24.0, 21.0, 21.0, 21.0, 16.0, 14.0, 7.0, 11.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0611572265625, -0.05928516387939453, -0.05741310119628906, -0.055541038513183594, -0.053668975830078125, -0.051796913146972656, -0.04992485046386719, -0.04805278778076172, -0.04618072509765625, -0.04430866241455078, -0.04243659973144531, -0.040564537048339844, -0.038692474365234375, -0.036820411682128906, -0.03494834899902344, -0.03307628631591797, -0.0312042236328125, -0.02933216094970703, -0.027460098266601562, -0.025588035583496094, -0.023715972900390625, -0.021843910217285156, -0.019971847534179688, -0.01809978485107422, -0.01622772216796875, -0.014355659484863281, -0.012483596801757812, -0.010611534118652344, -0.008739471435546875, -0.006867408752441406, -0.0049953460693359375, -0.0031232833862304688, -0.001251220703125, 0.0006208419799804688, 0.0024929046630859375, 0.004364967346191406, 0.006237030029296875, 0.008109092712402344, 0.009981155395507812, 0.011853218078613281, 0.01372528076171875, 0.015597343444824219, 0.017469406127929688, 0.019341468811035156, 0.021213531494140625, 0.023085594177246094, 0.024957656860351562, 0.02682971954345703, 0.0287017822265625, 0.03057384490966797, 0.03244590759277344, 0.034317970275878906, 0.036190032958984375, 0.038062095642089844, 0.03993415832519531, 0.04180622100830078, 0.04367828369140625, 0.04555034637451172, 0.04742240905761719, 0.049294471740722656, 0.051166534423828125, 0.053038597106933594, 0.05491065979003906, 0.05678272247314453, 0.05865478515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 9.0, 11.0, 18.0, 14.0, 26.0, 41.0, 48.0, 81.0, 146.0, 201.0, 317.0, 498.0, 839.0, 1413.0, 2582.0, 4923.0, 10884.0, 28084.0, 90444.0, 325958.0, 397777.0, 122222.0, 35966.0, 13087.0, 5812.0, 2910.0, 1657.0, 958.0, 581.0, 346.0, 233.0, 161.0, 89.0, 56.0, 54.0, 31.0, 20.0, 18.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06120014190673828, -0.05916786193847656, -0.057135581970214844, -0.055103302001953125, -0.053071022033691406, -0.05103874206542969, -0.04900646209716797, -0.04697418212890625, -0.04494190216064453, -0.04290962219238281, -0.040877342224121094, -0.038845062255859375, -0.036812782287597656, -0.03478050231933594, -0.03274822235107422, -0.0307159423828125, -0.02868366241455078, -0.026651382446289062, -0.024619102478027344, -0.022586822509765625, -0.020554542541503906, -0.018522262573242188, -0.01648998260498047, -0.01445770263671875, -0.012425422668457031, -0.010393142700195312, -0.008360862731933594, -0.006328582763671875, -0.004296302795410156, -0.0022640228271484375, -0.00023174285888671875, 0.001800537109375, 0.0038328170776367188, 0.0058650970458984375, 0.007897377014160156, 0.009929656982421875, 0.011961936950683594, 0.013994216918945312, 0.01602649688720703, 0.01805877685546875, 0.02009105682373047, 0.022123336791992188, 0.024155616760253906, 0.026187896728515625, 0.028220176696777344, 0.030252456665039062, 0.03228473663330078, 0.0343170166015625, 0.03634929656982422, 0.03838157653808594, 0.040413856506347656, 0.042446136474609375, 0.044478416442871094, 0.04651069641113281, 0.04854297637939453, 0.05057525634765625, 0.05260753631591797, 0.05463981628417969, 0.056672096252441406, 0.058704376220703125, 0.060736656188964844, 0.06276893615722656, 0.06480121612548828, 0.06683349609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 12.0, 9.0, 19.0, 14.0, 12.0, 35.0, 39.0, 51.0, 62.0, 52.0, 71.0, 83.0, 86.0, 68.0, 59.0, 63.0, 51.0, 39.0, 34.0, 27.0, 22.0, 13.0, 17.0, 16.0, 7.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.03795051574707e-05, -5.8525241911411285e-05, -5.667097866535187e-05, -5.481671541929245e-05, -5.296245217323303e-05, -5.1108188927173615e-05, -4.92539256811142e-05, -4.739966243505478e-05, -4.554539918899536e-05, -4.3691135942935944e-05, -4.1836872696876526e-05, -3.998260945081711e-05, -3.812834620475769e-05, -3.627408295869827e-05, -3.4419819712638855e-05, -3.256555646657944e-05, -3.071129322052002e-05, -2.8857029974460602e-05, -2.7002766728401184e-05, -2.5148503482341766e-05, -2.329424023628235e-05, -2.143997699022293e-05, -1.9585713744163513e-05, -1.7731450498104095e-05, -1.5877187252044678e-05, -1.402292400598526e-05, -1.2168660759925842e-05, -1.0314397513866425e-05, -8.460134267807007e-06, -6.605871021747589e-06, -4.751607775688171e-06, -2.8973445296287537e-06, -1.043081283569336e-06, 8.111819624900818e-07, 2.6654452085494995e-06, 4.519708454608917e-06, 6.373971700668335e-06, 8.228234946727753e-06, 1.008249819278717e-05, 1.1936761438846588e-05, 1.3791024684906006e-05, 1.5645287930965424e-05, 1.749955117702484e-05, 1.935381442308426e-05, 2.1208077669143677e-05, 2.3062340915203094e-05, 2.4916604161262512e-05, 2.677086740732193e-05, 2.8625130653381348e-05, 3.0479393899440765e-05, 3.233365714550018e-05, 3.41879203915596e-05, 3.604218363761902e-05, 3.7896446883678436e-05, 3.9750710129737854e-05, 4.160497337579727e-05, 4.345923662185669e-05, 4.531349986791611e-05, 4.7167763113975525e-05, 4.902202636003494e-05, 5.087628960609436e-05, 5.273055285215378e-05, 5.4584816098213196e-05, 5.6439079344272614e-05, 5.829334259033203e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 13.0, 5.0, 15.0, 13.0, 25.0, 42.0, 49.0, 78.0, 152.0, 255.0, 488.0, 968.0, 2151.0, 6628.0, 27793.0, 181395.0, 643250.0, 151123.0, 24288.0, 5870.0, 2082.0, 838.0, 434.0, 246.0, 142.0, 74.0, 43.0, 38.0, 19.0, 3.0, 9.0, 10.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10397720336914062, -0.10095977783203125, -0.09794235229492188, -0.0949249267578125, -0.09190750122070312, -0.08889007568359375, -0.08587265014648438, -0.082855224609375, -0.07983779907226562, -0.07682037353515625, -0.07380294799804688, -0.0707855224609375, -0.06776809692382812, -0.06475067138671875, -0.061733245849609375, -0.0587158203125, -0.055698394775390625, -0.05268096923828125, -0.049663543701171875, -0.0466461181640625, -0.043628692626953125, -0.04061126708984375, -0.037593841552734375, -0.034576416015625, -0.031558990478515625, -0.02854156494140625, -0.025524139404296875, -0.0225067138671875, -0.019489288330078125, -0.01647186279296875, -0.013454437255859375, -0.01043701171875, -0.007419586181640625, -0.00440216064453125, -0.001384735107421875, 0.0016326904296875, 0.004650115966796875, 0.00766754150390625, 0.010684967041015625, 0.013702392578125, 0.016719818115234375, 0.01973724365234375, 0.022754669189453125, 0.0257720947265625, 0.028789520263671875, 0.03180694580078125, 0.034824371337890625, 0.037841796875, 0.040859222412109375, 0.04387664794921875, 0.046894073486328125, 0.0499114990234375, 0.052928924560546875, 0.05594635009765625, 0.058963775634765625, 0.061981201171875, 0.06499862670898438, 0.06801605224609375, 0.07103347778320312, 0.0740509033203125, 0.07706832885742188, 0.08008575439453125, 0.08310317993164062, 0.08612060546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 8.0, 12.0, 19.0, 21.0, 29.0, 33.0, 34.0, 47.0, 54.0, 66.0, 69.0, 56.0, 83.0, 57.0, 65.0, 57.0, 39.0, 43.0, 41.0, 28.0, 28.0, 26.0, 16.0, 11.0, 6.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.046600341796875, -0.045503854751586914, -0.04440736770629883, -0.04331088066101074, -0.042214393615722656, -0.04111790657043457, -0.040021419525146484, -0.0389249324798584, -0.03782844543457031, -0.03673195838928223, -0.03563547134399414, -0.034538984298706055, -0.03344249725341797, -0.03234601020812988, -0.031249523162841797, -0.03015303611755371, -0.029056549072265625, -0.02796006202697754, -0.026863574981689453, -0.025767087936401367, -0.02467060089111328, -0.023574113845825195, -0.02247762680053711, -0.021381139755249023, -0.020284652709960938, -0.01918816566467285, -0.018091678619384766, -0.01699519157409668, -0.015898704528808594, -0.014802217483520508, -0.013705730438232422, -0.012609243392944336, -0.01151275634765625, -0.010416269302368164, -0.009319782257080078, -0.008223295211791992, -0.007126808166503906, -0.00603032112121582, -0.004933834075927734, -0.0038373470306396484, -0.0027408599853515625, -0.0016443729400634766, -0.0005478858947753906, 0.0005486011505126953, 0.0016450881958007812, 0.002741575241088867, 0.003838062286376953, 0.004934549331665039, 0.006031036376953125, 0.007127523422241211, 0.008224010467529297, 0.009320497512817383, 0.010416984558105469, 0.011513471603393555, 0.01260995864868164, 0.013706445693969727, 0.014802932739257812, 0.0158994197845459, 0.016995906829833984, 0.01809239387512207, 0.019188880920410156, 0.020285367965698242, 0.021381855010986328, 0.022478342056274414, 0.0235748291015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 44.0, 156.0, 360.0, 304.0, 98.0, 21.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.775293231010437, -0.715581476688385, -0.655869722366333, -0.5961580276489258, -0.5364462733268738, -0.4767345190048218, -0.41702279448509216, -0.35731106996536255, -0.29759931564331055, -0.23788757622241974, -0.17817583680152893, -0.11846409738063812, -0.058752357959747314, 0.0009593963623046875, 0.0606711208820343, 0.12038284540176392, 0.18009459972381592, 0.23980633914470673, 0.29951807856559753, 0.35922980308532715, 0.41894155740737915, 0.47865331172943115, 0.5383650064468384, 0.5980767607688904, 0.6577885150909424, 0.7175002694129944, 0.7772120237350464, 0.8369237184524536, 0.8966354727745056, 0.9563472270965576, 1.0160589218139648, 1.075770616531372, 1.1354823112487793, 1.1951940059661865, 1.2549058198928833, 1.3146175146102905, 1.3743293285369873, 1.4340410232543945, 1.4937527179718018, 1.553464412689209, 1.6131762266159058, 1.672887921333313, 1.7325997352600098, 1.792311429977417, 1.8520231246948242, 1.911734938621521, 1.9714466333389282, 2.031158447265625, 2.0908701419830322, 2.1505818367004395, 2.2102935314178467, 2.270005464553833, 2.3297171592712402, 2.3894288539886475, 2.4491405487060547, 2.508852243423462, 2.568563938140869, 2.6282756328582764, 2.6879873275756836, 2.74769926071167, 2.807410955429077, 2.8671226501464844, 2.9268343448638916, 2.986546039581299, 3.046257972717285]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 8.0, 12.0, 24.0, 15.0, 22.0, 23.0, 23.0, 31.0, 34.0, 39.0, 36.0, 38.0, 40.0, 65.0, 59.0, 65.0, 48.0, 56.0, 62.0, 42.0, 38.0, 34.0, 33.0, 32.0, 17.0, 14.0, 17.0, 12.0, 10.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5495665073394775, -0.5306557416915894, -0.5117449760437012, -0.4928342401981354, -0.4739234745502472, -0.455012708902359, -0.4361019730567932, -0.41719120740890503, -0.39828044176101685, -0.37936967611312866, -0.3604589104652405, -0.3415481746196747, -0.3226374089717865, -0.3037266433238983, -0.2848159074783325, -0.26590514183044434, -0.24699437618255615, -0.22808361053466797, -0.20917285978794098, -0.190262109041214, -0.1713513433933258, -0.15244057774543762, -0.13352982699871063, -0.11461907625198364, -0.09570831060409546, -0.07679755240678787, -0.057886794209480286, -0.0389760360121727, -0.020065277814865112, -0.0011545196175575256, 0.01775623857975006, 0.03666698932647705, 0.055577754974365234, 0.07448851317167282, 0.09339927136898041, 0.112310029566288, 0.13122078776359558, 0.15013155341148376, 0.16904230415821075, 0.18795305490493774, 0.20686382055282593, 0.2257745862007141, 0.2446853369474411, 0.2635960876941681, 0.2825068533420563, 0.30141761898994446, 0.32032835483551025, 0.33923912048339844, 0.3581498861312866, 0.3770606517791748, 0.395971417427063, 0.4148821532726288, 0.43379291892051697, 0.45270368456840515, 0.47161442041397095, 0.49052518606185913, 0.5094359517097473, 0.5283467173576355, 0.5472574830055237, 0.5661682486534119, 0.5850789546966553, 0.6039897203445435, 0.6229004859924316, 0.6418112516403198, 0.660722017288208]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 17.0, 30.0, 41.0, 87.0, 160.0, 330.0, 902.0, 3219.0, 24182.0, 4015332.0, 139540.0, 7654.0, 1659.0, 580.0, 226.0, 117.0, 76.0, 39.0, 21.0, 18.0, 3.0, 9.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4582366943359375, -0.443328857421875, -0.4284210205078125, -0.41351318359375, -0.3986053466796875, -0.383697509765625, -0.3687896728515625, -0.3538818359375, -0.3389739990234375, -0.324066162109375, -0.3091583251953125, -0.29425048828125, -0.2793426513671875, -0.264434814453125, -0.2495269775390625, -0.234619140625, -0.2197113037109375, -0.204803466796875, -0.1898956298828125, -0.17498779296875, -0.1600799560546875, -0.145172119140625, -0.1302642822265625, -0.1153564453125, -0.1004486083984375, -0.085540771484375, -0.0706329345703125, -0.05572509765625, -0.0408172607421875, -0.025909423828125, -0.0110015869140625, 0.00390625, 0.0188140869140625, 0.033721923828125, 0.0486297607421875, 0.06353759765625, 0.0784454345703125, 0.093353271484375, 0.1082611083984375, 0.1231689453125, 0.1380767822265625, 0.152984619140625, 0.1678924560546875, 0.18280029296875, 0.1977081298828125, 0.212615966796875, 0.2275238037109375, 0.242431640625, 0.2573394775390625, 0.272247314453125, 0.2871551513671875, 0.30206298828125, 0.3169708251953125, 0.331878662109375, 0.3467864990234375, 0.3616943359375, 0.3766021728515625, 0.391510009765625, 0.4064178466796875, 0.42132568359375, 0.4362335205078125, 0.451141357421875, 0.4660491943359375, 0.48095703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 20.0, 31.0, 29.0, 45.0, 75.0, 127.0, 129.0, 122.0, 120.0, 72.0, 69.0, 38.0, 29.0, 27.0, 14.0, 7.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.024997949600219727, -0.024178028106689453, -0.02335810661315918, -0.022538185119628906, -0.021718263626098633, -0.02089834213256836, -0.020078420639038086, -0.019258499145507812, -0.01843857765197754, -0.017618656158447266, -0.016798734664916992, -0.01597881317138672, -0.015158891677856445, -0.014338970184326172, -0.013519048690795898, -0.012699127197265625, -0.011879205703735352, -0.011059284210205078, -0.010239362716674805, -0.009419441223144531, -0.008599519729614258, -0.007779598236083984, -0.006959676742553711, -0.0061397552490234375, -0.005319833755493164, -0.004499912261962891, -0.003679990768432617, -0.0028600692749023438, -0.0020401477813720703, -0.0012202262878417969, -0.00040030479431152344, 0.00041961669921875, 0.0012395381927490234, 0.002059459686279297, 0.0028793811798095703, 0.0036993026733398438, 0.004519224166870117, 0.005339145660400391, 0.006159067153930664, 0.0069789886474609375, 0.007798910140991211, 0.008618831634521484, 0.009438753128051758, 0.010258674621582031, 0.011078596115112305, 0.011898517608642578, 0.012718439102172852, 0.013538360595703125, 0.014358282089233398, 0.015178203582763672, 0.015998125076293945, 0.01681804656982422, 0.017637968063354492, 0.018457889556884766, 0.01927781105041504, 0.020097732543945312, 0.020917654037475586, 0.02173757553100586, 0.022557497024536133, 0.023377418518066406, 0.02419734001159668, 0.025017261505126953, 0.025837182998657227, 0.0266571044921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 22.0, 15.0, 32.0, 53.0, 73.0, 114.0, 213.0, 340.0, 582.0, 1201.0, 2616.0, 7066.0, 25439.0, 160390.0, 3504243.0, 429401.0, 44930.0, 10640.0, 3595.0, 1494.0, 745.0, 405.0, 230.0, 129.0, 99.0, 46.0, 47.0, 28.0, 18.0, 12.0, 5.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1662731170654297, -0.16067123413085938, -0.15506935119628906, -0.14946746826171875, -0.14386558532714844, -0.13826370239257812, -0.1326618194580078, -0.1270599365234375, -0.12145805358886719, -0.11585617065429688, -0.11025428771972656, -0.10465240478515625, -0.09905052185058594, -0.09344863891601562, -0.08784675598144531, -0.082244873046875, -0.07664299011230469, -0.07104110717773438, -0.06543922424316406, -0.05983734130859375, -0.05423545837402344, -0.048633575439453125, -0.04303169250488281, -0.0374298095703125, -0.03182792663574219, -0.026226043701171875, -0.020624160766601562, -0.01502227783203125, -0.009420394897460938, -0.003818511962890625, 0.0017833709716796875, 0.00738525390625, 0.012987136840820312, 0.018589019775390625, 0.024190902709960938, 0.02979278564453125, 0.03539466857910156, 0.040996551513671875, 0.04659843444824219, 0.0522003173828125, 0.05780220031738281, 0.06340408325195312, 0.06900596618652344, 0.07460784912109375, 0.08020973205566406, 0.08581161499023438, 0.09141349792480469, 0.097015380859375, 0.10261726379394531, 0.10821914672851562, 0.11382102966308594, 0.11942291259765625, 0.12502479553222656, 0.13062667846679688, 0.1362285614013672, 0.1418304443359375, 0.1474323272705078, 0.15303421020507812, 0.15863609313964844, 0.16423797607421875, 0.16983985900878906, 0.17544174194335938, 0.1810436248779297, 0.1866455078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 10.0, 21.0, 20.0, 29.0, 49.0, 83.0, 141.0, 269.0, 627.0, 1798.0, 429.0, 239.0, 123.0, 55.0, 41.0, 35.0, 13.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03126859664916992, -0.030035972595214844, -0.028803348541259766, -0.027570724487304688, -0.02633810043334961, -0.02510547637939453, -0.023872852325439453, -0.022640228271484375, -0.021407604217529297, -0.02017498016357422, -0.01894235610961914, -0.017709732055664062, -0.016477108001708984, -0.015244483947753906, -0.014011859893798828, -0.01277923583984375, -0.011546611785888672, -0.010313987731933594, -0.009081363677978516, -0.007848739624023438, -0.006616115570068359, -0.005383491516113281, -0.004150867462158203, -0.002918243408203125, -0.0016856193542480469, -0.00045299530029296875, 0.0007796287536621094, 0.0020122528076171875, 0.0032448768615722656, 0.004477500915527344, 0.005710124969482422, 0.0069427490234375, 0.008175373077392578, 0.009407997131347656, 0.010640621185302734, 0.011873245239257812, 0.01310586929321289, 0.014338493347167969, 0.015571117401123047, 0.016803741455078125, 0.018036365509033203, 0.01926898956298828, 0.02050161361694336, 0.021734237670898438, 0.022966861724853516, 0.024199485778808594, 0.025432109832763672, 0.02666473388671875, 0.027897357940673828, 0.029129981994628906, 0.030362606048583984, 0.03159523010253906, 0.03282785415649414, 0.03406047821044922, 0.0352931022644043, 0.036525726318359375, 0.03775835037231445, 0.03899097442626953, 0.04022359848022461, 0.04145622253417969, 0.042688846588134766, 0.043921470642089844, 0.04515409469604492, 0.04638671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 14.0, 22.0, 46.0, 70.0, 121.0, 140.0, 146.0, 134.0, 117.0, 73.0, 46.0, 18.0, 12.0, 12.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2676220238208771, -0.2612111270427704, -0.2548002600669861, -0.2483893632888794, -0.2419784665107727, -0.2355675846338272, -0.2291567027568817, -0.22274580597877502, -0.21633490920066833, -0.20992402732372284, -0.20351313054561615, -0.19710224866867065, -0.19069135189056396, -0.18428047001361847, -0.17786958813667297, -0.17145869135856628, -0.1650478094816208, -0.1586369276046753, -0.1522260308265686, -0.1458151489496231, -0.13940425217151642, -0.13299337029457092, -0.12658247351646423, -0.12017159163951874, -0.11376070231199265, -0.10734981298446655, -0.10093892365694046, -0.09452803432941437, -0.08811715245246887, -0.08170625567436218, -0.07529537379741669, -0.0688844844698906, -0.062473610043525696, -0.0560627207159996, -0.04965183138847351, -0.04324094578623772, -0.036830056458711624, -0.03041916713118553, -0.024008281528949738, -0.017597392201423645, -0.011186502873897552, -0.004775614477694035, 0.0016352739185094833, 0.008046161383390427, 0.01445705071091652, 0.02086794003844261, 0.027278825640678406, 0.0336897149682045, 0.04010060429573059, 0.04651149362325668, 0.052922382950782776, 0.05933326855301857, 0.06574416160583496, 0.07215504348278046, 0.07856593281030655, 0.08497682213783264, 0.09138771146535873, 0.09779860079288483, 0.10420949012041092, 0.11062037944793701, 0.11703126132488251, 0.1234421581029892, 0.1298530399799347, 0.13626393675804138, 0.14267481863498688]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 15.0, 7.0, 11.0, 10.0, 7.0, 15.0, 15.0, 19.0, 14.0, 27.0, 34.0, 36.0, 37.0, 41.0, 41.0, 51.0, 52.0, 44.0, 48.0, 47.0, 44.0, 40.0, 33.0, 44.0, 24.0, 37.0, 38.0, 23.0, 19.0, 13.0, 26.0, 14.0, 20.0, 13.0, 13.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12018674612045288, -0.11640593409538269, -0.1126251146197319, -0.10884430259466171, -0.10506348311901093, -0.10128267109394073, -0.09750185906887054, -0.09372104704380035, -0.08994022756814957, -0.08615941554307938, -0.08237859606742859, -0.0785977840423584, -0.07481697201728821, -0.07103615254163742, -0.06725534051656723, -0.06347452104091644, -0.05969370901584625, -0.055912893265485764, -0.052132077515125275, -0.048351265490055084, -0.044570449739694595, -0.040789633989334106, -0.037008821964263916, -0.03322800621390343, -0.029447190463542938, -0.02566637471318245, -0.02188556082546711, -0.01810474693775177, -0.014323931187391281, -0.010543115437030792, -0.006762301549315453, -0.002981487661600113, 0.000799328088760376, 0.00458014290779829, 0.008360957726836205, 0.012141772545874119, 0.015922587364912033, 0.019703403115272522, 0.02348421700298786, 0.0272650308907032, 0.03104584664106369, 0.03482666239142418, 0.03860747814178467, 0.04238829016685486, 0.04616910591721535, 0.049949921667575836, 0.05373073369264603, 0.057511549443006516, 0.061292365193367004, 0.0650731772184372, 0.06885399669408798, 0.07263480871915817, 0.07641562819480896, 0.08019644021987915, 0.08397725224494934, 0.08775806427001953, 0.09153888374567032, 0.09531969577074051, 0.0991005152463913, 0.10288132727146149, 0.10666213929653168, 0.11044295877218246, 0.11422377079725266, 0.11800459027290344, 0.12178540229797363]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 11.0, 14.0, 24.0, 33.0, 38.0, 79.0, 95.0, 199.0, 320.0, 490.0, 926.0, 1610.0, 3394.0, 7932.0, 25434.0, 104829.0, 445859.0, 348406.0, 76432.0, 19620.0, 6541.0, 2841.0, 1419.0, 790.0, 441.0, 256.0, 179.0, 107.0, 81.0, 31.0, 34.0, 15.0, 13.0, 11.0, 9.0, 2.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1279296875, -0.12378883361816406, -0.11964797973632812, -0.11550712585449219, -0.11136627197265625, -0.10722541809082031, -0.10308456420898438, -0.09894371032714844, -0.0948028564453125, -0.09066200256347656, -0.08652114868164062, -0.08238029479980469, -0.07823944091796875, -0.07409858703613281, -0.06995773315429688, -0.06581687927246094, -0.061676025390625, -0.05753517150878906, -0.053394317626953125, -0.04925346374511719, -0.04511260986328125, -0.04097175598144531, -0.036830902099609375, -0.03269004821777344, -0.0285491943359375, -0.024408340454101562, -0.020267486572265625, -0.016126632690429688, -0.01198577880859375, -0.007844924926757812, -0.003704071044921875, 0.0004367828369140625, 0.00457763671875, 0.008718490600585938, 0.012859344482421875, 0.017000198364257812, 0.02114105224609375, 0.025281906127929688, 0.029422760009765625, 0.03356361389160156, 0.0377044677734375, 0.04184532165527344, 0.045986175537109375, 0.05012702941894531, 0.05426788330078125, 0.05840873718261719, 0.06254959106445312, 0.06669044494628906, 0.070831298828125, 0.07497215270996094, 0.07911300659179688, 0.08325386047363281, 0.08739471435546875, 0.09153556823730469, 0.09567642211914062, 0.09981727600097656, 0.1039581298828125, 0.10809898376464844, 0.11223983764648438, 0.11638069152832031, 0.12052154541015625, 0.12466239929199219, 0.12880325317382812, 0.13294410705566406, 0.1370849609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 14.0, 17.0, 23.0, 46.0, 62.0, 102.0, 112.0, 113.0, 102.0, 101.0, 80.0, 62.0, 44.0, 33.0, 25.0, 21.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260467529296875, -0.02523946762084961, -0.02443218231201172, -0.023624897003173828, -0.022817611694335938, -0.022010326385498047, -0.021203041076660156, -0.020395755767822266, -0.019588470458984375, -0.018781185150146484, -0.017973899841308594, -0.017166614532470703, -0.016359329223632812, -0.015552043914794922, -0.014744758605957031, -0.01393747329711914, -0.01313018798828125, -0.01232290267944336, -0.011515617370605469, -0.010708332061767578, -0.009901046752929688, -0.009093761444091797, -0.008286476135253906, -0.007479190826416016, -0.006671905517578125, -0.005864620208740234, -0.005057334899902344, -0.004250049591064453, -0.0034427642822265625, -0.002635478973388672, -0.0018281936645507812, -0.0010209083557128906, -0.000213623046875, 0.0005936622619628906, 0.0014009475708007812, 0.002208232879638672, 0.0030155181884765625, 0.003822803497314453, 0.004630088806152344, 0.005437374114990234, 0.006244659423828125, 0.007051944732666016, 0.007859230041503906, 0.008666515350341797, 0.009473800659179688, 0.010281085968017578, 0.011088371276855469, 0.01189565658569336, 0.01270294189453125, 0.01351022720336914, 0.014317512512207031, 0.015124797821044922, 0.015932083129882812, 0.016739368438720703, 0.017546653747558594, 0.018353939056396484, 0.019161224365234375, 0.019968509674072266, 0.020775794982910156, 0.021583080291748047, 0.022390365600585938, 0.023197650909423828, 0.02400493621826172, 0.02481222152709961, 0.0256195068359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 16.0, 23.0, 23.0, 21.0, 51.0, 60.0, 98.0, 124.0, 123.0, 177.0, 229.0, 367.0, 479.0, 816.0, 1438.0, 2919.0, 7003.0, 20810.0, 67895.0, 218052.0, 432687.0, 200212.0, 62715.0, 19135.0, 6450.0, 2742.0, 1302.0, 780.0, 450.0, 388.0, 268.0, 170.0, 138.0, 89.0, 73.0, 53.0, 37.0, 36.0, 28.0, 12.0, 14.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.09792137145996094, -0.09470748901367188, -0.09149360656738281, -0.08827972412109375, -0.08506584167480469, -0.08185195922851562, -0.07863807678222656, -0.0754241943359375, -0.07221031188964844, -0.06899642944335938, -0.06578254699707031, -0.06256866455078125, -0.05935478210449219, -0.056140899658203125, -0.05292701721191406, -0.049713134765625, -0.04649925231933594, -0.043285369873046875, -0.04007148742675781, -0.03685760498046875, -0.03364372253417969, -0.030429840087890625, -0.027215957641601562, -0.0240020751953125, -0.020788192749023438, -0.017574310302734375, -0.014360427856445312, -0.01114654541015625, -0.007932662963867188, -0.004718780517578125, -0.0015048980712890625, 0.001708984375, 0.0049228668212890625, 0.008136749267578125, 0.011350631713867188, 0.01456451416015625, 0.017778396606445312, 0.020992279052734375, 0.024206161499023438, 0.0274200439453125, 0.030633926391601562, 0.033847808837890625, 0.03706169128417969, 0.04027557373046875, 0.04348945617675781, 0.046703338623046875, 0.04991722106933594, 0.053131103515625, 0.05634498596191406, 0.059558868408203125, 0.06277275085449219, 0.06598663330078125, 0.06920051574707031, 0.07241439819335938, 0.07562828063964844, 0.0788421630859375, 0.08205604553222656, 0.08526992797851562, 0.08848381042480469, 0.09169769287109375, 0.09491157531738281, 0.09812545776367188, 0.10133934020996094, 0.10455322265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 18.0, 22.0, 25.0, 16.0, 30.0, 25.0, 28.0, 43.0, 37.0, 51.0, 40.0, 41.0, 53.0, 54.0, 50.0, 43.0, 52.0, 48.0, 32.0, 31.0, 43.0, 28.0, 28.0, 20.0, 18.0, 16.0, 16.0, 8.0, 12.0, 5.0, 5.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07817745208740234, -0.07548332214355469, -0.07278919219970703, -0.07009506225585938, -0.06740093231201172, -0.06470680236816406, -0.062012672424316406, -0.05931854248046875, -0.056624412536621094, -0.05393028259277344, -0.05123615264892578, -0.048542022705078125, -0.04584789276123047, -0.04315376281738281, -0.040459632873535156, -0.0377655029296875, -0.035071372985839844, -0.03237724304199219, -0.02968311309814453, -0.026988983154296875, -0.02429485321044922, -0.021600723266601562, -0.018906593322753906, -0.01621246337890625, -0.013518333435058594, -0.010824203491210938, -0.008130073547363281, -0.005435943603515625, -0.0027418136596679688, -4.76837158203125e-05, 0.0026464462280273438, 0.005340576171875, 0.008034706115722656, 0.010728836059570312, 0.013422966003417969, 0.016117095947265625, 0.01881122589111328, 0.021505355834960938, 0.024199485778808594, 0.02689361572265625, 0.029587745666503906, 0.03228187561035156, 0.03497600555419922, 0.037670135498046875, 0.04036426544189453, 0.04305839538574219, 0.045752525329589844, 0.0484466552734375, 0.051140785217285156, 0.05383491516113281, 0.05652904510498047, 0.059223175048828125, 0.06191730499267578, 0.06461143493652344, 0.0673055648803711, 0.06999969482421875, 0.0726938247680664, 0.07538795471191406, 0.07808208465576172, 0.08077621459960938, 0.08347034454345703, 0.08616447448730469, 0.08885860443115234, 0.091552734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 15.0, 12.0, 12.0, 23.0, 64.0, 43.0, 80.0, 120.0, 207.0, 312.0, 538.0, 877.0, 1467.0, 2516.0, 4450.0, 8202.0, 16136.0, 33305.0, 76734.0, 211720.0, 385615.0, 178420.0, 66548.0, 29460.0, 14317.0, 7544.0, 4135.0, 2280.0, 1275.0, 788.0, 454.0, 314.0, 179.0, 126.0, 76.0, 53.0, 53.0, 16.0, 10.0, 15.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049163818359375, -0.04743385314941406, -0.045703887939453125, -0.04397392272949219, -0.04224395751953125, -0.04051399230957031, -0.038784027099609375, -0.03705406188964844, -0.0353240966796875, -0.03359413146972656, -0.031864166259765625, -0.030134201049804688, -0.02840423583984375, -0.026674270629882812, -0.024944305419921875, -0.023214340209960938, -0.021484375, -0.019754409790039062, -0.018024444580078125, -0.016294479370117188, -0.01456451416015625, -0.012834548950195312, -0.011104583740234375, -0.009374618530273438, -0.0076446533203125, -0.0059146881103515625, -0.004184722900390625, -0.0024547576904296875, -0.00072479248046875, 0.0010051727294921875, 0.002735137939453125, 0.0044651031494140625, 0.006195068359375, 0.007925033569335938, 0.009654998779296875, 0.011384963989257812, 0.01311492919921875, 0.014844894409179688, 0.016574859619140625, 0.018304824829101562, 0.0200347900390625, 0.021764755249023438, 0.023494720458984375, 0.025224685668945312, 0.02695465087890625, 0.028684616088867188, 0.030414581298828125, 0.03214454650878906, 0.03387451171875, 0.03560447692871094, 0.037334442138671875, 0.03906440734863281, 0.04079437255859375, 0.04252433776855469, 0.044254302978515625, 0.04598426818847656, 0.0477142333984375, 0.04944419860839844, 0.051174163818359375, 0.05290412902832031, 0.05463409423828125, 0.05636405944824219, 0.058094024658203125, 0.05982398986816406, 0.061553955078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 15.0, 17.0, 26.0, 33.0, 37.0, 45.0, 44.0, 73.0, 92.0, 111.0, 72.0, 77.0, 76.0, 61.0, 33.0, 46.0, 29.0, 23.0, 12.0, 13.0, 15.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -3.96091490983963e-05, -3.803148865699768e-05, -3.645382821559906e-05, -3.487616777420044e-05, -3.329850733280182e-05, -3.17208468914032e-05, -3.0143186450004578e-05, -2.8565526008605957e-05, -2.6987865567207336e-05, -2.5410205125808716e-05, -2.3832544684410095e-05, -2.2254884243011475e-05, -2.0677223801612854e-05, -1.9099563360214233e-05, -1.7521902918815613e-05, -1.5944242477416992e-05, -1.4366582036018372e-05, -1.2788921594619751e-05, -1.121126115322113e-05, -9.63360071182251e-06, -8.05594027042389e-06, -6.4782798290252686e-06, -4.900619387626648e-06, -3.3229589462280273e-06, -1.7452985048294067e-06, -1.6763806343078613e-07, 1.4100223779678345e-06, 2.987682819366455e-06, 4.565343260765076e-06, 6.143003702163696e-06, 7.720664143562317e-06, 9.298324584960938e-06, 1.0875985026359558e-05, 1.2453645467758179e-05, 1.40313059091568e-05, 1.560896635055542e-05, 1.718662679195404e-05, 1.876428723335266e-05, 2.0341947674751282e-05, 2.1919608116149902e-05, 2.3497268557548523e-05, 2.5074928998947144e-05, 2.6652589440345764e-05, 2.8230249881744385e-05, 2.9807910323143005e-05, 3.1385570764541626e-05, 3.2963231205940247e-05, 3.454089164733887e-05, 3.611855208873749e-05, 3.769621253013611e-05, 3.927387297153473e-05, 4.085153341293335e-05, 4.242919385433197e-05, 4.400685429573059e-05, 4.558451473712921e-05, 4.716217517852783e-05, 4.873983561992645e-05, 5.031749606132507e-05, 5.1895156502723694e-05, 5.3472816944122314e-05, 5.5050477385520935e-05, 5.6628137826919556e-05, 5.8205798268318176e-05, 5.97834587097168e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 7.0, 11.0, 9.0, 15.0, 25.0, 30.0, 38.0, 70.0, 114.0, 148.0, 245.0, 428.0, 840.0, 1932.0, 5304.0, 20321.0, 105762.0, 669688.0, 198657.0, 32078.0, 7812.0, 2570.0, 1090.0, 523.0, 280.0, 162.0, 120.0, 69.0, 63.0, 32.0, 30.0, 20.0, 12.0, 10.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.137939453125, -0.13417625427246094, -0.13041305541992188, -0.1266498565673828, -0.12288665771484375, -0.11912345886230469, -0.11536026000976562, -0.11159706115722656, -0.1078338623046875, -0.10407066345214844, -0.10030746459960938, -0.09654426574707031, -0.09278106689453125, -0.08901786804199219, -0.08525466918945312, -0.08149147033691406, -0.077728271484375, -0.07396507263183594, -0.07020187377929688, -0.06643867492675781, -0.06267547607421875, -0.05891227722167969, -0.055149078369140625, -0.05138587951660156, -0.0476226806640625, -0.04385948181152344, -0.040096282958984375, -0.03633308410644531, -0.03256988525390625, -0.028806686401367188, -0.025043487548828125, -0.021280288696289062, -0.01751708984375, -0.013753890991210938, -0.009990692138671875, -0.0062274932861328125, -0.00246429443359375, 0.0012989044189453125, 0.005062103271484375, 0.008825302124023438, 0.0125885009765625, 0.016351699829101562, 0.020114898681640625, 0.023878097534179688, 0.02764129638671875, 0.03140449523925781, 0.035167694091796875, 0.03893089294433594, 0.042694091796875, 0.04645729064941406, 0.050220489501953125, 0.05398368835449219, 0.05774688720703125, 0.06151008605957031, 0.06527328491210938, 0.06903648376464844, 0.0727996826171875, 0.07656288146972656, 0.08032608032226562, 0.08408927917480469, 0.08785247802734375, 0.09161567687988281, 0.09537887573242188, 0.09914207458496094, 0.1029052734375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 2.0, 11.0, 7.0, 8.0, 14.0, 12.0, 11.0, 23.0, 24.0, 23.0, 29.0, 42.0, 54.0, 66.0, 73.0, 78.0, 78.0, 84.0, 57.0, 63.0, 54.0, 24.0, 31.0, 20.0, 18.0, 23.0, 10.0, 13.0, 10.0, 5.0, 3.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.051788330078125, -0.050187110900878906, -0.04858589172363281, -0.04698467254638672, -0.045383453369140625, -0.04378223419189453, -0.04218101501464844, -0.040579795837402344, -0.03897857666015625, -0.037377357482910156, -0.03577613830566406, -0.03417491912841797, -0.032573699951171875, -0.03097248077392578, -0.029371261596679688, -0.027770042419433594, -0.0261688232421875, -0.024567604064941406, -0.022966384887695312, -0.02136516571044922, -0.019763946533203125, -0.01816272735595703, -0.016561508178710938, -0.014960289001464844, -0.01335906982421875, -0.011757850646972656, -0.010156631469726562, -0.008555412292480469, -0.006954193115234375, -0.005352973937988281, -0.0037517547607421875, -0.0021505355834960938, -0.00054931640625, 0.0010519027709960938, 0.0026531219482421875, 0.004254341125488281, 0.005855560302734375, 0.007456779479980469, 0.009057998657226562, 0.010659217834472656, 0.01226043701171875, 0.013861656188964844, 0.015462875366210938, 0.01706409454345703, 0.018665313720703125, 0.02026653289794922, 0.021867752075195312, 0.023468971252441406, 0.0250701904296875, 0.026671409606933594, 0.028272628784179688, 0.02987384796142578, 0.031475067138671875, 0.03307628631591797, 0.03467750549316406, 0.036278724670410156, 0.03787994384765625, 0.039481163024902344, 0.04108238220214844, 0.04268360137939453, 0.044284820556640625, 0.04588603973388672, 0.04748725891113281, 0.049088478088378906, 0.050689697265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 22.0, 52.0, 123.0, 203.0, 250.0, 168.0, 98.0, 40.0, 18.0, 9.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1698739528656006, -1.1302838325500488, -1.090693712234497, -1.0511035919189453, -1.0115134716033936, -0.971923291683197, -0.9323331117630005, -0.8927429914474487, -0.853152871131897, -0.8135627508163452, -0.7739726305007935, -0.7343824505805969, -0.6947923302650452, -0.6552022099494934, -0.6156120300292969, -0.5760219097137451, -0.5364317893981934, -0.4968416690826416, -0.45725151896476746, -0.4176613688468933, -0.37807124853134155, -0.3384811282157898, -0.29889097809791565, -0.2593008279800415, -0.21971070766448975, -0.1801205724477768, -0.14053043723106384, -0.10094030201435089, -0.06135016679763794, -0.021760031580924988, 0.017830103635787964, 0.05742025375366211, 0.09701037406921387, 0.13660050928592682, 0.17619064450263977, 0.21578077971935272, 0.2553709149360657, 0.29496103525161743, 0.3345511853694916, 0.3741413354873657, 0.4137314558029175, 0.45332157611846924, 0.4929117262363434, 0.5325018763542175, 0.5720919966697693, 0.611682116985321, 0.6512722969055176, 0.6908624172210693, 0.7304525375366211, 0.7700426578521729, 0.8096327781677246, 0.8492229580879211, 0.8888130784034729, 0.9284031987190247, 0.9679933786392212, 1.007583498954773, 1.0471736192703247, 1.0867637395858765, 1.1263538599014282, 1.16594398021698, 1.2055342197418213, 1.245124340057373, 1.2847144603729248, 1.3243045806884766, 1.3638947010040283]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 12.0, 21.0, 14.0, 15.0, 13.0, 15.0, 12.0, 21.0, 23.0, 28.0, 22.0, 36.0, 28.0, 30.0, 43.0, 44.0, 40.0, 33.0, 33.0, 40.0, 41.0, 46.0, 34.0, 50.0, 26.0, 27.0, 31.0, 33.0, 23.0, 19.0, 21.0, 16.0, 14.0, 10.0, 10.0, 10.0, 9.0, 8.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.49877625703811646, -0.48435696959495544, -0.46993765234947205, -0.45551836490631104, -0.44109907746315, -0.426679790019989, -0.4122604727745056, -0.3978411853313446, -0.3834218978881836, -0.3690026104450226, -0.3545832931995392, -0.3401640057563782, -0.32574471831321716, -0.31132543087005615, -0.29690611362457275, -0.28248682618141174, -0.26806750893592834, -0.25364822149276733, -0.23922891914844513, -0.22480961680412292, -0.21039032936096191, -0.1959710270166397, -0.1815517246723175, -0.1671324372291565, -0.1527131348848343, -0.13829383254051208, -0.12387454509735107, -0.10945524275302887, -0.09503594785928726, -0.08061665296554565, -0.06619735062122345, -0.05177805572748184, -0.037358760833740234, -0.022939464077353477, -0.00852016732096672, 0.0058991312980651855, 0.020318426191806793, 0.0347377210855484, 0.049157023429870605, 0.06357631832361221, 0.07799561321735382, 0.09241490811109543, 0.10683420300483704, 0.12125350534915924, 0.13567280769348145, 0.15009209513664246, 0.16451139748096466, 0.17893069982528687, 0.19334998726844788, 0.20776928961277008, 0.2221885770559311, 0.2366078794002533, 0.2510271668434143, 0.2654464840888977, 0.2798657715320587, 0.2942850589752197, 0.3087043762207031, 0.32312366366386414, 0.33754298090934753, 0.35196226835250854, 0.36638155579566956, 0.38080084323883057, 0.39522016048431396, 0.409639447927475, 0.424058735370636]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 13.0, 11.0, 21.0, 38.0, 43.0, 101.0, 127.0, 197.0, 431.0, 750.0, 1434.0, 3176.0, 8837.0, 35862.0, 374283.0, 3648371.0, 93867.0, 17015.0, 5278.0, 2095.0, 979.0, 532.0, 299.0, 157.0, 109.0, 72.0, 56.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16650390625, -0.1608104705810547, -0.15511703491210938, -0.14942359924316406, -0.14373016357421875, -0.13803672790527344, -0.13234329223632812, -0.1266498565673828, -0.1209564208984375, -0.11526298522949219, -0.10956954956054688, -0.10387611389160156, -0.09818267822265625, -0.09248924255371094, -0.08679580688476562, -0.08110237121582031, -0.075408935546875, -0.06971549987792969, -0.06402206420898438, -0.05832862854003906, -0.05263519287109375, -0.04694175720214844, -0.041248321533203125, -0.03555488586425781, -0.0298614501953125, -0.024168014526367188, -0.018474578857421875, -0.012781143188476562, -0.00708770751953125, -0.0013942718505859375, 0.004299163818359375, 0.009992599487304688, 0.01568603515625, 0.021379470825195312, 0.027072906494140625, 0.03276634216308594, 0.03845977783203125, 0.04415321350097656, 0.049846649169921875, 0.05554008483886719, 0.0612335205078125, 0.06692695617675781, 0.07262039184570312, 0.07831382751464844, 0.08400726318359375, 0.08970069885253906, 0.09539413452148438, 0.10108757019042969, 0.106781005859375, 0.11247444152832031, 0.11816787719726562, 0.12386131286621094, 0.12955474853515625, 0.13524818420410156, 0.14094161987304688, 0.1466350555419922, 0.1523284912109375, 0.1580219268798828, 0.16371536254882812, 0.16940879821777344, 0.17510223388671875, 0.18079566955566406, 0.18648910522460938, 0.1921825408935547, 0.1978759765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 19.0, 24.0, 31.0, 39.0, 54.0, 74.0, 75.0, 83.0, 98.0, 96.0, 86.0, 62.0, 55.0, 42.0, 36.0, 31.0, 31.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028154850006103516, -0.02731800079345703, -0.026481151580810547, -0.025644302368164062, -0.024807453155517578, -0.023970603942871094, -0.02313375473022461, -0.022296905517578125, -0.02146005630493164, -0.020623207092285156, -0.019786357879638672, -0.018949508666992188, -0.018112659454345703, -0.01727581024169922, -0.016438961029052734, -0.01560211181640625, -0.014765262603759766, -0.013928413391113281, -0.013091564178466797, -0.012254714965820312, -0.011417865753173828, -0.010581016540527344, -0.00974416732788086, -0.008907318115234375, -0.00807046890258789, -0.007233619689941406, -0.006396770477294922, -0.0055599212646484375, -0.004723072052001953, -0.0038862228393554688, -0.0030493736267089844, -0.0022125244140625, -0.0013756752014160156, -0.0005388259887695312, 0.0002980232238769531, 0.0011348724365234375, 0.001971721649169922, 0.0028085708618164062, 0.0036454200744628906, 0.004482269287109375, 0.005319118499755859, 0.006155967712402344, 0.006992816925048828, 0.007829666137695312, 0.008666515350341797, 0.009503364562988281, 0.010340213775634766, 0.01117706298828125, 0.012013912200927734, 0.012850761413574219, 0.013687610626220703, 0.014524459838867188, 0.015361309051513672, 0.016198158264160156, 0.01703500747680664, 0.017871856689453125, 0.01870870590209961, 0.019545555114746094, 0.020382404327392578, 0.021219253540039062, 0.022056102752685547, 0.02289295196533203, 0.023729801177978516, 0.024566650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 0.0, 4.0, 7.0, 7.0, 2.0, 9.0, 15.0, 16.0, 19.0, 32.0, 59.0, 50.0, 111.0, 177.0, 302.0, 518.0, 834.0, 1729.0, 3797.0, 12447.0, 72911.0, 2629886.0, 1389578.0, 63571.0, 11353.0, 3541.0, 1476.0, 753.0, 380.0, 249.0, 163.0, 103.0, 61.0, 41.0, 26.0, 13.0, 10.0, 13.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17353057861328125, -0.1677398681640625, -0.16194915771484375, -0.156158447265625, -0.15036773681640625, -0.1445770263671875, -0.13878631591796875, -0.13299560546875, -0.12720489501953125, -0.1214141845703125, -0.11562347412109375, -0.109832763671875, -0.10404205322265625, -0.0982513427734375, -0.09246063232421875, -0.086669921875, -0.08087921142578125, -0.0750885009765625, -0.06929779052734375, -0.063507080078125, -0.05771636962890625, -0.0519256591796875, -0.04613494873046875, -0.04034423828125, -0.03455352783203125, -0.0287628173828125, -0.02297210693359375, -0.017181396484375, -0.01139068603515625, -0.0055999755859375, 0.00019073486328125, 0.0059814453125, 0.01177215576171875, 0.0175628662109375, 0.02335357666015625, 0.029144287109375, 0.03493499755859375, 0.0407257080078125, 0.04651641845703125, 0.05230712890625, 0.05809783935546875, 0.0638885498046875, 0.06967926025390625, 0.075469970703125, 0.08126068115234375, 0.0870513916015625, 0.09284210205078125, 0.0986328125, 0.10442352294921875, 0.1102142333984375, 0.11600494384765625, 0.121795654296875, 0.12758636474609375, 0.1333770751953125, 0.13916778564453125, 0.14495849609375, 0.15074920654296875, 0.1565399169921875, 0.16233062744140625, 0.168121337890625, 0.17391204833984375, 0.1797027587890625, 0.18549346923828125, 0.1912841796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 43.0, 74.0, 173.0, 453.0, 2218.0, 625.0, 207.0, 93.0, 57.0, 21.0, 28.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.078125, -0.07615423202514648, -0.07418346405029297, -0.07221269607543945, -0.07024192810058594, -0.06827116012573242, -0.0663003921508789, -0.06432962417602539, -0.062358856201171875, -0.06038808822631836, -0.058417320251464844, -0.05644655227661133, -0.05447578430175781, -0.0525050163269043, -0.05053424835205078, -0.048563480377197266, -0.04659271240234375, -0.044621944427490234, -0.04265117645263672, -0.0406804084777832, -0.03870964050292969, -0.03673887252807617, -0.034768104553222656, -0.03279733657836914, -0.030826568603515625, -0.02885580062866211, -0.026885032653808594, -0.024914264678955078, -0.022943496704101562, -0.020972728729248047, -0.01900196075439453, -0.017031192779541016, -0.0150604248046875, -0.013089656829833984, -0.011118888854980469, -0.009148120880126953, -0.0071773529052734375, -0.005206584930419922, -0.0032358169555664062, -0.0012650489807128906, 0.000705718994140625, 0.0026764869689941406, 0.004647254943847656, 0.006618022918701172, 0.008588790893554688, 0.010559558868408203, 0.012530326843261719, 0.014501094818115234, 0.01647186279296875, 0.018442630767822266, 0.02041339874267578, 0.022384166717529297, 0.024354934692382812, 0.026325702667236328, 0.028296470642089844, 0.03026723861694336, 0.032238006591796875, 0.03420877456665039, 0.036179542541503906, 0.03815031051635742, 0.04012107849121094, 0.04209184646606445, 0.04406261444091797, 0.046033382415771484, 0.048004150390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 4.0, 12.0, 6.0, 16.0, 26.0, 43.0, 59.0, 93.0, 128.0, 134.0, 123.0, 94.0, 88.0, 73.0, 39.0, 29.0, 10.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1828184276819229, -0.17528069019317627, -0.16774295270442963, -0.16020521521568298, -0.15266746282577515, -0.1451297402381897, -0.13759198784828186, -0.13005425035953522, -0.12251651287078857, -0.11497877538204193, -0.10744103789329529, -0.09990329295396805, -0.0923655554652214, -0.08482781797647476, -0.07729007303714752, -0.06975233554840088, -0.062214598059654236, -0.05467686057090759, -0.04713911935687065, -0.03960137814283371, -0.03206364065408707, -0.024525903165340424, -0.016988161951303482, -0.00945042073726654, -0.0019126832485198975, 0.005625056102871895, 0.013162795454263687, 0.02070053480565548, 0.02823827415704727, 0.035776011645793915, 0.043313752859830856, 0.0508514940738678, 0.058389246463775635, 0.06592698395252228, 0.07346472144126892, 0.08100246638059616, 0.0885402038693428, 0.09607794135808945, 0.10361568629741669, 0.11115342378616333, 0.11869116127490997, 0.12622889876365662, 0.13376663625240326, 0.1413043737411499, 0.14884212613105774, 0.1563798487186432, 0.16391760110855103, 0.17145533859729767, 0.1789930760860443, 0.18653081357479095, 0.1940685510635376, 0.20160628855228424, 0.20914402604103088, 0.21668177843093872, 0.22421951591968536, 0.231757253408432, 0.23929499089717865, 0.2468327283859253, 0.25437048077583313, 0.2619082033634186, 0.2694459557533264, 0.27698367834091187, 0.2845214307308197, 0.29205918312072754, 0.299596905708313]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 2.0, 5.0, 11.0, 15.0, 17.0, 10.0, 20.0, 24.0, 23.0, 21.0, 23.0, 31.0, 30.0, 33.0, 36.0, 39.0, 29.0, 33.0, 43.0, 38.0, 34.0, 44.0, 34.0, 32.0, 30.0, 27.0, 25.0, 26.0, 19.0, 28.0, 21.0, 29.0, 24.0, 21.0, 26.0, 14.0, 9.0, 13.0, 9.0, 5.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1259007453918457, -0.12195496261119843, -0.11800917983055115, -0.11406338959932327, -0.110117606818676, -0.10617182403802872, -0.10222603380680084, -0.09828025102615356, -0.09433446824550629, -0.09038868546485901, -0.08644290268421173, -0.08249711245298386, -0.07855132967233658, -0.0746055468916893, -0.07065975666046143, -0.06671397387981415, -0.06276819109916687, -0.05882240831851959, -0.054876621812582016, -0.05093083530664444, -0.04698505252599716, -0.043039269745349884, -0.03909348323941231, -0.03514769673347473, -0.031201913952827454, -0.027256129309535027, -0.0233103446662426, -0.019364560022950172, -0.015418775379657745, -0.011472990736365318, -0.007527206093072891, -0.003581421449780464, 0.0003643631935119629, 0.00431014783680439, 0.008255932480096817, 0.012201717123389244, 0.01614750176668167, 0.020093286409974098, 0.024039071053266525, 0.027984855696558952, 0.03193064033985138, 0.03587642312049866, 0.039822209626436234, 0.04376799613237381, 0.04771377891302109, 0.051659561693668365, 0.05560534819960594, 0.05955113470554352, 0.0634969174861908, 0.06744270026683807, 0.07138848304748535, 0.07533427327871323, 0.0792800560593605, 0.08322583884000778, 0.08717162907123566, 0.09111741185188293, 0.09506319463253021, 0.09900897741317749, 0.10295476019382477, 0.10690055042505264, 0.11084633320569992, 0.1147921159863472, 0.11873790621757507, 0.12268368899822235, 0.12662947177886963]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 7.0, 9.0, 15.0, 17.0, 26.0, 30.0, 43.0, 80.0, 103.0, 160.0, 201.0, 332.0, 528.0, 903.0, 1438.0, 2802.0, 5378.0, 10782.0, 23174.0, 52400.0, 120483.0, 258893.0, 298215.0, 150503.0, 65724.0, 28819.0, 13349.0, 6346.0, 3173.0, 1782.0, 993.0, 630.0, 360.0, 257.0, 177.0, 117.0, 84.0, 45.0, 44.0, 43.0, 23.0, 17.0, 7.0, 8.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.079345703125, -0.07708740234375, -0.0748291015625, -0.07257080078125, -0.0703125, -0.06805419921875, -0.0657958984375, -0.06353759765625, -0.061279296875, -0.05902099609375, -0.0567626953125, -0.05450439453125, -0.05224609375, -0.04998779296875, -0.0477294921875, -0.04547119140625, -0.043212890625, -0.04095458984375, -0.0386962890625, -0.03643798828125, -0.0341796875, -0.03192138671875, -0.0296630859375, -0.02740478515625, -0.025146484375, -0.02288818359375, -0.0206298828125, -0.01837158203125, -0.01611328125, -0.01385498046875, -0.0115966796875, -0.00933837890625, -0.007080078125, -0.00482177734375, -0.0025634765625, -0.00030517578125, 0.001953125, 0.00421142578125, 0.0064697265625, 0.00872802734375, 0.010986328125, 0.01324462890625, 0.0155029296875, 0.01776123046875, 0.02001953125, 0.02227783203125, 0.0245361328125, 0.02679443359375, 0.029052734375, 0.03131103515625, 0.0335693359375, 0.03582763671875, 0.0380859375, 0.04034423828125, 0.0426025390625, 0.04486083984375, 0.047119140625, 0.04937744140625, 0.0516357421875, 0.05389404296875, 0.05615234375, 0.05841064453125, 0.0606689453125, 0.06292724609375, 0.065185546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 13.0, 12.0, 22.0, 26.0, 42.0, 47.0, 50.0, 82.0, 69.0, 91.0, 83.0, 81.0, 63.0, 68.0, 56.0, 45.0, 35.0, 39.0, 18.0, 14.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.027905941009521484, -0.02704906463623047, -0.026192188262939453, -0.025335311889648438, -0.024478435516357422, -0.023621559143066406, -0.02276468276977539, -0.021907806396484375, -0.02105093002319336, -0.020194053649902344, -0.019337177276611328, -0.018480300903320312, -0.017623424530029297, -0.01676654815673828, -0.015909671783447266, -0.01505279541015625, -0.014195919036865234, -0.013339042663574219, -0.012482166290283203, -0.011625289916992188, -0.010768413543701172, -0.009911537170410156, -0.00905466079711914, -0.008197784423828125, -0.007340908050537109, -0.006484031677246094, -0.005627155303955078, -0.0047702789306640625, -0.003913402557373047, -0.0030565261840820312, -0.0021996498107910156, -0.0013427734375, -0.0004858970642089844, 0.00037097930908203125, 0.0012278556823730469, 0.0020847320556640625, 0.002941608428955078, 0.0037984848022460938, 0.004655361175537109, 0.005512237548828125, 0.006369113922119141, 0.007225990295410156, 0.008082866668701172, 0.008939743041992188, 0.009796619415283203, 0.010653495788574219, 0.011510372161865234, 0.01236724853515625, 0.013224124908447266, 0.014081001281738281, 0.014937877655029297, 0.015794754028320312, 0.016651630401611328, 0.017508506774902344, 0.01836538314819336, 0.019222259521484375, 0.02007913589477539, 0.020936012268066406, 0.021792888641357422, 0.022649765014648438, 0.023506641387939453, 0.02436351776123047, 0.025220394134521484, 0.0260772705078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 7.0, 5.0, 10.0, 8.0, 16.0, 21.0, 18.0, 41.0, 48.0, 69.0, 81.0, 130.0, 184.0, 223.0, 322.0, 536.0, 810.0, 1290.0, 2461.0, 5613.0, 13960.0, 41784.0, 133899.0, 370809.0, 316134.0, 105077.0, 33268.0, 11459.0, 4637.0, 2169.0, 1178.0, 735.0, 463.0, 312.0, 230.0, 139.0, 118.0, 63.0, 54.0, 38.0, 43.0, 25.0, 24.0, 14.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.097412109375, -0.0944509506225586, -0.09148979187011719, -0.08852863311767578, -0.08556747436523438, -0.08260631561279297, -0.07964515686035156, -0.07668399810791016, -0.07372283935546875, -0.07076168060302734, -0.06780052185058594, -0.06483936309814453, -0.061878204345703125, -0.05891704559326172, -0.05595588684082031, -0.052994728088378906, -0.0500335693359375, -0.047072410583496094, -0.04411125183105469, -0.04115009307861328, -0.038188934326171875, -0.03522777557373047, -0.03226661682128906, -0.029305458068847656, -0.02634429931640625, -0.023383140563964844, -0.020421981811523438, -0.01746082305908203, -0.014499664306640625, -0.011538505554199219, -0.008577346801757812, -0.005616188049316406, -0.002655029296875, 0.00030612945556640625, 0.0032672882080078125, 0.006228446960449219, 0.009189605712890625, 0.012150764465332031, 0.015111923217773438, 0.018073081970214844, 0.02103424072265625, 0.023995399475097656, 0.026956558227539062, 0.02991771697998047, 0.032878875732421875, 0.03584003448486328, 0.03880119323730469, 0.041762351989746094, 0.0447235107421875, 0.047684669494628906, 0.05064582824707031, 0.05360698699951172, 0.056568145751953125, 0.05952930450439453, 0.06249046325683594, 0.06545162200927734, 0.06841278076171875, 0.07137393951416016, 0.07433509826660156, 0.07729625701904297, 0.08025741577148438, 0.08321857452392578, 0.08617973327636719, 0.0891408920288086, 0.09210205078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 19.0, 23.0, 30.0, 21.0, 35.0, 30.0, 42.0, 44.0, 45.0, 55.0, 65.0, 58.0, 49.0, 43.0, 61.0, 52.0, 52.0, 30.0, 23.0, 34.0, 22.0, 22.0, 21.0, 18.0, 13.0, 16.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11798095703125, -0.11449813842773438, -0.11101531982421875, -0.10753250122070312, -0.1040496826171875, -0.10056686401367188, -0.09708404541015625, -0.09360122680664062, -0.090118408203125, -0.08663558959960938, -0.08315277099609375, -0.07966995239257812, -0.0761871337890625, -0.07270431518554688, -0.06922149658203125, -0.06573867797851562, -0.062255859375, -0.058773040771484375, -0.05529022216796875, -0.051807403564453125, -0.0483245849609375, -0.044841766357421875, -0.04135894775390625, -0.037876129150390625, -0.034393310546875, -0.030910491943359375, -0.02742767333984375, -0.023944854736328125, -0.0204620361328125, -0.016979217529296875, -0.01349639892578125, -0.010013580322265625, -0.00653076171875, -0.003047943115234375, 0.00043487548828125, 0.003917694091796875, 0.0074005126953125, 0.010883331298828125, 0.01436614990234375, 0.017848968505859375, 0.021331787109375, 0.024814605712890625, 0.02829742431640625, 0.031780242919921875, 0.0352630615234375, 0.038745880126953125, 0.04222869873046875, 0.045711517333984375, 0.0491943359375, 0.052677154541015625, 0.05615997314453125, 0.059642791748046875, 0.0631256103515625, 0.06660842895507812, 0.07009124755859375, 0.07357406616210938, 0.077056884765625, 0.08053970336914062, 0.08402252197265625, 0.08750534057617188, 0.0909881591796875, 0.09447097778320312, 0.09795379638671875, 0.10143661499023438, 0.10491943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 15.0, 11.0, 13.0, 22.0, 42.0, 63.0, 94.0, 125.0, 219.0, 377.0, 704.0, 1184.0, 2353.0, 4775.0, 10342.0, 25200.0, 72515.0, 296114.0, 460401.0, 111637.0, 35675.0, 13895.0, 6163.0, 2990.0, 1569.0, 830.0, 447.0, 266.0, 180.0, 104.0, 70.0, 57.0, 29.0, 21.0, 20.0, 6.0, 11.0, 7.0, 1.0, 0.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.0547032356262207, -0.052613258361816406, -0.05052328109741211, -0.04843330383300781, -0.046343326568603516, -0.04425334930419922, -0.04216337203979492, -0.040073394775390625, -0.03798341751098633, -0.03589344024658203, -0.033803462982177734, -0.03171348571777344, -0.02962350845336914, -0.027533531188964844, -0.025443553924560547, -0.02335357666015625, -0.021263599395751953, -0.019173622131347656, -0.01708364486694336, -0.014993667602539062, -0.012903690338134766, -0.010813713073730469, -0.008723735809326172, -0.006633758544921875, -0.004543781280517578, -0.0024538040161132812, -0.0003638267517089844, 0.0017261505126953125, 0.0038161277770996094, 0.005906105041503906, 0.007996082305908203, 0.0100860595703125, 0.012176036834716797, 0.014266014099121094, 0.01635599136352539, 0.018445968627929688, 0.020535945892333984, 0.02262592315673828, 0.024715900421142578, 0.026805877685546875, 0.028895854949951172, 0.03098583221435547, 0.033075809478759766, 0.03516578674316406, 0.03725576400756836, 0.039345741271972656, 0.04143571853637695, 0.04352569580078125, 0.04561567306518555, 0.047705650329589844, 0.04979562759399414, 0.05188560485839844, 0.053975582122802734, 0.05606555938720703, 0.05815553665161133, 0.060245513916015625, 0.06233549118041992, 0.06442546844482422, 0.06651544570922852, 0.06860542297363281, 0.07069540023803711, 0.0727853775024414, 0.0748753547668457, 0.07696533203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 17.0, 22.0, 32.0, 47.0, 72.0, 63.0, 78.0, 97.0, 114.0, 103.0, 78.0, 71.0, 61.0, 39.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.043988883495331e-05, -3.856047987937927e-05, -3.668107092380524e-05, -3.48016619682312e-05, -3.2922253012657166e-05, -3.104284405708313e-05, -2.9163435101509094e-05, -2.728402614593506e-05, -2.5404617190361023e-05, -2.3525208234786987e-05, -2.164579927921295e-05, -1.9766390323638916e-05, -1.788698136806488e-05, -1.6007572412490845e-05, -1.4128163456916809e-05, -1.2248754501342773e-05, -1.0369345545768738e-05, -8.489936590194702e-06, -6.6105276346206665e-06, -4.731118679046631e-06, -2.8517097234725952e-06, -9.723007678985596e-07, 9.071081876754761e-07, 2.7865171432495117e-06, 4.665926098823547e-06, 6.545335054397583e-06, 8.424744009971619e-06, 1.0304152965545654e-05, 1.218356192111969e-05, 1.4062970876693726e-05, 1.594237983226776e-05, 1.7821788787841797e-05, 1.9701197743415833e-05, 2.1580606698989868e-05, 2.3460015654563904e-05, 2.533942461013794e-05, 2.7218833565711975e-05, 2.909824252128601e-05, 3.0977651476860046e-05, 3.285706043243408e-05, 3.473646938800812e-05, 3.661587834358215e-05, 3.849528729915619e-05, 4.0374696254730225e-05, 4.225410521030426e-05, 4.4133514165878296e-05, 4.601292312145233e-05, 4.789233207702637e-05, 4.97717410326004e-05, 5.165114998817444e-05, 5.3530558943748474e-05, 5.540996789932251e-05, 5.7289376854896545e-05, 5.916878581047058e-05, 6.104819476604462e-05, 6.292760372161865e-05, 6.480701267719269e-05, 6.668642163276672e-05, 6.856583058834076e-05, 7.04452395439148e-05, 7.232464849948883e-05, 7.420405745506287e-05, 7.60834664106369e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 11.0, 13.0, 10.0, 12.0, 22.0, 26.0, 38.0, 56.0, 77.0, 114.0, 180.0, 266.0, 520.0, 847.0, 1827.0, 4155.0, 10959.0, 33791.0, 141930.0, 610947.0, 181656.0, 39563.0, 12376.0, 4771.0, 1966.0, 987.0, 495.0, 305.0, 180.0, 113.0, 71.0, 77.0, 51.0, 26.0, 24.0, 26.0, 14.0, 7.0, 6.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.0732269287109375, -0.070831298828125, -0.0684356689453125, -0.0660400390625, -0.0636444091796875, -0.061248779296875, -0.0588531494140625, -0.05645751953125, -0.0540618896484375, -0.051666259765625, -0.0492706298828125, -0.046875, -0.0444793701171875, -0.042083740234375, -0.0396881103515625, -0.03729248046875, -0.0348968505859375, -0.032501220703125, -0.0301055908203125, -0.0277099609375, -0.0253143310546875, -0.022918701171875, -0.0205230712890625, -0.01812744140625, -0.0157318115234375, -0.013336181640625, -0.0109405517578125, -0.008544921875, -0.0061492919921875, -0.003753662109375, -0.0013580322265625, 0.00103759765625, 0.0034332275390625, 0.005828857421875, 0.0082244873046875, 0.0106201171875, 0.0130157470703125, 0.015411376953125, 0.0178070068359375, 0.02020263671875, 0.0225982666015625, 0.024993896484375, 0.0273895263671875, 0.02978515625, 0.0321807861328125, 0.034576416015625, 0.0369720458984375, 0.03936767578125, 0.0417633056640625, 0.044158935546875, 0.0465545654296875, 0.0489501953125, 0.0513458251953125, 0.053741455078125, 0.0561370849609375, 0.05853271484375, 0.0609283447265625, 0.063323974609375, 0.0657196044921875, 0.068115234375, 0.0705108642578125, 0.072906494140625, 0.0753021240234375, 0.07769775390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 6.0, 11.0, 8.0, 10.0, 14.0, 21.0, 23.0, 30.0, 31.0, 46.0, 57.0, 85.0, 94.0, 92.0, 98.0, 71.0, 76.0, 50.0, 34.0, 22.0, 16.0, 20.0, 14.0, 11.0, 4.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0531005859375, -0.051512718200683594, -0.04992485046386719, -0.04833698272705078, -0.046749114990234375, -0.04516124725341797, -0.04357337951660156, -0.041985511779785156, -0.04039764404296875, -0.038809776306152344, -0.03722190856933594, -0.03563404083251953, -0.034046173095703125, -0.03245830535888672, -0.030870437622070312, -0.029282569885253906, -0.0276947021484375, -0.026106834411621094, -0.024518966674804688, -0.02293109893798828, -0.021343231201171875, -0.01975536346435547, -0.018167495727539062, -0.016579627990722656, -0.01499176025390625, -0.013403892517089844, -0.011816024780273438, -0.010228157043457031, -0.008640289306640625, -0.007052421569824219, -0.0054645538330078125, -0.0038766860961914062, -0.002288818359375, -0.0007009506225585938, 0.0008869171142578125, 0.0024747848510742188, 0.004062652587890625, 0.005650520324707031, 0.0072383880615234375, 0.008826255798339844, 0.01041412353515625, 0.012001991271972656, 0.013589859008789062, 0.015177726745605469, 0.016765594482421875, 0.01835346221923828, 0.019941329956054688, 0.021529197692871094, 0.0231170654296875, 0.024704933166503906, 0.026292800903320312, 0.02788066864013672, 0.029468536376953125, 0.03105640411376953, 0.03264427185058594, 0.034232139587402344, 0.03582000732421875, 0.037407875061035156, 0.03899574279785156, 0.04058361053466797, 0.042171478271484375, 0.04375934600830078, 0.04534721374511719, 0.046935081481933594, 0.04852294921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 17.0, 37.0, 60.0, 130.0, 164.0, 197.0, 179.0, 111.0, 61.0, 23.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36662888526916504, -0.3313409984111786, -0.29605311155319214, -0.2607652544975281, -0.22547736763954163, -0.19018948078155518, -0.15490160882472992, -0.11961373686790466, -0.08432585000991821, -0.04903797060251236, -0.013750091195106506, 0.021537788212299347, 0.0568256676197052, 0.09211355447769165, 0.1274014264345169, 0.16268929839134216, 0.1979771852493286, 0.23326507210731506, 0.2685529589653015, 0.3038408160209656, 0.339128702878952, 0.3744165897369385, 0.40970444679260254, 0.444992333650589, 0.48028022050857544, 0.5155680775642395, 0.5508559942245483, 0.5861438512802124, 0.6214317083358765, 0.6567196249961853, 0.6920074820518494, 0.7272953987121582, 0.7625832557678223, 0.7978711128234863, 0.8331590294837952, 0.8684468865394592, 0.9037348031997681, 0.9390226602554321, 0.9743105173110962, 1.0095983743667603, 1.0448863506317139, 1.080174207687378, 1.115462064743042, 1.1507500410079956, 1.1860378980636597, 1.2213257551193237, 1.2566136121749878, 1.2919014692306519, 1.327189326286316, 1.36247718334198, 1.397765040397644, 1.4330530166625977, 1.4683408737182617, 1.5036287307739258, 1.5389165878295898, 1.574204444885254, 1.609492301940918, 1.644780158996582, 1.680068016052246, 1.7153559923171997, 1.7506438493728638, 1.7859317064285278, 1.821219563484192, 1.856507420539856, 1.8917953968048096]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 12.0, 8.0, 27.0, 20.0, 23.0, 26.0, 40.0, 36.0, 49.0, 50.0, 69.0, 54.0, 61.0, 65.0, 62.0, 56.0, 44.0, 48.0, 49.0, 43.0, 27.0, 25.0, 22.0, 18.0, 10.0, 11.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6638667583465576, -0.6416358947753906, -0.6194049715995789, -0.5971741080284119, -0.5749431848526001, -0.5527123212814331, -0.5304814577102661, -0.5082505345344543, -0.48601964116096497, -0.4637887477874756, -0.4415578544139862, -0.4193269610404968, -0.39709609746932983, -0.37486517429351807, -0.3526343107223511, -0.3304034173488617, -0.3081725239753723, -0.28594163060188293, -0.26371073722839355, -0.24147985875606537, -0.219248965382576, -0.1970180720090866, -0.17478719353675842, -0.15255630016326904, -0.13032540678977966, -0.10809451341629028, -0.0858636274933815, -0.06363274157047272, -0.04140184819698334, -0.019170954823493958, 0.0030599236488342285, 0.02529081702232361, 0.047521770000457764, 0.06975266337394714, 0.09198354929685593, 0.11421443521976471, 0.1364453285932541, 0.15867622196674347, 0.18090710043907166, 0.20313799381256104, 0.22536888718605042, 0.2475997805595398, 0.2698306739330292, 0.29206156730651855, 0.31429243087768555, 0.3365233540534973, 0.3587542176246643, 0.3809851109981537, 0.40321600437164307, 0.42544689774513245, 0.4476777911186218, 0.4699086546897888, 0.4921395778656006, 0.5143704414367676, 0.5366013050079346, 0.5588322281837463, 0.5810631513595581, 0.6032940149307251, 0.6255249381065369, 0.6477558016777039, 0.6699867248535156, 0.6922175884246826, 0.7144484519958496, 0.7366793751716614, 0.7589102387428284]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 8.0, 11.0, 23.0, 32.0, 54.0, 93.0, 194.0, 348.0, 739.0, 1737.0, 5003.0, 21371.0, 176554.0, 3826009.0, 135625.0, 18810.0, 4659.0, 1604.0, 707.0, 332.0, 146.0, 105.0, 40.0, 33.0, 14.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17201614379882812, -0.16617584228515625, -0.16033554077148438, -0.1544952392578125, -0.14865493774414062, -0.14281463623046875, -0.13697433471679688, -0.131134033203125, -0.12529373168945312, -0.11945343017578125, -0.11361312866210938, -0.1077728271484375, -0.10193252563476562, -0.09609222412109375, -0.09025192260742188, -0.08441162109375, -0.07857131958007812, -0.07273101806640625, -0.06689071655273438, -0.0610504150390625, -0.055210113525390625, -0.04936981201171875, -0.043529510498046875, -0.037689208984375, -0.031848907470703125, -0.02600860595703125, -0.020168304443359375, -0.0143280029296875, -0.008487701416015625, -0.00264739990234375, 0.003192901611328125, 0.009033203125, 0.014873504638671875, 0.02071380615234375, 0.026554107666015625, 0.0323944091796875, 0.038234710693359375, 0.04407501220703125, 0.049915313720703125, 0.055755615234375, 0.061595916748046875, 0.06743621826171875, 0.07327651977539062, 0.0791168212890625, 0.08495712280273438, 0.09079742431640625, 0.09663772583007812, 0.10247802734375, 0.10831832885742188, 0.11415863037109375, 0.11999893188476562, 0.1258392333984375, 0.13167953491210938, 0.13751983642578125, 0.14336013793945312, 0.149200439453125, 0.15504074096679688, 0.16088104248046875, 0.16672134399414062, 0.1725616455078125, 0.17840194702148438, 0.18424224853515625, 0.19008255004882812, 0.1959228515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 9.0, 23.0, 23.0, 27.0, 27.0, 53.0, 62.0, 63.0, 58.0, 82.0, 75.0, 83.0, 54.0, 61.0, 42.0, 62.0, 38.0, 38.0, 25.0, 22.0, 14.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02801513671875, -0.027231693267822266, -0.02644824981689453, -0.025664806365966797, -0.024881362915039062, -0.024097919464111328, -0.023314476013183594, -0.02253103256225586, -0.021747589111328125, -0.02096414566040039, -0.020180702209472656, -0.019397258758544922, -0.018613815307617188, -0.017830371856689453, -0.01704692840576172, -0.016263484954833984, -0.01548004150390625, -0.014696598052978516, -0.013913154602050781, -0.013129711151123047, -0.012346267700195312, -0.011562824249267578, -0.010779380798339844, -0.00999593734741211, -0.009212493896484375, -0.00842905044555664, -0.007645606994628906, -0.006862163543701172, -0.0060787200927734375, -0.005295276641845703, -0.004511833190917969, -0.0037283897399902344, -0.0029449462890625, -0.0021615028381347656, -0.0013780593872070312, -0.0005946159362792969, 0.0001888275146484375, 0.0009722709655761719, 0.0017557144165039062, 0.0025391578674316406, 0.003322601318359375, 0.004106044769287109, 0.004889488220214844, 0.005672931671142578, 0.0064563751220703125, 0.007239818572998047, 0.008023262023925781, 0.008806705474853516, 0.00959014892578125, 0.010373592376708984, 0.011157035827636719, 0.011940479278564453, 0.012723922729492188, 0.013507366180419922, 0.014290809631347656, 0.01507425308227539, 0.015857696533203125, 0.01664113998413086, 0.017424583435058594, 0.018208026885986328, 0.018991470336914062, 0.019774913787841797, 0.02055835723876953, 0.021341800689697266, 0.022125244140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 11.0, 8.0, 21.0, 18.0, 33.0, 32.0, 38.0, 37.0, 54.0, 82.0, 157.0, 344.0, 1037.0, 4337.0, 31020.0, 2887850.0, 1235929.0, 27547.0, 3995.0, 987.0, 344.0, 117.0, 74.0, 47.0, 24.0, 22.0, 25.0, 13.0, 13.0, 13.0, 10.0, 5.0, 6.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317626953125, -0.3073692321777344, -0.29711151123046875, -0.2868537902832031, -0.2765960693359375, -0.2663383483886719, -0.25608062744140625, -0.24582290649414062, -0.235565185546875, -0.22530746459960938, -0.21504974365234375, -0.20479202270507812, -0.1945343017578125, -0.18427658081054688, -0.17401885986328125, -0.16376113891601562, -0.15350341796875, -0.14324569702148438, -0.13298797607421875, -0.12273025512695312, -0.1124725341796875, -0.10221481323242188, -0.09195709228515625, -0.08169937133789062, -0.071441650390625, -0.061183929443359375, -0.05092620849609375, -0.040668487548828125, -0.0304107666015625, -0.020153045654296875, -0.00989532470703125, 0.000362396240234375, 0.0106201171875, 0.020877838134765625, 0.03113555908203125, 0.041393280029296875, 0.0516510009765625, 0.061908721923828125, 0.07216644287109375, 0.08242416381835938, 0.092681884765625, 0.10293960571289062, 0.11319732666015625, 0.12345504760742188, 0.1337127685546875, 0.14397048950195312, 0.15422821044921875, 0.16448593139648438, 0.17474365234375, 0.18500137329101562, 0.19525909423828125, 0.20551681518554688, 0.2157745361328125, 0.22603225708007812, 0.23628997802734375, 0.24654769897460938, 0.256805419921875, 0.2670631408691406, 0.27732086181640625, 0.2875785827636719, 0.2978363037109375, 0.3080940246582031, 0.31835174560546875, 0.3286094665527344, 0.3388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 20.0, 25.0, 91.0, 188.0, 715.0, 2356.0, 381.0, 149.0, 48.0, 39.0, 23.0, 13.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1393880844116211, -0.1364421844482422, -0.13349628448486328, -0.13055038452148438, -0.12760448455810547, -0.12465858459472656, -0.12171268463134766, -0.11876678466796875, -0.11582088470458984, -0.11287498474121094, -0.10992908477783203, -0.10698318481445312, -0.10403728485107422, -0.10109138488769531, -0.0981454849243164, -0.0951995849609375, -0.0922536849975586, -0.08930778503417969, -0.08636188507080078, -0.08341598510742188, -0.08047008514404297, -0.07752418518066406, -0.07457828521728516, -0.07163238525390625, -0.06868648529052734, -0.06574058532714844, -0.06279468536376953, -0.059848785400390625, -0.05690288543701172, -0.05395698547363281, -0.051011085510253906, -0.048065185546875, -0.045119285583496094, -0.04217338562011719, -0.03922748565673828, -0.036281585693359375, -0.03333568572998047, -0.030389785766601562, -0.027443885803222656, -0.02449798583984375, -0.021552085876464844, -0.018606185913085938, -0.01566028594970703, -0.012714385986328125, -0.009768486022949219, -0.0068225860595703125, -0.0038766860961914062, -0.0009307861328125, 0.0020151138305664062, 0.0049610137939453125, 0.007906913757324219, 0.010852813720703125, 0.013798713684082031, 0.016744613647460938, 0.019690513610839844, 0.02263641357421875, 0.025582313537597656, 0.028528213500976562, 0.03147411346435547, 0.034420013427734375, 0.03736591339111328, 0.04031181335449219, 0.043257713317871094, 0.04620361328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 14.0, 30.0, 61.0, 88.0, 140.0, 168.0, 161.0, 133.0, 93.0, 65.0, 24.0, 11.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18401604890823364, -0.17166294157505035, -0.15930983424186707, -0.14695671200752258, -0.1346036046743393, -0.122250497341156, -0.10989739000797272, -0.09754427522420883, -0.08519116789102554, -0.07283806055784225, -0.06048494577407837, -0.04813183844089508, -0.035778727382421494, -0.023425616323947906, -0.011072508990764618, 0.0012806057929992676, 0.013633713126182556, 0.025986824184656143, 0.03833993524312973, 0.05069304257631302, 0.0630461573600769, 0.07539926469326019, 0.08775237202644348, 0.10010548681020737, 0.11245859414339066, 0.12481170147657394, 0.13716481626033783, 0.14951792359352112, 0.1618710309267044, 0.1742241382598877, 0.18657726049423218, 0.19893036782741547, 0.21128347516059875, 0.22363658249378204, 0.23598968982696533, 0.24834281206130981, 0.2606959044933319, 0.2730490267276764, 0.2854021191596985, 0.29775524139404297, 0.31010836362838745, 0.32246148586273193, 0.33481457829475403, 0.3471677005290985, 0.3595207929611206, 0.3718739151954651, 0.38422703742980957, 0.39658012986183167, 0.40893322229385376, 0.42128634452819824, 0.43363943696022034, 0.4459925591945648, 0.4583456516265869, 0.4706987738609314, 0.4830518960952759, 0.495404988527298, 0.5077581405639648, 0.5201112627983093, 0.5324643850326538, 0.5448174476623535, 0.557170569896698, 0.5695236921310425, 0.581876814365387, 0.5942299365997314, 0.6065829992294312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 11.0, 5.0, 18.0, 23.0, 24.0, 28.0, 30.0, 28.0, 23.0, 35.0, 50.0, 46.0, 40.0, 36.0, 32.0, 51.0, 42.0, 34.0, 44.0, 37.0, 45.0, 35.0, 41.0, 29.0, 19.0, 25.0, 20.0, 21.0, 12.0, 19.0, 9.0, 7.0, 14.0, 6.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.16341900825500488, -0.1584937572479248, -0.15356852114200592, -0.14864327013492584, -0.14371801912784576, -0.13879278302192688, -0.1338675320148468, -0.12894228100776672, -0.12401703745126724, -0.11909179389476776, -0.11416654288768768, -0.1092412993311882, -0.10431605577468872, -0.09939080476760864, -0.09446556121110916, -0.08954031765460968, -0.0846150666475296, -0.07968982309103012, -0.07476457208395004, -0.06983932852745056, -0.06491407752037048, -0.059988833963871, -0.05506359040737152, -0.05013834312558174, -0.04521309584379196, -0.04028784856200218, -0.0353626012802124, -0.03043735772371292, -0.02551211044192314, -0.020586863160133362, -0.01566161774098873, -0.010736372321844101, -0.005811125040054321, -0.0008858786895871162, 0.004039367660880089, 0.008964614011347294, 0.013889860361814499, 0.01881510764360428, 0.02374035306274891, 0.02866559848189354, 0.03359084576368332, 0.0385160930454731, 0.04344134032726288, 0.04836658388376236, 0.05329183116555214, 0.05821707844734192, 0.0631423220038414, 0.06806756556034088, 0.07299281656742096, 0.07791806012392044, 0.08284331113100052, 0.0877685546875, 0.09269380569458008, 0.09761904925107956, 0.10254429280757904, 0.10746954381465912, 0.1123947873711586, 0.11732003092765808, 0.12224528193473816, 0.12717053294181824, 0.13209576904773712, 0.1370210200548172, 0.14194627106189728, 0.14687150716781616, 0.15179675817489624]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 9.0, 9.0, 18.0, 23.0, 33.0, 43.0, 80.0, 133.0, 191.0, 314.0, 570.0, 972.0, 1916.0, 3876.0, 7944.0, 17487.0, 41180.0, 97913.0, 230820.0, 340556.0, 174744.0, 72925.0, 30731.0, 13254.0, 6154.0, 3024.0, 1556.0, 838.0, 513.0, 248.0, 187.0, 80.0, 77.0, 50.0, 31.0, 18.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0860595703125, -0.08362388610839844, -0.08118820190429688, -0.07875251770019531, -0.07631683349609375, -0.07388114929199219, -0.07144546508789062, -0.06900978088378906, -0.0665740966796875, -0.06413841247558594, -0.061702728271484375, -0.05926704406738281, -0.05683135986328125, -0.05439567565917969, -0.051959991455078125, -0.04952430725097656, -0.047088623046875, -0.04465293884277344, -0.042217254638671875, -0.03978157043457031, -0.03734588623046875, -0.03491020202636719, -0.032474517822265625, -0.030038833618164062, -0.0276031494140625, -0.025167465209960938, -0.022731781005859375, -0.020296096801757812, -0.01786041259765625, -0.015424728393554688, -0.012989044189453125, -0.010553359985351562, -0.00811767578125, -0.0056819915771484375, -0.003246307373046875, -0.0008106231689453125, 0.00162506103515625, 0.0040607452392578125, 0.006496429443359375, 0.008932113647460938, 0.0113677978515625, 0.013803482055664062, 0.016239166259765625, 0.018674850463867188, 0.02111053466796875, 0.023546218872070312, 0.025981903076171875, 0.028417587280273438, 0.030853271484375, 0.03328895568847656, 0.035724639892578125, 0.03816032409667969, 0.04059600830078125, 0.04303169250488281, 0.045467376708984375, 0.04790306091308594, 0.0503387451171875, 0.05277442932128906, 0.055210113525390625, 0.05764579772949219, 0.06008148193359375, 0.06251716613769531, 0.06495285034179688, 0.06738853454589844, 0.06982421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 5.0, 13.0, 11.0, 31.0, 22.0, 40.0, 39.0, 48.0, 48.0, 55.0, 68.0, 90.0, 69.0, 62.0, 49.0, 62.0, 49.0, 51.0, 36.0, 32.0, 36.0, 18.0, 17.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028775691986083984, -0.02796459197998047, -0.027153491973876953, -0.026342391967773438, -0.025531291961669922, -0.024720191955566406, -0.02390909194946289, -0.023097991943359375, -0.02228689193725586, -0.021475791931152344, -0.020664691925048828, -0.019853591918945312, -0.019042491912841797, -0.01823139190673828, -0.017420291900634766, -0.01660919189453125, -0.015798091888427734, -0.014986991882324219, -0.014175891876220703, -0.013364791870117188, -0.012553691864013672, -0.011742591857910156, -0.01093149185180664, -0.010120391845703125, -0.00930929183959961, -0.008498191833496094, -0.007687091827392578, -0.0068759918212890625, -0.006064891815185547, -0.005253791809082031, -0.004442691802978516, -0.003631591796875, -0.0028204917907714844, -0.0020093917846679688, -0.0011982917785644531, -0.0003871917724609375, 0.0004239082336425781, 0.0012350082397460938, 0.0020461082458496094, 0.002857208251953125, 0.0036683082580566406, 0.004479408264160156, 0.005290508270263672, 0.0061016082763671875, 0.006912708282470703, 0.007723808288574219, 0.008534908294677734, 0.00934600830078125, 0.010157108306884766, 0.010968208312988281, 0.011779308319091797, 0.012590408325195312, 0.013401508331298828, 0.014212608337402344, 0.01502370834350586, 0.015834808349609375, 0.01664590835571289, 0.017457008361816406, 0.018268108367919922, 0.019079208374023438, 0.019890308380126953, 0.02070140838623047, 0.021512508392333984, 0.0223236083984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 11.0, 11.0, 17.0, 40.0, 51.0, 76.0, 136.0, 231.0, 354.0, 774.0, 1513.0, 3769.0, 14688.0, 87902.0, 525238.0, 347483.0, 51292.0, 9468.0, 2770.0, 1209.0, 610.0, 338.0, 211.0, 122.0, 88.0, 51.0, 30.0, 18.0, 13.0, 11.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.1348094940185547, -0.12997055053710938, -0.12513160705566406, -0.12029266357421875, -0.11545372009277344, -0.11061477661132812, -0.10577583312988281, -0.1009368896484375, -0.09609794616699219, -0.09125900268554688, -0.08642005920410156, -0.08158111572265625, -0.07674217224121094, -0.07190322875976562, -0.06706428527832031, -0.062225341796875, -0.05738639831542969, -0.052547454833984375, -0.04770851135253906, -0.04286956787109375, -0.03803062438964844, -0.033191680908203125, -0.028352737426757812, -0.0235137939453125, -0.018674850463867188, -0.013835906982421875, -0.008996963500976562, -0.00415802001953125, 0.0006809234619140625, 0.005519866943359375, 0.010358810424804688, 0.01519775390625, 0.020036697387695312, 0.024875640869140625, 0.029714584350585938, 0.03455352783203125, 0.03939247131347656, 0.044231414794921875, 0.04907035827636719, 0.0539093017578125, 0.05874824523925781, 0.06358718872070312, 0.06842613220214844, 0.07326507568359375, 0.07810401916503906, 0.08294296264648438, 0.08778190612792969, 0.092620849609375, 0.09745979309082031, 0.10229873657226562, 0.10713768005371094, 0.11197662353515625, 0.11681556701660156, 0.12165451049804688, 0.1264934539794922, 0.1313323974609375, 0.1361713409423828, 0.14101028442382812, 0.14584922790527344, 0.15068817138671875, 0.15552711486816406, 0.16036605834960938, 0.1652050018310547, 0.1700439453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 3.0, 11.0, 14.0, 24.0, 20.0, 25.0, 36.0, 48.0, 26.0, 43.0, 29.0, 44.0, 74.0, 56.0, 59.0, 57.0, 48.0, 47.0, 47.0, 46.0, 29.0, 43.0, 27.0, 37.0, 16.0, 15.0, 12.0, 15.0, 15.0, 5.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10943603515625, -0.10591697692871094, -0.10239791870117188, -0.09887886047363281, -0.09535980224609375, -0.09184074401855469, -0.08832168579101562, -0.08480262756347656, -0.0812835693359375, -0.07776451110839844, -0.07424545288085938, -0.07072639465332031, -0.06720733642578125, -0.06368827819824219, -0.060169219970703125, -0.05665016174316406, -0.053131103515625, -0.04961204528808594, -0.046092987060546875, -0.04257392883300781, -0.03905487060546875, -0.03553581237792969, -0.032016754150390625, -0.028497695922851562, -0.0249786376953125, -0.021459579467773438, -0.017940521240234375, -0.014421463012695312, -0.01090240478515625, -0.0073833465576171875, -0.003864288330078125, -0.0003452301025390625, 0.003173828125, 0.0066928863525390625, 0.010211944580078125, 0.013731002807617188, 0.01725006103515625, 0.020769119262695312, 0.024288177490234375, 0.027807235717773438, 0.0313262939453125, 0.03484535217285156, 0.038364410400390625, 0.04188346862792969, 0.04540252685546875, 0.04892158508300781, 0.052440643310546875, 0.05595970153808594, 0.059478759765625, 0.06299781799316406, 0.06651687622070312, 0.07003593444824219, 0.07355499267578125, 0.07707405090332031, 0.08059310913085938, 0.08411216735839844, 0.0876312255859375, 0.09115028381347656, 0.09466934204101562, 0.09818840026855469, 0.10170745849609375, 0.10522651672363281, 0.10874557495117188, 0.11226463317871094, 0.11578369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 15.0, 17.0, 23.0, 26.0, 51.0, 70.0, 119.0, 177.0, 309.0, 480.0, 880.0, 1657.0, 3136.0, 6487.0, 14612.0, 41046.0, 180104.0, 594953.0, 143502.0, 35331.0, 13194.0, 5841.0, 2952.0, 1511.0, 809.0, 457.0, 284.0, 148.0, 118.0, 86.0, 49.0, 40.0, 18.0, 13.0, 13.0, 4.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.085205078125, -0.08286666870117188, -0.08052825927734375, -0.07818984985351562, -0.0758514404296875, -0.07351303100585938, -0.07117462158203125, -0.06883621215820312, -0.066497802734375, -0.06415939331054688, -0.06182098388671875, -0.059482574462890625, -0.0571441650390625, -0.054805755615234375, -0.05246734619140625, -0.050128936767578125, -0.04779052734375, -0.045452117919921875, -0.04311370849609375, -0.040775299072265625, -0.0384368896484375, -0.036098480224609375, -0.03376007080078125, -0.031421661376953125, -0.029083251953125, -0.026744842529296875, -0.02440643310546875, -0.022068023681640625, -0.0197296142578125, -0.017391204833984375, -0.01505279541015625, -0.012714385986328125, -0.0103759765625, -0.008037567138671875, -0.00569915771484375, -0.003360748291015625, -0.0010223388671875, 0.001316070556640625, 0.00365447998046875, 0.005992889404296875, 0.008331298828125, 0.010669708251953125, 0.01300811767578125, 0.015346527099609375, 0.0176849365234375, 0.020023345947265625, 0.02236175537109375, 0.024700164794921875, 0.02703857421875, 0.029376983642578125, 0.03171539306640625, 0.034053802490234375, 0.0363922119140625, 0.038730621337890625, 0.04106903076171875, 0.043407440185546875, 0.045745849609375, 0.048084259033203125, 0.05042266845703125, 0.052761077880859375, 0.0550994873046875, 0.057437896728515625, 0.05977630615234375, 0.062114715576171875, 0.064453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 13.0, 19.0, 33.0, 60.0, 101.0, 128.0, 184.0, 164.0, 116.0, 75.0, 41.0, 14.0, 18.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.091594696044922e-05, -5.781091749668121e-05, -5.470588803291321e-05, -5.16008585691452e-05, -4.84958291053772e-05, -4.539079964160919e-05, -4.2285770177841187e-05, -3.918074071407318e-05, -3.6075711250305176e-05, -3.297068178653717e-05, -2.9865652322769165e-05, -2.676062285900116e-05, -2.3655593395233154e-05, -2.055056393146515e-05, -1.7445534467697144e-05, -1.4340505003929138e-05, -1.1235475540161133e-05, -8.130446076393127e-06, -5.025416612625122e-06, -1.9203871488571167e-06, 1.1846423149108887e-06, 4.289671778678894e-06, 7.394701242446899e-06, 1.0499730706214905e-05, 1.360476016998291e-05, 1.6709789633750916e-05, 1.981481909751892e-05, 2.2919848561286926e-05, 2.602487802505493e-05, 2.9129907488822937e-05, 3.223493695259094e-05, 3.533996641635895e-05, 3.844499588012695e-05, 4.155002534389496e-05, 4.4655054807662964e-05, 4.776008427143097e-05, 5.0865113735198975e-05, 5.397014319896698e-05, 5.7075172662734985e-05, 6.018020212650299e-05, 6.3285231590271e-05, 6.6390261054039e-05, 6.949529051780701e-05, 7.260031998157501e-05, 7.570534944534302e-05, 7.881037890911102e-05, 8.191540837287903e-05, 8.502043783664703e-05, 8.812546730041504e-05, 9.123049676418304e-05, 9.433552622795105e-05, 9.744055569171906e-05, 0.00010054558515548706, 0.00010365061461925507, 0.00010675564408302307, 0.00010986067354679108, 0.00011296570301055908, 0.00011607073247432709, 0.00011917576193809509, 0.0001222807914018631, 0.0001253858208656311, 0.0001284908503293991, 0.00013159587979316711, 0.00013470090925693512, 0.00013780593872070312]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 11.0, 14.0, 14.0, 14.0, 26.0, 36.0, 53.0, 85.0, 154.0, 256.0, 463.0, 985.0, 2175.0, 5539.0, 17410.0, 82048.0, 652068.0, 237791.0, 33767.0, 9375.0, 3332.0, 1381.0, 670.0, 345.0, 181.0, 103.0, 73.0, 54.0, 29.0, 25.0, 16.0, 18.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08928298950195312, -0.08628082275390625, -0.08327865600585938, -0.0802764892578125, -0.07727432250976562, -0.07427215576171875, -0.07126998901367188, -0.068267822265625, -0.06526565551757812, -0.06226348876953125, -0.059261322021484375, -0.0562591552734375, -0.053256988525390625, -0.05025482177734375, -0.047252655029296875, -0.04425048828125, -0.041248321533203125, -0.03824615478515625, -0.035243988037109375, -0.0322418212890625, -0.029239654541015625, -0.02623748779296875, -0.023235321044921875, -0.020233154296875, -0.017230987548828125, -0.01422882080078125, -0.011226654052734375, -0.0082244873046875, -0.005222320556640625, -0.00222015380859375, 0.000782012939453125, 0.0037841796875, 0.006786346435546875, 0.00978851318359375, 0.012790679931640625, 0.0157928466796875, 0.018795013427734375, 0.02179718017578125, 0.024799346923828125, 0.027801513671875, 0.030803680419921875, 0.03380584716796875, 0.036808013916015625, 0.0398101806640625, 0.042812347412109375, 0.04581451416015625, 0.048816680908203125, 0.05181884765625, 0.054821014404296875, 0.05782318115234375, 0.060825347900390625, 0.0638275146484375, 0.06682968139648438, 0.06983184814453125, 0.07283401489257812, 0.075836181640625, 0.07883834838867188, 0.08184051513671875, 0.08484268188476562, 0.0878448486328125, 0.09084701538085938, 0.09384918212890625, 0.09685134887695312, 0.099853515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 21.0, 14.0, 18.0, 38.0, 55.0, 65.0, 119.0, 110.0, 112.0, 109.0, 70.0, 50.0, 42.0, 41.0, 19.0, 20.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.08099365234375, -0.0790705680847168, -0.0771474838256836, -0.07522439956665039, -0.07330131530761719, -0.07137823104858398, -0.06945514678955078, -0.06753206253051758, -0.06560897827148438, -0.06368589401245117, -0.06176280975341797, -0.059839725494384766, -0.05791664123535156, -0.05599355697631836, -0.054070472717285156, -0.05214738845825195, -0.05022430419921875, -0.04830121994018555, -0.046378135681152344, -0.04445505142211914, -0.04253196716308594, -0.040608882904052734, -0.03868579864501953, -0.03676271438598633, -0.034839630126953125, -0.03291654586791992, -0.03099346160888672, -0.029070377349853516, -0.027147293090820312, -0.02522420883178711, -0.023301124572753906, -0.021378040313720703, -0.0194549560546875, -0.017531871795654297, -0.015608787536621094, -0.01368570327758789, -0.011762619018554688, -0.009839534759521484, -0.007916450500488281, -0.005993366241455078, -0.004070281982421875, -0.002147197723388672, -0.00022411346435546875, 0.0016989707946777344, 0.0036220550537109375, 0.005545139312744141, 0.007468223571777344, 0.009391307830810547, 0.01131439208984375, 0.013237476348876953, 0.015160560607910156, 0.01708364486694336, 0.019006729125976562, 0.020929813385009766, 0.02285289764404297, 0.024775981903076172, 0.026699066162109375, 0.028622150421142578, 0.03054523468017578, 0.032468318939208984, 0.03439140319824219, 0.03631448745727539, 0.038237571716308594, 0.0401606559753418, 0.042083740234375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 13.0, 29.0, 73.0, 141.0, 238.0, 213.0, 161.0, 73.0, 48.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3839235305786133, -0.3415030539035797, -0.29908257722854614, -0.25666213035583496, -0.2142416536808014, -0.17182117700576782, -0.12940073013305664, -0.08698025345802307, -0.0445597767829895, -0.0021393075585365295, 0.04028116166591644, 0.08270162343978882, 0.1251221001148224, 0.16754257678985596, 0.20996302366256714, 0.2523835003376007, 0.2948039770126343, 0.33722445368766785, 0.3796449303627014, 0.4220653772354126, 0.46448585391044617, 0.5069063305854797, 0.5493267774581909, 0.5917472839355469, 0.6341677308082581, 0.6765881776809692, 0.7190086841583252, 0.7614291310310364, 0.8038495779037476, 0.8462700843811035, 0.8886905312538147, 0.9311109781265259, 0.9735314846038818, 1.0159519910812378, 1.0583723783493042, 1.1007928848266602, 1.1432133913040161, 1.185633897781372, 1.2280542850494385, 1.2704747915267944, 1.3128952980041504, 1.3553158044815063, 1.3977361917495728, 1.4401566982269287, 1.4825772047042847, 1.5249977111816406, 1.567418098449707, 1.609838604927063, 1.6522589921951294, 1.6946794986724854, 1.7370998859405518, 1.7795203924179077, 1.8219408988952637, 1.86436128616333, 1.906781792640686, 1.949202299118042, 1.9916226863861084, 2.034043073654175, 2.0764636993408203, 2.1188840866088867, 2.161304473876953, 2.2037250995635986, 2.246145486831665, 2.2885658740997314, 2.330986499786377]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 6.0, 10.0, 9.0, 21.0, 16.0, 19.0, 37.0, 29.0, 31.0, 26.0, 46.0, 29.0, 32.0, 48.0, 52.0, 37.0, 38.0, 57.0, 38.0, 46.0, 47.0, 41.0, 38.0, 35.0, 17.0, 31.0, 25.0, 22.0, 19.0, 18.0, 14.0, 9.0, 5.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47896742820739746, -0.46249446272850037, -0.44602149724960327, -0.4295485019683838, -0.4130755364894867, -0.3966025710105896, -0.3801296055316925, -0.3636566400527954, -0.3471836447715759, -0.33071067929267883, -0.31423771381378174, -0.29776471853256226, -0.28129175305366516, -0.26481878757476807, -0.24834582209587097, -0.23187285661697388, -0.21539989113807678, -0.1989269256591797, -0.1824539452791214, -0.1659809798002243, -0.14950799942016602, -0.13303503394126892, -0.11656206846237183, -0.10008909553289413, -0.08361612260341644, -0.06714314967393875, -0.05067018046975136, -0.034197211265563965, -0.017724238336086273, -0.0012512654066085815, 0.015221700072288513, 0.031694673001766205, 0.048167645931243896, 0.06464061886072159, 0.08111359179019928, 0.09758655726909637, 0.11405953019857407, 0.13053250312805176, 0.14700546860694885, 0.16347843408584595, 0.17995141446590424, 0.19642437994480133, 0.21289736032485962, 0.2293703258037567, 0.2458432912826538, 0.2623162865638733, 0.278789222240448, 0.2952622175216675, 0.3117351830005646, 0.32820814847946167, 0.34468111395835876, 0.36115407943725586, 0.37762707471847534, 0.39410004019737244, 0.41057300567626953, 0.4270459711551666, 0.4435189366340637, 0.4599919021129608, 0.4764648675918579, 0.4929378628730774, 0.5094107985496521, 0.5258837938308716, 0.5423567295074463, 0.5588297247886658, 0.5753027200698853]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 10.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 63.0, 97.0, 160.0, 253.0, 381.0, 577.0, 997.0, 1750.0, 3053.0, 5866.0, 12166.0, 28015.0, 81229.0, 398437.0, 3217664.0, 321066.0, 71780.0, 25910.0, 11417.0, 5647.0, 3115.0, 1716.0, 1019.0, 617.0, 385.0, 249.0, 155.0, 118.0, 61.0, 49.0, 39.0, 15.0, 16.0, 11.0, 2.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08563232421875, -0.08290958404541016, -0.08018684387207031, -0.07746410369873047, -0.07474136352539062, -0.07201862335205078, -0.06929588317871094, -0.0665731430053711, -0.06385040283203125, -0.061127662658691406, -0.05840492248535156, -0.05568218231201172, -0.052959442138671875, -0.05023670196533203, -0.04751396179199219, -0.044791221618652344, -0.0420684814453125, -0.039345741271972656, -0.03662300109863281, -0.03390026092529297, -0.031177520751953125, -0.02845478057861328, -0.025732040405273438, -0.023009300231933594, -0.02028656005859375, -0.017563819885253906, -0.014841079711914062, -0.012118339538574219, -0.009395599365234375, -0.006672859191894531, -0.0039501190185546875, -0.0012273788452148438, 0.001495361328125, 0.004218101501464844, 0.0069408416748046875, 0.009663581848144531, 0.012386322021484375, 0.015109062194824219, 0.017831802368164062, 0.020554542541503906, 0.02327728271484375, 0.026000022888183594, 0.028722763061523438, 0.03144550323486328, 0.034168243408203125, 0.03689098358154297, 0.03961372375488281, 0.042336463928222656, 0.0450592041015625, 0.047781944274902344, 0.05050468444824219, 0.05322742462158203, 0.055950164794921875, 0.05867290496826172, 0.06139564514160156, 0.0641183853149414, 0.06684112548828125, 0.0695638656616211, 0.07228660583496094, 0.07500934600830078, 0.07773208618164062, 0.08045482635498047, 0.08317756652832031, 0.08590030670166016, 0.088623046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 12.0, 12.0, 15.0, 28.0, 35.0, 33.0, 49.0, 39.0, 69.0, 63.0, 58.0, 79.0, 74.0, 49.0, 57.0, 57.0, 56.0, 49.0, 31.0, 28.0, 24.0, 20.0, 10.0, 9.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264434814453125, -0.02564382553100586, -0.02484416961669922, -0.024044513702392578, -0.023244857788085938, -0.022445201873779297, -0.021645545959472656, -0.020845890045166016, -0.020046234130859375, -0.019246578216552734, -0.018446922302246094, -0.017647266387939453, -0.016847610473632812, -0.016047954559326172, -0.015248298645019531, -0.01444864273071289, -0.01364898681640625, -0.01284933090209961, -0.012049674987792969, -0.011250019073486328, -0.010450363159179688, -0.009650707244873047, -0.008851051330566406, -0.008051395416259766, -0.007251739501953125, -0.006452083587646484, -0.005652427673339844, -0.004852771759033203, -0.0040531158447265625, -0.003253459930419922, -0.0024538040161132812, -0.0016541481018066406, -0.0008544921875, -5.4836273193359375e-05, 0.0007448196411132812, 0.0015444755554199219, 0.0023441314697265625, 0.003143787384033203, 0.003943443298339844, 0.004743099212646484, 0.005542755126953125, 0.006342411041259766, 0.007142066955566406, 0.007941722869873047, 0.008741378784179688, 0.009541034698486328, 0.010340690612792969, 0.01114034652709961, 0.01194000244140625, 0.01273965835571289, 0.013539314270019531, 0.014338970184326172, 0.015138626098632812, 0.015938282012939453, 0.016737937927246094, 0.017537593841552734, 0.018337249755859375, 0.019136905670166016, 0.019936561584472656, 0.020736217498779297, 0.021535873413085938, 0.022335529327392578, 0.02313518524169922, 0.02393484115600586, 0.0247344970703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 6.0, 9.0, 14.0, 26.0, 22.0, 27.0, 42.0, 47.0, 80.0, 115.0, 226.0, 436.0, 928.0, 2623.0, 9960.0, 62440.0, 1356542.0, 2660067.0, 82842.0, 12506.0, 3115.0, 1095.0, 440.0, 242.0, 154.0, 87.0, 47.0, 36.0, 31.0, 24.0, 15.0, 8.0, 10.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17898178100585938, -0.17302703857421875, -0.16707229614257812, -0.1611175537109375, -0.15516281127929688, -0.14920806884765625, -0.14325332641601562, -0.137298583984375, -0.13134384155273438, -0.12538909912109375, -0.11943435668945312, -0.1134796142578125, -0.10752487182617188, -0.10157012939453125, -0.09561538696289062, -0.08966064453125, -0.08370590209960938, -0.07775115966796875, -0.07179641723632812, -0.0658416748046875, -0.059886932373046875, -0.05393218994140625, -0.047977447509765625, -0.042022705078125, -0.036067962646484375, -0.03011322021484375, -0.024158477783203125, -0.0182037353515625, -0.012248992919921875, -0.00629425048828125, -0.000339508056640625, 0.005615234375, 0.011569976806640625, 0.01752471923828125, 0.023479461669921875, 0.0294342041015625, 0.035388946533203125, 0.04134368896484375, 0.047298431396484375, 0.053253173828125, 0.059207916259765625, 0.06516265869140625, 0.07111740112304688, 0.0770721435546875, 0.08302688598632812, 0.08898162841796875, 0.09493637084960938, 0.10089111328125, 0.10684585571289062, 0.11280059814453125, 0.11875534057617188, 0.1247100830078125, 0.13066482543945312, 0.13661956787109375, 0.14257431030273438, 0.148529052734375, 0.15448379516601562, 0.16043853759765625, 0.16639328002929688, 0.1723480224609375, 0.17830276489257812, 0.18425750732421875, 0.19021224975585938, 0.1961669921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 12.0, 32.0, 51.0, 96.0, 208.0, 527.0, 1680.0, 842.0, 298.0, 124.0, 78.0, 35.0, 35.0, 8.0, 11.0, 7.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.10387325286865234, -0.10111808776855469, -0.09836292266845703, -0.09560775756835938, -0.09285259246826172, -0.09009742736816406, -0.0873422622680664, -0.08458709716796875, -0.0818319320678711, -0.07907676696777344, -0.07632160186767578, -0.07356643676757812, -0.07081127166748047, -0.06805610656738281, -0.06530094146728516, -0.0625457763671875, -0.059790611267089844, -0.05703544616699219, -0.05428028106689453, -0.051525115966796875, -0.04876995086669922, -0.04601478576660156, -0.043259620666503906, -0.04050445556640625, -0.037749290466308594, -0.03499412536621094, -0.03223896026611328, -0.029483795166015625, -0.02672863006591797, -0.023973464965820312, -0.021218299865722656, -0.018463134765625, -0.015707969665527344, -0.012952804565429688, -0.010197639465332031, -0.007442474365234375, -0.004687309265136719, -0.0019321441650390625, 0.0008230209350585938, 0.00357818603515625, 0.006333351135253906, 0.009088516235351562, 0.011843681335449219, 0.014598846435546875, 0.01735401153564453, 0.020109176635742188, 0.022864341735839844, 0.0256195068359375, 0.028374671936035156, 0.031129837036132812, 0.03388500213623047, 0.036640167236328125, 0.03939533233642578, 0.04215049743652344, 0.044905662536621094, 0.04766082763671875, 0.050415992736816406, 0.05317115783691406, 0.05592632293701172, 0.058681488037109375, 0.06143665313720703, 0.06419181823730469, 0.06694698333740234, 0.0697021484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 16.0, 76.0, 146.0, 265.0, 271.0, 135.0, 59.0, 25.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453777015209198, -0.42830225825309753, -0.40282750129699707, -0.377352774143219, -0.35187798738479614, -0.32640326023101807, -0.3009285032749176, -0.27545374631881714, -0.24997898936271667, -0.2245042324066162, -0.19902947545051575, -0.17355473339557648, -0.148079976439476, -0.12260521948337555, -0.09713047742843628, -0.07165572047233582, -0.04618096351623535, -0.020706210285425186, 0.004768542945384979, 0.030243292450904846, 0.05571804940700531, 0.08119280636310577, 0.10666754841804504, 0.1321423053741455, 0.15761706233024597, 0.18309181928634644, 0.2085665762424469, 0.23404131829738617, 0.25951606035232544, 0.2849908471107483, 0.31046557426452637, 0.33594033122062683, 0.3614150285720825, 0.386889785528183, 0.41236454248428345, 0.4378392696380615, 0.4633140563964844, 0.48878878355026245, 0.5142635107040405, 0.5397382974624634, 0.5652130842208862, 0.5906878113746643, 0.6161625981330872, 0.6416373252868652, 0.6671121120452881, 0.6925868391990662, 0.7180615663528442, 0.7435363531112671, 0.7690110802650452, 0.7944858074188232, 0.8199605941772461, 0.8454353213310242, 0.870910108089447, 0.8963848352432251, 0.921859622001648, 0.947334349155426, 0.9728090763092041, 0.9982838034629822, 1.0237585306167603, 1.049233317375183, 1.074708104133606, 1.1001828908920288, 1.125657558441162, 1.151132345199585, 1.1766071319580078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 0.0, 7.0, 8.0, 13.0, 16.0, 21.0, 22.0, 22.0, 19.0, 31.0, 45.0, 28.0, 34.0, 49.0, 53.0, 40.0, 53.0, 35.0, 34.0, 51.0, 37.0, 31.0, 43.0, 45.0, 46.0, 36.0, 25.0, 29.0, 27.0, 24.0, 16.0, 13.0, 10.0, 13.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20565760135650635, -0.19885583221912384, -0.19205406308174133, -0.18525227904319763, -0.17845050990581512, -0.17164874076843262, -0.16484695672988892, -0.1580451875925064, -0.1512434184551239, -0.1444416493177414, -0.1376398801803589, -0.13083809614181519, -0.12403632700443268, -0.11723455786705017, -0.11043278127908707, -0.10363100469112396, -0.09682923555374146, -0.09002746641635895, -0.08322568982839584, -0.07642391324043274, -0.06962214410305023, -0.06282037496566772, -0.05601859837770462, -0.049216825515031815, -0.04241505265235901, -0.0356132797896862, -0.028811506927013397, -0.02200973406434059, -0.015207961201667786, -0.00840618833899498, -0.001604415476322174, 0.005197357386350632, 0.011999130249023438, 0.018800903111696243, 0.02560267597436905, 0.032404448837041855, 0.03920622169971466, 0.046007994562387466, 0.05280976742506027, 0.05961154028773308, 0.06641331315040588, 0.07321508228778839, 0.0800168588757515, 0.0868186354637146, 0.0936204046010971, 0.10042217373847961, 0.10722395032644272, 0.11402572691440582, 0.12082749605178833, 0.12762926518917084, 0.13443103432655334, 0.14123281836509705, 0.14803458750247955, 0.15483635663986206, 0.16163814067840576, 0.16843990981578827, 0.17524167895317078, 0.18204344809055328, 0.1888452172279358, 0.1956470012664795, 0.202448770403862, 0.2092505395412445, 0.2160523235797882, 0.22285409271717072, 0.22965586185455322]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 16.0, 23.0, 33.0, 57.0, 87.0, 133.0, 186.0, 353.0, 624.0, 1080.0, 1971.0, 3932.0, 8020.0, 17929.0, 39986.0, 94038.0, 258315.0, 376774.0, 139915.0, 57486.0, 25152.0, 11153.0, 5298.0, 2611.0, 1439.0, 775.0, 441.0, 246.0, 175.0, 89.0, 76.0, 45.0, 29.0, 18.0, 11.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.095703125, -0.0926370620727539, -0.08957099914550781, -0.08650493621826172, -0.08343887329101562, -0.08037281036376953, -0.07730674743652344, -0.07424068450927734, -0.07117462158203125, -0.06810855865478516, -0.06504249572753906, -0.06197643280029297, -0.058910369873046875, -0.05584430694580078, -0.05277824401855469, -0.049712181091308594, -0.0466461181640625, -0.043580055236816406, -0.04051399230957031, -0.03744792938232422, -0.034381866455078125, -0.03131580352783203, -0.028249740600585938, -0.025183677673339844, -0.02211761474609375, -0.019051551818847656, -0.015985488891601562, -0.012919425964355469, -0.009853363037109375, -0.006787300109863281, -0.0037212371826171875, -0.0006551742553710938, 0.002410888671875, 0.005476951599121094, 0.008543014526367188, 0.011609077453613281, 0.014675140380859375, 0.01774120330810547, 0.020807266235351562, 0.023873329162597656, 0.02693939208984375, 0.030005455017089844, 0.03307151794433594, 0.03613758087158203, 0.039203643798828125, 0.04226970672607422, 0.04533576965332031, 0.048401832580566406, 0.0514678955078125, 0.054533958435058594, 0.05760002136230469, 0.06066608428955078, 0.06373214721679688, 0.06679821014404297, 0.06986427307128906, 0.07293033599853516, 0.07599639892578125, 0.07906246185302734, 0.08212852478027344, 0.08519458770751953, 0.08826065063476562, 0.09132671356201172, 0.09439277648925781, 0.0974588394165039, 0.10052490234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 8.0, 17.0, 19.0, 23.0, 31.0, 22.0, 36.0, 39.0, 39.0, 56.0, 45.0, 55.0, 66.0, 75.0, 66.0, 51.0, 56.0, 55.0, 36.0, 37.0, 37.0, 29.0, 19.0, 14.0, 16.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244903564453125, -0.02372908592224121, -0.022967815399169922, -0.022206544876098633, -0.021445274353027344, -0.020684003829956055, -0.019922733306884766, -0.019161462783813477, -0.018400192260742188, -0.0176389217376709, -0.01687765121459961, -0.01611638069152832, -0.015355110168457031, -0.014593839645385742, -0.013832569122314453, -0.013071298599243164, -0.012310028076171875, -0.011548757553100586, -0.010787487030029297, -0.010026216506958008, -0.009264945983886719, -0.00850367546081543, -0.007742404937744141, -0.0069811344146728516, -0.0062198638916015625, -0.0054585933685302734, -0.004697322845458984, -0.003936052322387695, -0.0031747817993164062, -0.002413511276245117, -0.0016522407531738281, -0.0008909702301025391, -0.00012969970703125, 0.0006315708160400391, 0.0013928413391113281, 0.002154111862182617, 0.0029153823852539062, 0.0036766529083251953, 0.004437923431396484, 0.0051991939544677734, 0.0059604644775390625, 0.0067217350006103516, 0.007483005523681641, 0.00824427604675293, 0.009005546569824219, 0.009766817092895508, 0.010528087615966797, 0.011289358139038086, 0.012050628662109375, 0.012811899185180664, 0.013573169708251953, 0.014334440231323242, 0.015095710754394531, 0.01585698127746582, 0.01661825180053711, 0.0173795223236084, 0.018140792846679688, 0.018902063369750977, 0.019663333892822266, 0.020424604415893555, 0.021185874938964844, 0.021947145462036133, 0.022708415985107422, 0.02346968650817871, 0.02423095703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 12.0, 12.0, 21.0, 34.0, 41.0, 52.0, 76.0, 109.0, 174.0, 233.0, 318.0, 524.0, 954.0, 1895.0, 3884.0, 9881.0, 27873.0, 88781.0, 356294.0, 404812.0, 101579.0, 31174.0, 10726.0, 4361.0, 2016.0, 983.0, 578.0, 378.0, 241.0, 159.0, 93.0, 74.0, 73.0, 37.0, 21.0, 20.0, 21.0, 8.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.120025634765625, -0.11639404296875, -0.112762451171875, -0.109130859375, -0.105499267578125, -0.10186767578125, -0.098236083984375, -0.0946044921875, -0.090972900390625, -0.08734130859375, -0.083709716796875, -0.080078125, -0.076446533203125, -0.07281494140625, -0.069183349609375, -0.0655517578125, -0.061920166015625, -0.05828857421875, -0.054656982421875, -0.051025390625, -0.047393798828125, -0.04376220703125, -0.040130615234375, -0.0364990234375, -0.032867431640625, -0.02923583984375, -0.025604248046875, -0.02197265625, -0.018341064453125, -0.01470947265625, -0.011077880859375, -0.0074462890625, -0.003814697265625, -0.00018310546875, 0.003448486328125, 0.007080078125, 0.010711669921875, 0.01434326171875, 0.017974853515625, 0.0216064453125, 0.025238037109375, 0.02886962890625, 0.032501220703125, 0.0361328125, 0.039764404296875, 0.04339599609375, 0.047027587890625, 0.0506591796875, 0.054290771484375, 0.05792236328125, 0.061553955078125, 0.065185546875, 0.068817138671875, 0.07244873046875, 0.076080322265625, 0.0797119140625, 0.083343505859375, 0.08697509765625, 0.090606689453125, 0.09423828125, 0.097869873046875, 0.10150146484375, 0.105133056640625, 0.1087646484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 17.0, 21.0, 27.0, 29.0, 30.0, 42.0, 36.0, 44.0, 47.0, 40.0, 48.0, 52.0, 54.0, 47.0, 46.0, 43.0, 47.0, 52.0, 38.0, 42.0, 26.0, 17.0, 16.0, 14.0, 15.0, 16.0, 11.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09312629699707031, -0.08957290649414062, -0.08601951599121094, -0.08246612548828125, -0.07891273498535156, -0.07535934448242188, -0.07180595397949219, -0.0682525634765625, -0.06469917297363281, -0.061145782470703125, -0.05759239196777344, -0.05403900146484375, -0.05048561096191406, -0.046932220458984375, -0.04337882995605469, -0.039825439453125, -0.03627204895019531, -0.032718658447265625, -0.029165267944335938, -0.02561187744140625, -0.022058486938476562, -0.018505096435546875, -0.014951705932617188, -0.0113983154296875, -0.007844924926757812, -0.004291534423828125, -0.0007381439208984375, 0.00281524658203125, 0.0063686370849609375, 0.009922027587890625, 0.013475418090820312, 0.01702880859375, 0.020582199096679688, 0.024135589599609375, 0.027688980102539062, 0.03124237060546875, 0.03479576110839844, 0.038349151611328125, 0.04190254211425781, 0.0454559326171875, 0.04900932312011719, 0.052562713623046875, 0.05611610412597656, 0.05966949462890625, 0.06322288513183594, 0.06677627563476562, 0.07032966613769531, 0.073883056640625, 0.07743644714355469, 0.08098983764648438, 0.08454322814941406, 0.08809661865234375, 0.09165000915527344, 0.09520339965820312, 0.09875679016113281, 0.1023101806640625, 0.10586357116699219, 0.10941696166992188, 0.11297035217285156, 0.11652374267578125, 0.12007713317871094, 0.12363052368164062, 0.1271839141845703, 0.1307373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 11.0, 14.0, 34.0, 48.0, 68.0, 95.0, 191.0, 239.0, 531.0, 1054.0, 2345.0, 6162.0, 22586.0, 126141.0, 690588.0, 159301.0, 27021.0, 7087.0, 2612.0, 1129.0, 527.0, 307.0, 148.0, 98.0, 61.0, 46.0, 31.0, 14.0, 21.0, 4.0, 9.0, 5.0, 5.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10290718078613281, -0.09888076782226562, -0.09485435485839844, -0.09082794189453125, -0.08680152893066406, -0.08277511596679688, -0.07874870300292969, -0.0747222900390625, -0.07069587707519531, -0.06666946411132812, -0.06264305114746094, -0.05861663818359375, -0.05459022521972656, -0.050563812255859375, -0.04653739929199219, -0.042510986328125, -0.03848457336425781, -0.034458160400390625, -0.030431747436523438, -0.02640533447265625, -0.022378921508789062, -0.018352508544921875, -0.014326095581054688, -0.0102996826171875, -0.0062732696533203125, -0.002246856689453125, 0.0017795562744140625, 0.00580596923828125, 0.009832382202148438, 0.013858795166015625, 0.017885208129882812, 0.02191162109375, 0.025938034057617188, 0.029964447021484375, 0.03399085998535156, 0.03801727294921875, 0.04204368591308594, 0.046070098876953125, 0.05009651184082031, 0.0541229248046875, 0.05814933776855469, 0.062175750732421875, 0.06620216369628906, 0.07022857666015625, 0.07425498962402344, 0.07828140258789062, 0.08230781555175781, 0.086334228515625, 0.09036064147949219, 0.09438705444335938, 0.09841346740722656, 0.10243988037109375, 0.10646629333496094, 0.11049270629882812, 0.11451911926269531, 0.1185455322265625, 0.12257194519042969, 0.12659835815429688, 0.13062477111816406, 0.13465118408203125, 0.13867759704589844, 0.14270401000976562, 0.1467304229736328, 0.1507568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 10.0, 15.0, 13.0, 12.0, 22.0, 35.0, 45.0, 48.0, 50.0, 59.0, 71.0, 61.0, 78.0, 75.0, 67.0, 82.0, 39.0, 42.0, 25.0, 29.0, 16.0, 14.0, 12.0, 16.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.8689933717250824e-05, -3.7087127566337585e-05, -3.548432141542435e-05, -3.388151526451111e-05, -3.227870911359787e-05, -3.067590296268463e-05, -2.9073096811771393e-05, -2.7470290660858154e-05, -2.5867484509944916e-05, -2.4264678359031677e-05, -2.266187220811844e-05, -2.10590660572052e-05, -1.945625990629196e-05, -1.7853453755378723e-05, -1.6250647604465485e-05, -1.4647841453552246e-05, -1.3045035302639008e-05, -1.1442229151725769e-05, -9.83942300081253e-06, -8.236616849899292e-06, -6.6338106989860535e-06, -5.031004548072815e-06, -3.4281983971595764e-06, -1.8253922462463379e-06, -2.2258609533309937e-07, 1.3802200555801392e-06, 2.9830262064933777e-06, 4.585832357406616e-06, 6.188638508319855e-06, 7.791444659233093e-06, 9.394250810146332e-06, 1.099705696105957e-05, 1.2599863111972809e-05, 1.4202669262886047e-05, 1.5805475413799286e-05, 1.7408281564712524e-05, 1.9011087715625763e-05, 2.0613893866539e-05, 2.221670001745224e-05, 2.381950616836548e-05, 2.5422312319278717e-05, 2.7025118470191956e-05, 2.8627924621105194e-05, 3.0230730772018433e-05, 3.183353692293167e-05, 3.343634307384491e-05, 3.503914922475815e-05, 3.664195537567139e-05, 3.8244761526584625e-05, 3.9847567677497864e-05, 4.14503738284111e-05, 4.305317997932434e-05, 4.465598613023758e-05, 4.625879228115082e-05, 4.7861598432064056e-05, 4.9464404582977295e-05, 5.1067210733890533e-05, 5.267001688480377e-05, 5.427282303571701e-05, 5.587562918663025e-05, 5.747843533754349e-05, 5.9081241488456726e-05, 6.0684047639369965e-05, 6.22868537902832e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 30.0, 55.0, 59.0, 106.0, 121.0, 190.0, 300.0, 518.0, 943.0, 1970.0, 4132.0, 9323.0, 24855.0, 81671.0, 370543.0, 417370.0, 90700.0, 26846.0, 9908.0, 4311.0, 1945.0, 1055.0, 528.0, 321.0, 212.0, 135.0, 85.0, 63.0, 43.0, 33.0, 22.0, 16.0, 12.0, 18.0, 7.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.071044921875, -0.0686798095703125, -0.066314697265625, -0.0639495849609375, -0.06158447265625, -0.0592193603515625, -0.056854248046875, -0.0544891357421875, -0.0521240234375, -0.0497589111328125, -0.047393798828125, -0.0450286865234375, -0.04266357421875, -0.0402984619140625, -0.037933349609375, -0.0355682373046875, -0.033203125, -0.0308380126953125, -0.028472900390625, -0.0261077880859375, -0.02374267578125, -0.0213775634765625, -0.019012451171875, -0.0166473388671875, -0.0142822265625, -0.0119171142578125, -0.009552001953125, -0.0071868896484375, -0.00482177734375, -0.0024566650390625, -9.1552734375e-05, 0.0022735595703125, 0.004638671875, 0.0070037841796875, 0.009368896484375, 0.0117340087890625, 0.01409912109375, 0.0164642333984375, 0.018829345703125, 0.0211944580078125, 0.0235595703125, 0.0259246826171875, 0.028289794921875, 0.0306549072265625, 0.03302001953125, 0.0353851318359375, 0.037750244140625, 0.0401153564453125, 0.04248046875, 0.0448455810546875, 0.047210693359375, 0.0495758056640625, 0.05194091796875, 0.0543060302734375, 0.056671142578125, 0.0590362548828125, 0.0614013671875, 0.0637664794921875, 0.066131591796875, 0.0684967041015625, 0.07086181640625, 0.0732269287109375, 0.075592041015625, 0.0779571533203125, 0.080322265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 5.0, 7.0, 3.0, 9.0, 10.0, 7.0, 11.0, 23.0, 31.0, 32.0, 33.0, 40.0, 58.0, 87.0, 116.0, 113.0, 82.0, 74.0, 62.0, 35.0, 32.0, 23.0, 20.0, 15.0, 8.0, 11.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05446052551269531, -0.052585601806640625, -0.05071067810058594, -0.04883575439453125, -0.04696083068847656, -0.045085906982421875, -0.04321098327636719, -0.0413360595703125, -0.03946113586425781, -0.037586212158203125, -0.03571128845214844, -0.03383636474609375, -0.03196144104003906, -0.030086517333984375, -0.028211593627929688, -0.026336669921875, -0.024461746215820312, -0.022586822509765625, -0.020711898803710938, -0.01883697509765625, -0.016962051391601562, -0.015087127685546875, -0.013212203979492188, -0.0113372802734375, -0.009462356567382812, -0.007587432861328125, -0.0057125091552734375, -0.00383758544921875, -0.0019626617431640625, -8.7738037109375e-05, 0.0017871856689453125, 0.003662109375, 0.0055370330810546875, 0.007411956787109375, 0.009286880493164062, 0.01116180419921875, 0.013036727905273438, 0.014911651611328125, 0.016786575317382812, 0.0186614990234375, 0.020536422729492188, 0.022411346435546875, 0.024286270141601562, 0.02616119384765625, 0.028036117553710938, 0.029911041259765625, 0.03178596496582031, 0.033660888671875, 0.03553581237792969, 0.037410736083984375, 0.03928565979003906, 0.04116058349609375, 0.04303550720214844, 0.044910430908203125, 0.04678535461425781, 0.0486602783203125, 0.05053520202636719, 0.052410125732421875, 0.05428504943847656, 0.05615997314453125, 0.05803489685058594, 0.059909820556640625, 0.06178474426269531, 0.06365966796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 13.0, 17.0, 32.0, 42.0, 64.0, 101.0, 136.0, 126.0, 137.0, 99.0, 100.0, 54.0, 32.0, 12.0, 13.0, 10.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45304882526397705, -0.4243328273296356, -0.3956168293952942, -0.36690086126327515, -0.3381848633289337, -0.3094688653945923, -0.28075286746025085, -0.2520368695259094, -0.2233208864927292, -0.19460488855838776, -0.16588890552520752, -0.1371729075908661, -0.10845691710710526, -0.07974092662334442, -0.05102492868900299, -0.022308945655822754, 0.006407052278518677, 0.03512304276227951, 0.06383903324604034, 0.09255503118038177, 0.12127102166414261, 0.14998701214790344, 0.17870301008224487, 0.2074189931154251, 0.23613499104976654, 0.2648509740829468, 0.2935669720172882, 0.32228296995162964, 0.35099896788597107, 0.3797149658203125, 0.40843093395233154, 0.437146931886673, 0.4658629298210144, 0.49457892775535583, 0.5232949256896973, 0.5520108938217163, 0.5807269215583801, 0.6094428896903992, 0.638158917427063, 0.666874885559082, 0.6955908536911011, 0.7243068218231201, 0.7530228495597839, 0.781738817691803, 0.8104548454284668, 0.8391708135604858, 0.8678867816925049, 0.8966028094291687, 0.9253188371658325, 0.9540348052978516, 0.9827508330345154, 1.0114668607711792, 1.0401828289031982, 1.0688987970352173, 1.0976147651672363, 1.1263307332992554, 1.1550467014312744, 1.1837626695632935, 1.2124786376953125, 1.241194725036621, 1.2699106931686401, 1.2986266613006592, 1.3273426294326782, 1.3560585975646973, 1.3847746849060059]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 4.0, 4.0, 15.0, 3.0, 14.0, 5.0, 26.0, 17.0, 22.0, 22.0, 32.0, 34.0, 26.0, 43.0, 25.0, 43.0, 41.0, 42.0, 46.0, 42.0, 46.0, 29.0, 43.0, 40.0, 50.0, 35.0, 38.0, 31.0, 24.0, 21.0, 25.0, 20.0, 17.0, 18.0, 6.0, 10.0, 5.0, 7.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.6243494153022766, -0.6065165400505066, -0.5886836647987366, -0.5708507895469666, -0.5530179142951965, -0.5351850390434265, -0.5173521637916565, -0.4995192885398865, -0.48168641328811646, -0.46385353803634644, -0.4460206627845764, -0.4281877875328064, -0.4103549122810364, -0.39252203702926636, -0.37468916177749634, -0.3568562865257263, -0.3390234410762787, -0.32119056582450867, -0.30335769057273865, -0.28552481532096863, -0.2676919400691986, -0.2498590648174286, -0.23202620446681976, -0.21419332921504974, -0.19636045396327972, -0.1785275787115097, -0.16069470345973969, -0.14286184310913086, -0.12502896785736084, -0.10719608515501022, -0.0893632173538208, -0.07153034210205078, -0.05369746685028076, -0.03586459159851074, -0.01803172007203102, -0.00019884854555130005, 0.01763402670621872, 0.03546690195798874, 0.05329976975917816, 0.07113264501094818, 0.0889655202627182, 0.10679839551448822, 0.12463127076625824, 0.14246413111686707, 0.16029700636863708, 0.1781298816204071, 0.19596275687217712, 0.21379563212394714, 0.23162850737571716, 0.24946138262748718, 0.2672942578792572, 0.2851271331310272, 0.30296000838279724, 0.32079288363456726, 0.3386257290840149, 0.3564586043357849, 0.37429147958755493, 0.39212435483932495, 0.40995723009109497, 0.427790105342865, 0.445622980594635, 0.46345585584640503, 0.48128873109817505, 0.49912160634994507, 0.5169544816017151]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 10.0, 5.0, 7.0, 8.0, 9.0, 19.0, 26.0, 36.0, 55.0, 95.0, 121.0, 201.0, 324.0, 453.0, 749.0, 1308.0, 2158.0, 3917.0, 7088.0, 14270.0, 31409.0, 82453.0, 347514.0, 3228096.0, 332643.0, 80347.0, 30450.0, 13848.0, 7079.0, 3866.0, 2226.0, 1307.0, 794.0, 518.0, 305.0, 196.0, 122.0, 81.0, 57.0, 34.0, 26.0, 13.0, 12.0, 14.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07579898834228516, -0.07322883605957031, -0.07065868377685547, -0.06808853149414062, -0.06551837921142578, -0.06294822692871094, -0.060378074645996094, -0.05780792236328125, -0.055237770080566406, -0.05266761779785156, -0.05009746551513672, -0.047527313232421875, -0.04495716094970703, -0.04238700866699219, -0.039816856384277344, -0.0372467041015625, -0.034676551818847656, -0.03210639953613281, -0.02953624725341797, -0.026966094970703125, -0.02439594268798828, -0.021825790405273438, -0.019255638122558594, -0.01668548583984375, -0.014115333557128906, -0.011545181274414062, -0.008975028991699219, -0.006404876708984375, -0.0038347244262695312, -0.0012645721435546875, 0.0013055801391601562, 0.003875732421875, 0.006445884704589844, 0.009016036987304688, 0.011586189270019531, 0.014156341552734375, 0.01672649383544922, 0.019296646118164062, 0.021866798400878906, 0.02443695068359375, 0.027007102966308594, 0.029577255249023438, 0.03214740753173828, 0.034717559814453125, 0.03728771209716797, 0.03985786437988281, 0.042428016662597656, 0.0449981689453125, 0.047568321228027344, 0.05013847351074219, 0.05270862579345703, 0.055278778076171875, 0.05784893035888672, 0.06041908264160156, 0.0629892349243164, 0.06555938720703125, 0.0681295394897461, 0.07069969177246094, 0.07326984405517578, 0.07583999633789062, 0.07841014862060547, 0.08098030090332031, 0.08355045318603516, 0.08612060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 4.0, 14.0, 14.0, 14.0, 19.0, 29.0, 31.0, 23.0, 29.0, 33.0, 39.0, 45.0, 51.0, 55.0, 55.0, 45.0, 46.0, 42.0, 61.0, 47.0, 41.0, 35.0, 32.0, 25.0, 39.0, 16.0, 17.0, 13.0, 17.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0236358642578125, -0.022953510284423828, -0.022271156311035156, -0.021588802337646484, -0.020906448364257812, -0.02022409439086914, -0.01954174041748047, -0.018859386444091797, -0.018177032470703125, -0.017494678497314453, -0.01681232452392578, -0.01612997055053711, -0.015447616577148438, -0.014765262603759766, -0.014082908630371094, -0.013400554656982422, -0.01271820068359375, -0.012035846710205078, -0.011353492736816406, -0.010671138763427734, -0.009988784790039062, -0.00930643081665039, -0.008624076843261719, -0.007941722869873047, -0.007259368896484375, -0.006577014923095703, -0.005894660949707031, -0.005212306976318359, -0.0045299530029296875, -0.0038475990295410156, -0.0031652450561523438, -0.002482891082763672, -0.001800537109375, -0.0011181831359863281, -0.00043582916259765625, 0.0002465248107910156, 0.0009288787841796875, 0.0016112327575683594, 0.0022935867309570312, 0.002975940704345703, 0.003658294677734375, 0.004340648651123047, 0.005023002624511719, 0.005705356597900391, 0.0063877105712890625, 0.007070064544677734, 0.007752418518066406, 0.008434772491455078, 0.00911712646484375, 0.009799480438232422, 0.010481834411621094, 0.011164188385009766, 0.011846542358398438, 0.01252889633178711, 0.013211250305175781, 0.013893604278564453, 0.014575958251953125, 0.015258312225341797, 0.01594066619873047, 0.01662302017211914, 0.017305374145507812, 0.017987728118896484, 0.018670082092285156, 0.019352436065673828, 0.0200347900390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 6.0, 3.0, 13.0, 19.0, 32.0, 32.0, 51.0, 68.0, 122.0, 172.0, 235.0, 375.0, 602.0, 962.0, 1728.0, 3417.0, 7404.0, 19207.0, 58651.0, 264351.0, 3190667.0, 510964.0, 88674.0, 26631.0, 10131.0, 4415.0, 2155.0, 1184.0, 652.0, 426.0, 303.0, 206.0, 126.0, 95.0, 63.0, 40.0, 30.0, 21.0, 19.0, 11.0, 5.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.15625, -0.15174102783203125, -0.1472320556640625, -0.14272308349609375, -0.138214111328125, -0.13370513916015625, -0.1291961669921875, -0.12468719482421875, -0.12017822265625, -0.11566925048828125, -0.1111602783203125, -0.10665130615234375, -0.102142333984375, -0.09763336181640625, -0.0931243896484375, -0.08861541748046875, -0.0841064453125, -0.07959747314453125, -0.0750885009765625, -0.07057952880859375, -0.066070556640625, -0.06156158447265625, -0.0570526123046875, -0.05254364013671875, -0.04803466796875, -0.04352569580078125, -0.0390167236328125, -0.03450775146484375, -0.029998779296875, -0.02548980712890625, -0.0209808349609375, -0.01647186279296875, -0.011962890625, -0.00745391845703125, -0.0029449462890625, 0.00156402587890625, 0.006072998046875, 0.01058197021484375, 0.0150909423828125, 0.01959991455078125, 0.02410888671875, 0.02861785888671875, 0.0331268310546875, 0.03763580322265625, 0.042144775390625, 0.04665374755859375, 0.0511627197265625, 0.05567169189453125, 0.0601806640625, 0.06468963623046875, 0.0691986083984375, 0.07370758056640625, 0.078216552734375, 0.08272552490234375, 0.0872344970703125, 0.09174346923828125, 0.09625244140625, 0.10076141357421875, 0.1052703857421875, 0.10977935791015625, 0.114288330078125, 0.11879730224609375, 0.1233062744140625, 0.12781524658203125, 0.13232421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 11.0, 7.0, 6.0, 20.0, 27.0, 43.0, 48.0, 97.0, 203.0, 442.0, 1797.0, 689.0, 286.0, 135.0, 100.0, 55.0, 43.0, 17.0, 15.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.08368206024169922, -0.08112144470214844, -0.07856082916259766, -0.07600021362304688, -0.0734395980834961, -0.07087898254394531, -0.06831836700439453, -0.06575775146484375, -0.06319713592529297, -0.06063652038574219, -0.058075904846191406, -0.055515289306640625, -0.052954673767089844, -0.05039405822753906, -0.04783344268798828, -0.0452728271484375, -0.04271221160888672, -0.04015159606933594, -0.037590980529785156, -0.035030364990234375, -0.032469749450683594, -0.029909133911132812, -0.02734851837158203, -0.02478790283203125, -0.02222728729248047, -0.019666671752929688, -0.017106056213378906, -0.014545440673828125, -0.011984825134277344, -0.009424209594726562, -0.006863594055175781, -0.004302978515625, -0.0017423629760742188, 0.0008182525634765625, 0.0033788681030273438, 0.005939483642578125, 0.008500099182128906, 0.011060714721679688, 0.013621330261230469, 0.01618194580078125, 0.01874256134033203, 0.021303176879882812, 0.023863792419433594, 0.026424407958984375, 0.028985023498535156, 0.03154563903808594, 0.03410625457763672, 0.0366668701171875, 0.03922748565673828, 0.04178810119628906, 0.044348716735839844, 0.046909332275390625, 0.049469947814941406, 0.05203056335449219, 0.05459117889404297, 0.05715179443359375, 0.05971240997314453, 0.06227302551269531, 0.0648336410522461, 0.06739425659179688, 0.06995487213134766, 0.07251548767089844, 0.07507610321044922, 0.07763671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 31.0, 87.0, 192.0, 267.0, 242.0, 112.0, 48.0, 8.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5530012249946594, -0.5230609178543091, -0.49312061071395874, -0.4631803035736084, -0.43323999643325806, -0.4032996892929077, -0.3733593821525574, -0.34341907501220703, -0.3134787678718567, -0.28353846073150635, -0.253598153591156, -0.22365784645080566, -0.19371753931045532, -0.16377723217010498, -0.13383692502975464, -0.1038966178894043, -0.07395631074905396, -0.04401600360870361, -0.014075696468353271, 0.01586461067199707, 0.04580491781234741, 0.07574522495269775, 0.1056855320930481, 0.13562583923339844, 0.16556614637374878, 0.19550645351409912, 0.22544676065444946, 0.2553870677947998, 0.28532737493515015, 0.3152676820755005, 0.34520798921585083, 0.37514829635620117, 0.4050886631011963, 0.43502897024154663, 0.464969277381897, 0.4949095845222473, 0.5248498916625977, 0.554790198802948, 0.5847305059432983, 0.6146708130836487, 0.644611120223999, 0.6745514273643494, 0.7044917345046997, 0.73443204164505, 0.7643723487854004, 0.7943126559257507, 0.8242529630661011, 0.8541932702064514, 0.8841335773468018, 0.9140738844871521, 0.9440141916275024, 0.9739544987678528, 1.0038948059082031, 1.0338351726531982, 1.0637754201889038, 1.0937156677246094, 1.1236560344696045, 1.1535964012145996, 1.1835366487503052, 1.2134768962860107, 1.2434172630310059, 1.273357629776001, 1.3032978773117065, 1.333238124847412, 1.3631784915924072]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 6.0, 11.0, 10.0, 10.0, 15.0, 28.0, 14.0, 21.0, 37.0, 32.0, 42.0, 38.0, 34.0, 35.0, 36.0, 40.0, 46.0, 47.0, 45.0, 38.0, 38.0, 42.0, 31.0, 35.0, 36.0, 19.0, 31.0, 22.0, 22.0, 19.0, 10.0, 12.0, 12.0, 14.0, 12.0, 8.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20667040348052979, -0.19992177188396454, -0.1931731402873993, -0.18642450869083405, -0.1796758770942688, -0.17292724549770355, -0.1661786139011383, -0.15942999720573425, -0.1526813507080078, -0.14593271911144257, -0.13918408751487732, -0.13243545591831207, -0.12568682432174683, -0.11893819272518158, -0.11218956857919693, -0.10544093698263168, -0.09869231283664703, -0.09194368124008179, -0.08519504964351654, -0.0784464180469513, -0.07169778645038605, -0.0649491548538208, -0.05820053070783615, -0.051451899111270905, -0.04470326751470566, -0.03795463591814041, -0.031206006184220314, -0.024457376450300217, -0.01770874485373497, -0.010960113257169724, -0.004211485385894775, 0.002537146210670471, 0.009285777807235718, 0.016034409403800964, 0.02278303913772106, 0.02953166887164116, 0.036280300468206406, 0.04302893206477165, 0.0497775599360466, 0.05652619153261185, 0.0632748231291771, 0.07002345472574234, 0.07677208632230759, 0.08352071046829224, 0.09026934206485748, 0.09701797366142273, 0.10376660525798798, 0.11051523685455322, 0.11726386845111847, 0.12401250004768372, 0.13076113164424896, 0.1375097632408142, 0.14425839483737946, 0.1510070264339447, 0.15775564312934875, 0.1645042896270752, 0.17125290632247925, 0.1780015379190445, 0.18475016951560974, 0.191498801112175, 0.19824743270874023, 0.20499606430530548, 0.21174469590187073, 0.21849331259727478, 0.22524195909500122]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 11.0, 28.0, 25.0, 46.0, 62.0, 111.0, 175.0, 251.0, 347.0, 602.0, 939.0, 1554.0, 2488.0, 4323.0, 7165.0, 12326.0, 21456.0, 36904.0, 64043.0, 115578.0, 229409.0, 253454.0, 128815.0, 70663.0, 40944.0, 23226.0, 13731.0, 7911.0, 4626.0, 2834.0, 1695.0, 1036.0, 646.0, 408.0, 252.0, 158.0, 96.0, 88.0, 26.0, 25.0, 22.0, 12.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.071533203125, -0.06915569305419922, -0.06677818298339844, -0.06440067291259766, -0.062023162841796875, -0.059645652770996094, -0.05726814270019531, -0.05489063262939453, -0.05251312255859375, -0.05013561248779297, -0.04775810241699219, -0.045380592346191406, -0.043003082275390625, -0.040625572204589844, -0.03824806213378906, -0.03587055206298828, -0.0334930419921875, -0.03111553192138672, -0.028738021850585938, -0.026360511779785156, -0.023983001708984375, -0.021605491638183594, -0.019227981567382812, -0.01685047149658203, -0.01447296142578125, -0.012095451354980469, -0.009717941284179688, -0.007340431213378906, -0.004962921142578125, -0.0025854110717773438, -0.0002079010009765625, 0.0021696090698242188, 0.004547119140625, 0.006924629211425781, 0.009302139282226562, 0.011679649353027344, 0.014057159423828125, 0.016434669494628906, 0.018812179565429688, 0.02118968963623047, 0.02356719970703125, 0.02594470977783203, 0.028322219848632812, 0.030699729919433594, 0.033077239990234375, 0.035454750061035156, 0.03783226013183594, 0.04020977020263672, 0.0425872802734375, 0.04496479034423828, 0.04734230041503906, 0.049719810485839844, 0.052097320556640625, 0.054474830627441406, 0.05685234069824219, 0.05922985076904297, 0.06160736083984375, 0.06398487091064453, 0.06636238098144531, 0.0687398910522461, 0.07111740112304688, 0.07349491119384766, 0.07587242126464844, 0.07824993133544922, 0.08062744140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 5.0, 12.0, 5.0, 13.0, 18.0, 23.0, 15.0, 19.0, 22.0, 18.0, 35.0, 31.0, 36.0, 35.0, 38.0, 43.0, 43.0, 43.0, 42.0, 52.0, 33.0, 53.0, 41.0, 36.0, 30.0, 32.0, 29.0, 22.0, 26.0, 27.0, 18.0, 17.0, 10.0, 9.0, 9.0, 6.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0221099853515625, -0.021448612213134766, -0.02078723907470703, -0.020125865936279297, -0.019464492797851562, -0.018803119659423828, -0.018141746520996094, -0.01748037338256836, -0.016819000244140625, -0.01615762710571289, -0.015496253967285156, -0.014834880828857422, -0.014173507690429688, -0.013512134552001953, -0.012850761413574219, -0.012189388275146484, -0.01152801513671875, -0.010866641998291016, -0.010205268859863281, -0.009543895721435547, -0.008882522583007812, -0.008221149444580078, -0.007559776306152344, -0.006898403167724609, -0.006237030029296875, -0.005575656890869141, -0.004914283752441406, -0.004252910614013672, -0.0035915374755859375, -0.002930164337158203, -0.0022687911987304688, -0.0016074180603027344, -0.000946044921875, -0.0002846717834472656, 0.00037670135498046875, 0.0010380744934082031, 0.0016994476318359375, 0.002360820770263672, 0.0030221939086914062, 0.0036835670471191406, 0.004344940185546875, 0.005006313323974609, 0.005667686462402344, 0.006329059600830078, 0.0069904327392578125, 0.007651805877685547, 0.008313179016113281, 0.008974552154541016, 0.00963592529296875, 0.010297298431396484, 0.010958671569824219, 0.011620044708251953, 0.012281417846679688, 0.012942790985107422, 0.013604164123535156, 0.01426553726196289, 0.014926910400390625, 0.01558828353881836, 0.016249656677246094, 0.016911029815673828, 0.017572402954101562, 0.018233776092529297, 0.01889514923095703, 0.019556522369384766, 0.0202178955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 8.0, 14.0, 21.0, 27.0, 44.0, 55.0, 101.0, 176.0, 308.0, 455.0, 819.0, 1565.0, 3591.0, 10891.0, 44515.0, 255486.0, 601776.0, 97470.0, 20538.0, 5886.0, 2225.0, 1076.0, 535.0, 338.0, 216.0, 132.0, 103.0, 56.0, 44.0, 20.0, 16.0, 13.0, 8.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.21923828125, -0.21264266967773438, -0.20604705810546875, -0.19945144653320312, -0.1928558349609375, -0.18626022338867188, -0.17966461181640625, -0.17306900024414062, -0.166473388671875, -0.15987777709960938, -0.15328216552734375, -0.14668655395507812, -0.1400909423828125, -0.13349533081054688, -0.12689971923828125, -0.12030410766601562, -0.11370849609375, -0.10711288452148438, -0.10051727294921875, -0.09392166137695312, -0.0873260498046875, -0.08073043823242188, -0.07413482666015625, -0.06753921508789062, -0.060943603515625, -0.054347991943359375, -0.04775238037109375, -0.041156768798828125, -0.0345611572265625, -0.027965545654296875, -0.02136993408203125, -0.014774322509765625, -0.0081787109375, -0.001583099365234375, 0.00501251220703125, 0.011608123779296875, 0.0182037353515625, 0.024799346923828125, 0.03139495849609375, 0.037990570068359375, 0.044586181640625, 0.051181793212890625, 0.05777740478515625, 0.06437301635742188, 0.0709686279296875, 0.07756423950195312, 0.08415985107421875, 0.09075546264648438, 0.09735107421875, 0.10394668579101562, 0.11054229736328125, 0.11713790893554688, 0.1237335205078125, 0.13032913208007812, 0.13692474365234375, 0.14352035522460938, 0.150115966796875, 0.15671157836914062, 0.16330718994140625, 0.16990280151367188, 0.1764984130859375, 0.18309402465820312, 0.18968963623046875, 0.19628524780273438, 0.202880859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 13.0, 17.0, 12.0, 15.0, 24.0, 29.0, 26.0, 45.0, 41.0, 41.0, 52.0, 55.0, 54.0, 62.0, 52.0, 60.0, 52.0, 51.0, 49.0, 35.0, 40.0, 24.0, 24.0, 27.0, 13.0, 19.0, 13.0, 16.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1402587890625, -0.13572311401367188, -0.13118743896484375, -0.12665176391601562, -0.1221160888671875, -0.11758041381835938, -0.11304473876953125, -0.10850906372070312, -0.103973388671875, -0.09943771362304688, -0.09490203857421875, -0.09036636352539062, -0.0858306884765625, -0.08129501342773438, -0.07675933837890625, -0.07222366333007812, -0.06768798828125, -0.06315231323242188, -0.05861663818359375, -0.054080963134765625, -0.0495452880859375, -0.045009613037109375, -0.04047393798828125, -0.035938262939453125, -0.031402587890625, -0.026866912841796875, -0.02233123779296875, -0.017795562744140625, -0.0132598876953125, -0.008724212646484375, -0.00418853759765625, 0.000347137451171875, 0.0048828125, 0.009418487548828125, 0.01395416259765625, 0.018489837646484375, 0.0230255126953125, 0.027561187744140625, 0.03209686279296875, 0.036632537841796875, 0.041168212890625, 0.045703887939453125, 0.05023956298828125, 0.054775238037109375, 0.0593109130859375, 0.06384658813476562, 0.06838226318359375, 0.07291793823242188, 0.07745361328125, 0.08198928833007812, 0.08652496337890625, 0.09106063842773438, 0.0955963134765625, 0.10013198852539062, 0.10466766357421875, 0.10920333862304688, 0.113739013671875, 0.11827468872070312, 0.12281036376953125, 0.12734603881835938, 0.1318817138671875, 0.13641738891601562, 0.14095306396484375, 0.14548873901367188, 0.1500244140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 46.0, 46.0, 91.0, 182.0, 400.0, 1393.0, 8778.0, 374379.0, 649929.0, 10607.0, 1606.0, 519.0, 197.0, 93.0, 51.0, 34.0, 31.0, 21.0, 22.0, 16.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4764823913574219, -0.46248626708984375, -0.4484901428222656, -0.4344940185546875, -0.4204978942871094, -0.40650177001953125, -0.3925056457519531, -0.378509521484375, -0.3645133972167969, -0.35051727294921875, -0.3365211486816406, -0.3225250244140625, -0.3085289001464844, -0.29453277587890625, -0.2805366516113281, -0.26654052734375, -0.2525444030761719, -0.23854827880859375, -0.22455215454101562, -0.2105560302734375, -0.19655990600585938, -0.18256378173828125, -0.16856765747070312, -0.154571533203125, -0.14057540893554688, -0.12657928466796875, -0.11258316040039062, -0.0985870361328125, -0.08459091186523438, -0.07059478759765625, -0.056598663330078125, -0.0426025390625, -0.028606414794921875, -0.01461029052734375, -0.000614166259765625, 0.0133819580078125, 0.027378082275390625, 0.04137420654296875, 0.055370330810546875, 0.069366455078125, 0.08336257934570312, 0.09735870361328125, 0.11135482788085938, 0.1253509521484375, 0.13934707641601562, 0.15334320068359375, 0.16733932495117188, 0.18133544921875, 0.19533157348632812, 0.20932769775390625, 0.22332382202148438, 0.2373199462890625, 0.2513160705566406, 0.26531219482421875, 0.2793083190917969, 0.293304443359375, 0.3073005676269531, 0.32129669189453125, 0.3352928161621094, 0.3492889404296875, 0.3632850646972656, 0.37728118896484375, 0.3912773132324219, 0.4052734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 5.0, 18.0, 22.0, 28.0, 44.0, 62.0, 79.0, 100.0, 85.0, 100.0, 65.0, 90.0, 74.0, 56.0, 42.0, 25.0, 30.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.429983139038086e-05, -5.22444024682045e-05, -5.018897354602814e-05, -4.8133544623851776e-05, -4.6078115701675415e-05, -4.4022686779499054e-05, -4.196725785732269e-05, -3.991182893514633e-05, -3.785640001296997e-05, -3.580097109079361e-05, -3.374554216861725e-05, -3.169011324644089e-05, -2.9634684324264526e-05, -2.7579255402088165e-05, -2.5523826479911804e-05, -2.3468397557735443e-05, -2.1412968635559082e-05, -1.935753971338272e-05, -1.730211079120636e-05, -1.5246681869029999e-05, -1.3191252946853638e-05, -1.1135824024677277e-05, -9.080395102500916e-06, -7.0249661803245544e-06, -4.969537258148193e-06, -2.9141083359718323e-06, -8.586794137954712e-07, 1.1967495083808899e-06, 3.252178430557251e-06, 5.307607352733612e-06, 7.363036274909973e-06, 9.418465197086334e-06, 1.1473894119262695e-05, 1.3529323041439056e-05, 1.5584751963615417e-05, 1.764018088579178e-05, 1.969560980796814e-05, 2.17510387301445e-05, 2.3806467652320862e-05, 2.5861896574497223e-05, 2.7917325496673584e-05, 2.9972754418849945e-05, 3.2028183341026306e-05, 3.408361226320267e-05, 3.613904118537903e-05, 3.819447010755539e-05, 4.024989902973175e-05, 4.230532795190811e-05, 4.436075687408447e-05, 4.6416185796260834e-05, 4.8471614718437195e-05, 5.0527043640613556e-05, 5.258247256278992e-05, 5.463790148496628e-05, 5.669333040714264e-05, 5.8748759329319e-05, 6.080418825149536e-05, 6.285961717367172e-05, 6.491504609584808e-05, 6.697047501802444e-05, 6.90259039402008e-05, 7.108133286237717e-05, 7.313676178455353e-05, 7.519219070672989e-05, 7.724761962890625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 18.0, 11.0, 23.0, 33.0, 49.0, 50.0, 86.0, 132.0, 217.0, 460.0, 871.0, 1874.0, 5280.0, 27694.0, 739424.0, 250553.0, 15071.0, 3631.0, 1421.0, 652.0, 339.0, 216.0, 133.0, 84.0, 45.0, 47.0, 28.0, 19.0, 21.0, 13.0, 7.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20402145385742188, -0.19612884521484375, -0.18823623657226562, -0.1803436279296875, -0.17245101928710938, -0.16455841064453125, -0.15666580200195312, -0.148773193359375, -0.14088058471679688, -0.13298797607421875, -0.12509536743164062, -0.1172027587890625, -0.10931015014648438, -0.10141754150390625, -0.09352493286132812, -0.08563232421875, -0.07773971557617188, -0.06984710693359375, -0.061954498291015625, -0.0540618896484375, -0.046169281005859375, -0.03827667236328125, -0.030384063720703125, -0.022491455078125, -0.014598846435546875, -0.00670623779296875, 0.001186370849609375, 0.0090789794921875, 0.016971588134765625, 0.02486419677734375, 0.032756805419921875, 0.0406494140625, 0.048542022705078125, 0.05643463134765625, 0.06432723999023438, 0.0722198486328125, 0.08011245727539062, 0.08800506591796875, 0.09589767456054688, 0.103790283203125, 0.11168289184570312, 0.11957550048828125, 0.12746810913085938, 0.1353607177734375, 0.14325332641601562, 0.15114593505859375, 0.15903854370117188, 0.16693115234375, 0.17482376098632812, 0.18271636962890625, 0.19060897827148438, 0.1985015869140625, 0.20639419555664062, 0.21428680419921875, 0.22217941284179688, 0.230072021484375, 0.23796463012695312, 0.24585723876953125, 0.2537498474121094, 0.2616424560546875, 0.2695350646972656, 0.27742767333984375, 0.2853202819824219, 0.293212890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 9.0, 37.0, 38.0, 84.0, 121.0, 208.0, 205.0, 112.0, 63.0, 30.0, 19.0, 12.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2017822265625, -0.19672775268554688, -0.19167327880859375, -0.18661880493164062, -0.1815643310546875, -0.17650985717773438, -0.17145538330078125, -0.16640090942382812, -0.161346435546875, -0.15629196166992188, -0.15123748779296875, -0.14618301391601562, -0.1411285400390625, -0.13607406616210938, -0.13101959228515625, -0.12596511840820312, -0.12091064453125, -0.11585617065429688, -0.11080169677734375, -0.10574722290039062, -0.1006927490234375, -0.09563827514648438, -0.09058380126953125, -0.08552932739257812, -0.080474853515625, -0.07542037963867188, -0.07036590576171875, -0.06531143188476562, -0.0602569580078125, -0.055202484130859375, -0.05014801025390625, -0.045093536376953125, -0.0400390625, -0.034984588623046875, -0.02993011474609375, -0.024875640869140625, -0.0198211669921875, -0.014766693115234375, -0.00971221923828125, -0.004657745361328125, 0.000396728515625, 0.005451202392578125, 0.01050567626953125, 0.015560150146484375, 0.0206146240234375, 0.025669097900390625, 0.03072357177734375, 0.035778045654296875, 0.04083251953125, 0.045886993408203125, 0.05094146728515625, 0.055995941162109375, 0.0610504150390625, 0.06610488891601562, 0.07115936279296875, 0.07621383666992188, 0.081268310546875, 0.08632278442382812, 0.09137725830078125, 0.09643173217773438, 0.1014862060546875, 0.10654067993164062, 0.11159515380859375, 0.11664962768554688, 0.1217041015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 9.0, 20.0, 26.0, 55.0, 86.0, 144.0, 191.0, 166.0, 151.0, 69.0, 40.0, 22.0, 14.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904351830482483, -1.8404170274734497, -1.776482343673706, -1.7125475406646729, -1.6486128568649292, -1.584678053855896, -1.5207433700561523, -1.4568085670471191, -1.392873764038086, -1.3289389610290527, -1.265004277229309, -1.2010694742202759, -1.1371347904205322, -1.073199987411499, -1.0092651844024658, -0.9453305006027222, -0.8813958168029785, -0.8174610733985901, -0.7535263299942017, -0.6895915269851685, -0.6256568431854248, -0.5617220401763916, -0.4977872967720032, -0.43385255336761475, -0.3699178099632263, -0.3059830665588379, -0.24204830825328827, -0.17811354994773865, -0.11417880654335022, -0.05024406313896179, 0.013690710067749023, 0.07762545347213745, 0.14156031608581543, 0.20549505949020386, 0.2694298028945923, 0.3333645761013031, 0.39729931950569153, 0.46123406291007996, 0.5251688361167908, 0.5891035795211792, 0.6530383229255676, 0.716973066329956, 0.7809078097343445, 0.8448425531387329, 0.9087773561477661, 0.9727120399475098, 1.036646842956543, 1.1005816459655762, 1.1645163297653198, 1.228451132774353, 1.2923858165740967, 1.3563206195831299, 1.4202553033828735, 1.4841901063919067, 1.5481247901916504, 1.6120595932006836, 1.6759943962097168, 1.73992919921875, 1.8038638830184937, 1.8677986860275269, 1.9317333698272705, 1.9956681728363037, 2.059602975845337, 2.123537540435791, 2.187472343444824]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 1.0, 11.0, 8.0, 15.0, 12.0, 14.0, 23.0, 18.0, 26.0, 32.0, 40.0, 43.0, 48.0, 46.0, 55.0, 51.0, 76.0, 58.0, 55.0, 46.0, 37.0, 46.0, 32.0, 34.0, 34.0, 29.0, 18.0, 22.0, 16.0, 17.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.694084107875824, -0.6658458113670349, -0.6376074552536011, -0.609369158744812, -0.581130862236023, -0.5528925061225891, -0.5246542096138, -0.4964158833026886, -0.46817755699157715, -0.4399392306804657, -0.41170090436935425, -0.3834626078605652, -0.35522428154945374, -0.3269859552383423, -0.2987476587295532, -0.2705093324184418, -0.24227100610733032, -0.21403267979621887, -0.18579436838626862, -0.15755605697631836, -0.1293177306652069, -0.10107940435409546, -0.0728410929441452, -0.044602781534194946, -0.016364455223083496, 0.011873863637447357, 0.04011218249797821, 0.06835050135850906, 0.09658882021903992, 0.12482714653015137, 0.15306545794010162, 0.18130376935005188, 0.20954203605651855, 0.23778036236763, 0.26601868867874146, 0.2942569851875305, 0.32249531149864197, 0.3507336378097534, 0.3789719343185425, 0.40721026062965393, 0.4354485869407654, 0.46368691325187683, 0.4919252395629883, 0.5201635360717773, 0.5484018325805664, 0.5766401886940002, 0.6048784852027893, 0.6331168413162231, 0.6613551378250122, 0.6895934343338013, 0.7178317904472351, 0.7460700869560242, 0.774308443069458, 0.8025467395782471, 0.8307850360870361, 0.8590233325958252, 0.887261688709259, 0.9154999852180481, 0.9437383413314819, 0.971976637840271, 1.00021493434906, 1.0284533500671387, 1.0566916465759277, 1.0849299430847168, 1.1131682395935059]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 15.0, 26.0, 42.0, 47.0, 80.0, 114.0, 209.0, 342.0, 544.0, 959.0, 1677.0, 3120.0, 6173.0, 13961.0, 34089.0, 101128.0, 525630.0, 3132314.0, 259427.0, 67353.0, 24888.0, 10825.0, 5152.0, 2608.0, 1434.0, 826.0, 487.0, 285.0, 162.0, 121.0, 68.0, 64.0, 33.0, 19.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11365509033203125, -0.1102447509765625, -0.10683441162109375, -0.103424072265625, -0.10001373291015625, -0.0966033935546875, -0.09319305419921875, -0.08978271484375, -0.08637237548828125, -0.0829620361328125, -0.07955169677734375, -0.076141357421875, -0.07273101806640625, -0.0693206787109375, -0.06591033935546875, -0.0625, -0.05908966064453125, -0.0556793212890625, -0.05226898193359375, -0.048858642578125, -0.04544830322265625, -0.0420379638671875, -0.03862762451171875, -0.03521728515625, -0.03180694580078125, -0.0283966064453125, -0.02498626708984375, -0.021575927734375, -0.01816558837890625, -0.0147552490234375, -0.01134490966796875, -0.0079345703125, -0.00452423095703125, -0.0011138916015625, 0.00229644775390625, 0.005706787109375, 0.00911712646484375, 0.0125274658203125, 0.01593780517578125, 0.01934814453125, 0.02275848388671875, 0.0261688232421875, 0.02957916259765625, 0.032989501953125, 0.03639984130859375, 0.0398101806640625, 0.04322052001953125, 0.046630859375, 0.05004119873046875, 0.0534515380859375, 0.05686187744140625, 0.060272216796875, 0.06368255615234375, 0.0670928955078125, 0.07050323486328125, 0.07391357421875, 0.07732391357421875, 0.0807342529296875, 0.08414459228515625, 0.087554931640625, 0.09096527099609375, 0.0943756103515625, 0.09778594970703125, 0.1011962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 11.0, 13.0, 18.0, 30.0, 29.0, 33.0, 39.0, 44.0, 58.0, 42.0, 71.0, 61.0, 49.0, 56.0, 59.0, 67.0, 53.0, 47.0, 46.0, 41.0, 30.0, 23.0, 14.0, 9.0, 5.0, 11.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.02801823616027832, -0.02699899673461914, -0.02597975730895996, -0.02496051788330078, -0.0239412784576416, -0.022922039031982422, -0.021902799606323242, -0.020883560180664062, -0.019864320755004883, -0.018845081329345703, -0.017825841903686523, -0.016806602478027344, -0.015787363052368164, -0.014768123626708984, -0.013748884201049805, -0.012729644775390625, -0.011710405349731445, -0.010691165924072266, -0.009671926498413086, -0.008652687072753906, -0.0076334476470947266, -0.006614208221435547, -0.005594968795776367, -0.0045757293701171875, -0.003556489944458008, -0.002537250518798828, -0.0015180110931396484, -0.0004987716674804688, 0.0005204677581787109, 0.0015397071838378906, 0.0025589466094970703, 0.00357818603515625, 0.00459742546081543, 0.005616664886474609, 0.006635904312133789, 0.007655143737792969, 0.008674383163452148, 0.009693622589111328, 0.010712862014770508, 0.011732101440429688, 0.012751340866088867, 0.013770580291748047, 0.014789819717407227, 0.015809059143066406, 0.016828298568725586, 0.017847537994384766, 0.018866777420043945, 0.019886016845703125, 0.020905256271362305, 0.021924495697021484, 0.022943735122680664, 0.023962974548339844, 0.024982213973999023, 0.026001453399658203, 0.027020692825317383, 0.028039932250976562, 0.029059171676635742, 0.030078411102294922, 0.0310976505279541, 0.03211688995361328, 0.03313612937927246, 0.03415536880493164, 0.03517460823059082, 0.03619384765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 11.0, 19.0, 19.0, 40.0, 65.0, 55.0, 122.0, 144.0, 253.0, 465.0, 728.0, 1412.0, 3045.0, 7997.0, 25504.0, 107731.0, 893390.0, 2896106.0, 196583.0, 40754.0, 11754.0, 4207.0, 1787.0, 855.0, 463.0, 277.0, 157.0, 97.0, 69.0, 56.0, 29.0, 23.0, 13.0, 4.0, 11.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12170791625976562, -0.11621856689453125, -0.11072921752929688, -0.1052398681640625, -0.09975051879882812, -0.09426116943359375, -0.08877182006835938, -0.083282470703125, -0.07779312133789062, -0.07230377197265625, -0.06681442260742188, -0.0613250732421875, -0.055835723876953125, -0.05034637451171875, -0.044857025146484375, -0.03936767578125, -0.033878326416015625, -0.02838897705078125, -0.022899627685546875, -0.0174102783203125, -0.011920928955078125, -0.00643157958984375, -0.000942230224609375, 0.004547119140625, 0.010036468505859375, 0.01552581787109375, 0.021015167236328125, 0.0265045166015625, 0.031993865966796875, 0.03748321533203125, 0.042972564697265625, 0.0484619140625, 0.053951263427734375, 0.05944061279296875, 0.06492996215820312, 0.0704193115234375, 0.07590866088867188, 0.08139801025390625, 0.08688735961914062, 0.092376708984375, 0.09786605834960938, 0.10335540771484375, 0.10884475708007812, 0.1143341064453125, 0.11982345581054688, 0.12531280517578125, 0.13080215454101562, 0.13629150390625, 0.14178085327148438, 0.14727020263671875, 0.15275955200195312, 0.1582489013671875, 0.16373825073242188, 0.16922760009765625, 0.17471694946289062, 0.180206298828125, 0.18569564819335938, 0.19118499755859375, 0.19667434692382812, 0.2021636962890625, 0.20765304565429688, 0.21314239501953125, 0.21863174438476562, 0.22412109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 27.0, 38.0, 44.0, 80.0, 115.0, 209.0, 446.0, 1300.0, 931.0, 329.0, 211.0, 117.0, 55.0, 44.0, 30.0, 19.0, 20.0, 10.0, 3.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.123565673828125, -0.12054443359375, -0.117523193359375, -0.114501953125, -0.111480712890625, -0.10845947265625, -0.105438232421875, -0.1024169921875, -0.099395751953125, -0.09637451171875, -0.093353271484375, -0.09033203125, -0.087310791015625, -0.08428955078125, -0.081268310546875, -0.0782470703125, -0.075225830078125, -0.07220458984375, -0.069183349609375, -0.066162109375, -0.063140869140625, -0.06011962890625, -0.057098388671875, -0.0540771484375, -0.051055908203125, -0.04803466796875, -0.045013427734375, -0.0419921875, -0.038970947265625, -0.03594970703125, -0.032928466796875, -0.0299072265625, -0.026885986328125, -0.02386474609375, -0.020843505859375, -0.017822265625, -0.014801025390625, -0.01177978515625, -0.008758544921875, -0.0057373046875, -0.002716064453125, 0.00030517578125, 0.003326416015625, 0.00634765625, 0.009368896484375, 0.01239013671875, 0.015411376953125, 0.0184326171875, 0.021453857421875, 0.02447509765625, 0.027496337890625, 0.030517578125, 0.033538818359375, 0.03656005859375, 0.039581298828125, 0.0426025390625, 0.045623779296875, 0.04864501953125, 0.051666259765625, 0.0546875, 0.057708740234375, 0.06072998046875, 0.063751220703125, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 36.0, 88.0, 114.0, 182.0, 180.0, 167.0, 100.0, 74.0, 24.0, 11.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478748679161072, -0.5223398208618164, -0.49680474400520325, -0.4712696671485901, -0.4457346200942993, -0.42019957304000854, -0.3946644961833954, -0.3691294193267822, -0.34359437227249146, -0.3180593252182007, -0.2925242483615875, -0.26698917150497437, -0.2414541244506836, -0.21591906249523163, -0.19038400053977966, -0.1648489385843277, -0.13931387662887573, -0.11377881467342377, -0.0882437527179718, -0.06270869076251984, -0.03717362880706787, -0.011638566851615906, 0.01389649510383606, 0.039431557059288025, 0.06496661901473999, 0.09050168097019196, 0.11603674292564392, 0.1415718048810959, 0.16710686683654785, 0.19264192879199982, 0.21817699074745178, 0.24371205270290375, 0.2692471742630005, 0.29478222131729126, 0.3203172981739044, 0.3458523750305176, 0.37138742208480835, 0.3969224691390991, 0.4224575459957123, 0.44799262285232544, 0.4735276699066162, 0.499062716960907, 0.5245977640151978, 0.5501328706741333, 0.5756679177284241, 0.6012029647827148, 0.6267380714416504, 0.6522731184959412, 0.6778081655502319, 0.7033432126045227, 0.7288782596588135, 0.754413366317749, 0.7799484133720398, 0.8054834604263306, 0.8310185670852661, 0.8565536141395569, 0.8820886611938477, 0.9076237082481384, 0.9331587553024292, 0.9586938619613647, 0.9842289090156555, 1.0097639560699463, 1.0352990627288818, 1.0608340501785278, 1.0863691568374634]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 6.0, 13.0, 16.0, 17.0, 17.0, 25.0, 32.0, 38.0, 30.0, 36.0, 45.0, 53.0, 49.0, 57.0, 43.0, 54.0, 48.0, 60.0, 54.0, 34.0, 44.0, 42.0, 32.0, 28.0, 19.0, 16.0, 23.0, 9.0, 12.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29751962423324585, -0.28751102089881897, -0.2775024473667145, -0.2674938440322876, -0.2574852705001831, -0.24747666716575623, -0.23746807873249054, -0.22745949029922485, -0.21745088696479797, -0.2074422985315323, -0.1974337100982666, -0.18742510676383972, -0.17741651833057404, -0.16740792989730835, -0.15739934146404266, -0.14739075303077698, -0.1373821645975113, -0.1273735761642456, -0.11736498028039932, -0.10735639184713364, -0.09734779596328735, -0.08733920753002167, -0.07733061909675598, -0.0673220232129097, -0.05731343477964401, -0.04730484262108803, -0.03729625046253204, -0.027287662029266357, -0.017279069870710373, -0.007270477712154388, 0.0027381107211112976, 0.01274670660495758, 0.022755295038223267, 0.03276388719677925, 0.042772479355335236, 0.05278106778860092, 0.0627896636724472, 0.07279825210571289, 0.08280684053897858, 0.09281543642282486, 0.10282402485609055, 0.11283261328935623, 0.12284120917320251, 0.1328497976064682, 0.1428583860397339, 0.15286698937416077, 0.16287556290626526, 0.17288416624069214, 0.18289275467395782, 0.1929013431072235, 0.2029099315404892, 0.21291851997375488, 0.22292712330818176, 0.23293571174144745, 0.24294430017471313, 0.25295290350914, 0.2629614770412445, 0.2729700803756714, 0.2829786539077759, 0.29298725724220276, 0.30299583077430725, 0.31300443410873413, 0.3230130076408386, 0.3330216109752655, 0.3430302143096924]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 15.0, 14.0, 16.0, 35.0, 57.0, 77.0, 125.0, 232.0, 392.0, 633.0, 1131.0, 2213.0, 4325.0, 8629.0, 18492.0, 39487.0, 91106.0, 454644.0, 292754.0, 71002.0, 32700.0, 15295.0, 7212.0, 3590.0, 1873.0, 1048.0, 544.0, 325.0, 224.0, 105.0, 98.0, 59.0, 35.0, 19.0, 15.0, 11.0, 5.0, 6.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12711524963378906, -0.12312698364257812, -0.11913871765136719, -0.11515045166015625, -0.11116218566894531, -0.10717391967773438, -0.10318565368652344, -0.0991973876953125, -0.09520912170410156, -0.09122085571289062, -0.08723258972167969, -0.08324432373046875, -0.07925605773925781, -0.07526779174804688, -0.07127952575683594, -0.067291259765625, -0.06330299377441406, -0.059314727783203125, -0.05532646179199219, -0.05133819580078125, -0.04734992980957031, -0.043361663818359375, -0.03937339782714844, -0.0353851318359375, -0.03139686584472656, -0.027408599853515625, -0.023420333862304688, -0.01943206787109375, -0.015443801879882812, -0.011455535888671875, -0.0074672698974609375, -0.00347900390625, 0.0005092620849609375, 0.004497528076171875, 0.008485794067382812, 0.01247406005859375, 0.016462326049804688, 0.020450592041015625, 0.024438858032226562, 0.0284271240234375, 0.03241539001464844, 0.036403656005859375, 0.04039192199707031, 0.04438018798828125, 0.04836845397949219, 0.052356719970703125, 0.05634498596191406, 0.060333251953125, 0.06432151794433594, 0.06830978393554688, 0.07229804992675781, 0.07628631591796875, 0.08027458190917969, 0.08426284790039062, 0.08825111389160156, 0.0922393798828125, 0.09622764587402344, 0.10021591186523438, 0.10420417785644531, 0.10819244384765625, 0.11218070983886719, 0.11616897583007812, 0.12015724182128906, 0.1241455078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 10.0, 15.0, 18.0, 15.0, 30.0, 30.0, 28.0, 27.0, 35.0, 33.0, 46.0, 35.0, 47.0, 34.0, 48.0, 39.0, 44.0, 38.0, 54.0, 40.0, 42.0, 33.0, 31.0, 32.0, 29.0, 24.0, 15.0, 14.0, 15.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02496337890625, -0.024183273315429688, -0.023403167724609375, -0.022623062133789062, -0.02184295654296875, -0.021062850952148438, -0.020282745361328125, -0.019502639770507812, -0.0187225341796875, -0.017942428588867188, -0.017162322998046875, -0.016382217407226562, -0.01560211181640625, -0.014822006225585938, -0.014041900634765625, -0.013261795043945312, -0.012481689453125, -0.011701583862304688, -0.010921478271484375, -0.010141372680664062, -0.00936126708984375, -0.008581161499023438, -0.007801055908203125, -0.0070209503173828125, -0.0062408447265625, -0.0054607391357421875, -0.004680633544921875, -0.0039005279541015625, -0.00312042236328125, -0.0023403167724609375, -0.001560211181640625, -0.0007801055908203125, 0.0, 0.0007801055908203125, 0.001560211181640625, 0.0023403167724609375, 0.00312042236328125, 0.0039005279541015625, 0.004680633544921875, 0.0054607391357421875, 0.0062408447265625, 0.0070209503173828125, 0.007801055908203125, 0.008581161499023438, 0.00936126708984375, 0.010141372680664062, 0.010921478271484375, 0.011701583862304688, 0.012481689453125, 0.013261795043945312, 0.014041900634765625, 0.014822006225585938, 0.01560211181640625, 0.016382217407226562, 0.017162322998046875, 0.017942428588867188, 0.0187225341796875, 0.019502639770507812, 0.020282745361328125, 0.021062850952148438, 0.02184295654296875, 0.022623062133789062, 0.023403167724609375, 0.024183273315429688, 0.02496337890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 13.0, 23.0, 19.0, 31.0, 39.0, 56.0, 58.0, 73.0, 89.0, 146.0, 217.0, 280.0, 367.0, 633.0, 1118.0, 1925.0, 4037.0, 10661.0, 31264.0, 93729.0, 638720.0, 185822.0, 49795.0, 16896.0, 6171.0, 2583.0, 1301.0, 742.0, 431.0, 328.0, 234.0, 170.0, 142.0, 95.0, 74.0, 56.0, 47.0, 36.0, 23.0, 21.0, 21.0, 4.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.156982421875, -0.15218353271484375, -0.1473846435546875, -0.14258575439453125, -0.137786865234375, -0.13298797607421875, -0.1281890869140625, -0.12339019775390625, -0.11859130859375, -0.11379241943359375, -0.1089935302734375, -0.10419464111328125, -0.099395751953125, -0.09459686279296875, -0.0897979736328125, -0.08499908447265625, -0.0802001953125, -0.07540130615234375, -0.0706024169921875, -0.06580352783203125, -0.061004638671875, -0.05620574951171875, -0.0514068603515625, -0.04660797119140625, -0.04180908203125, -0.03701019287109375, -0.0322113037109375, -0.02741241455078125, -0.022613525390625, -0.01781463623046875, -0.0130157470703125, -0.00821685791015625, -0.00341796875, 0.00138092041015625, 0.0061798095703125, 0.01097869873046875, 0.015777587890625, 0.02057647705078125, 0.0253753662109375, 0.03017425537109375, 0.03497314453125, 0.03977203369140625, 0.0445709228515625, 0.04936981201171875, 0.054168701171875, 0.05896759033203125, 0.0637664794921875, 0.06856536865234375, 0.0733642578125, 0.07816314697265625, 0.0829620361328125, 0.08776092529296875, 0.092559814453125, 0.09735870361328125, 0.1021575927734375, 0.10695648193359375, 0.11175537109375, 0.11655426025390625, 0.1213531494140625, 0.12615203857421875, 0.130950927734375, 0.13574981689453125, 0.1405487060546875, 0.14534759521484375, 0.150146484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 19.0, 10.0, 21.0, 28.0, 46.0, 54.0, 55.0, 47.0, 59.0, 58.0, 60.0, 61.0, 52.0, 57.0, 62.0, 58.0, 45.0, 37.0, 28.0, 27.0, 18.0, 15.0, 15.0, 10.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.1627788543701172, -0.15771102905273438, -0.15264320373535156, -0.14757537841796875, -0.14250755310058594, -0.13743972778320312, -0.1323719024658203, -0.1273040771484375, -0.12223625183105469, -0.11716842651367188, -0.11210060119628906, -0.10703277587890625, -0.10196495056152344, -0.09689712524414062, -0.09182929992675781, -0.086761474609375, -0.08169364929199219, -0.07662582397460938, -0.07155799865722656, -0.06649017333984375, -0.06142234802246094, -0.056354522705078125, -0.05128669738769531, -0.0462188720703125, -0.04115104675292969, -0.036083221435546875, -0.031015396118164062, -0.02594757080078125, -0.020879745483398438, -0.015811920166015625, -0.010744094848632812, -0.00567626953125, -0.0006084442138671875, 0.004459381103515625, 0.009527206420898438, 0.01459503173828125, 0.019662857055664062, 0.024730682373046875, 0.029798507690429688, 0.0348663330078125, 0.03993415832519531, 0.045001983642578125, 0.05006980895996094, 0.05513763427734375, 0.06020545959472656, 0.06527328491210938, 0.07034111022949219, 0.075408935546875, 0.08047676086425781, 0.08554458618164062, 0.09061241149902344, 0.09568023681640625, 0.10074806213378906, 0.10581588745117188, 0.11088371276855469, 0.1159515380859375, 0.12101936340332031, 0.12608718872070312, 0.13115501403808594, 0.13622283935546875, 0.14129066467285156, 0.14635848999023438, 0.1514263153076172, 0.156494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 11.0, 10.0, 16.0, 18.0, 26.0, 53.0, 94.0, 189.0, 522.0, 2598.0, 29158.0, 941765.0, 68602.0, 4183.0, 723.0, 261.0, 127.0, 65.0, 49.0, 28.0, 23.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.394134521484375, -0.38275146484375, -0.371368408203125, -0.3599853515625, -0.348602294921875, -0.33721923828125, -0.325836181640625, -0.314453125, -0.303070068359375, -0.29168701171875, -0.280303955078125, -0.2689208984375, -0.257537841796875, -0.24615478515625, -0.234771728515625, -0.223388671875, -0.212005615234375, -0.20062255859375, -0.189239501953125, -0.1778564453125, -0.166473388671875, -0.15509033203125, -0.143707275390625, -0.13232421875, -0.120941162109375, -0.10955810546875, -0.098175048828125, -0.0867919921875, -0.075408935546875, -0.06402587890625, -0.052642822265625, -0.041259765625, -0.029876708984375, -0.01849365234375, -0.007110595703125, 0.0042724609375, 0.015655517578125, 0.02703857421875, 0.038421630859375, 0.0498046875, 0.061187744140625, 0.07257080078125, 0.083953857421875, 0.0953369140625, 0.106719970703125, 0.11810302734375, 0.129486083984375, 0.140869140625, 0.152252197265625, 0.16363525390625, 0.175018310546875, 0.1864013671875, 0.197784423828125, 0.20916748046875, 0.220550537109375, 0.23193359375, 0.243316650390625, 0.25469970703125, 0.266082763671875, 0.2774658203125, 0.288848876953125, 0.30023193359375, 0.311614990234375, 0.322998046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 10.0, 20.0, 31.0, 41.0, 78.0, 129.0, 138.0, 150.0, 142.0, 87.0, 61.0, 31.0, 25.0, 18.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.6224875152111053e-05, -5.3143128752708435e-05, -5.006138235330582e-05, -4.69796359539032e-05, -4.389788955450058e-05, -4.081614315509796e-05, -3.773439675569534e-05, -3.4652650356292725e-05, -3.1570903956890106e-05, -2.8489157557487488e-05, -2.540741115808487e-05, -2.232566475868225e-05, -1.9243918359279633e-05, -1.6162171959877014e-05, -1.3080425560474396e-05, -9.998679161071777e-06, -6.916932761669159e-06, -3.8351863622665405e-06, -7.534399628639221e-07, 2.3283064365386963e-06, 5.410052835941315e-06, 8.491799235343933e-06, 1.1573545634746552e-05, 1.465529203414917e-05, 1.773703843355179e-05, 2.0818784832954407e-05, 2.3900531232357025e-05, 2.6982277631759644e-05, 3.0064024031162262e-05, 3.314577043056488e-05, 3.62275168299675e-05, 3.930926322937012e-05, 4.2391009628772736e-05, 4.5472756028175354e-05, 4.855450242757797e-05, 5.163624882698059e-05, 5.471799522638321e-05, 5.779974162578583e-05, 6.0881488025188446e-05, 6.396323442459106e-05, 6.704498082399368e-05, 7.01267272233963e-05, 7.320847362279892e-05, 7.629022002220154e-05, 7.937196642160416e-05, 8.245371282100677e-05, 8.55354592204094e-05, 8.861720561981201e-05, 9.169895201921463e-05, 9.478069841861725e-05, 9.786244481801987e-05, 0.00010094419121742249, 0.0001040259376168251, 0.00010710768401622772, 0.00011018943041563034, 0.00011327117681503296, 0.00011635292321443558, 0.0001194346696138382, 0.00012251641601324081, 0.00012559816241264343, 0.00012867990881204605, 0.00013176165521144867, 0.0001348434016108513, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 15.0, 20.0, 22.0, 50.0, 62.0, 115.0, 191.0, 328.0, 757.0, 2540.0, 12395.0, 184138.0, 816426.0, 25448.0, 3885.0, 1081.0, 431.0, 238.0, 143.0, 88.0, 58.0, 39.0, 30.0, 10.0, 10.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.23595809936523438, -0.22838592529296875, -0.22081375122070312, -0.2132415771484375, -0.20566940307617188, -0.19809722900390625, -0.19052505493164062, -0.182952880859375, -0.17538070678710938, -0.16780853271484375, -0.16023635864257812, -0.1526641845703125, -0.14509201049804688, -0.13751983642578125, -0.12994766235351562, -0.12237548828125, -0.11480331420898438, -0.10723114013671875, -0.09965896606445312, -0.0920867919921875, -0.08451461791992188, -0.07694244384765625, -0.06937026977539062, -0.061798095703125, -0.054225921630859375, -0.04665374755859375, -0.039081573486328125, -0.0315093994140625, -0.023937225341796875, -0.01636505126953125, -0.008792877197265625, -0.001220703125, 0.006351470947265625, 0.01392364501953125, 0.021495819091796875, 0.0290679931640625, 0.036640167236328125, 0.04421234130859375, 0.051784515380859375, 0.059356689453125, 0.06692886352539062, 0.07450103759765625, 0.08207321166992188, 0.0896453857421875, 0.09721755981445312, 0.10478973388671875, 0.11236190795898438, 0.11993408203125, 0.12750625610351562, 0.13507843017578125, 0.14265060424804688, 0.1502227783203125, 0.15779495239257812, 0.16536712646484375, 0.17293930053710938, 0.180511474609375, 0.18808364868164062, 0.19565582275390625, 0.20322799682617188, 0.2108001708984375, 0.21837234497070312, 0.22594451904296875, 0.23351669311523438, 0.2410888671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 12.0, 12.0, 20.0, 19.0, 25.0, 43.0, 68.0, 163.0, 276.0, 162.0, 60.0, 24.0, 31.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.125762939453125, -0.12200927734375, -0.118255615234375, -0.114501953125, -0.110748291015625, -0.10699462890625, -0.103240966796875, -0.0994873046875, -0.095733642578125, -0.09197998046875, -0.088226318359375, -0.08447265625, -0.080718994140625, -0.07696533203125, -0.073211669921875, -0.0694580078125, -0.065704345703125, -0.06195068359375, -0.058197021484375, -0.054443359375, -0.050689697265625, -0.04693603515625, -0.043182373046875, -0.0394287109375, -0.035675048828125, -0.03192138671875, -0.028167724609375, -0.0244140625, -0.020660400390625, -0.01690673828125, -0.013153076171875, -0.0093994140625, -0.005645751953125, -0.00189208984375, 0.001861572265625, 0.005615234375, 0.009368896484375, 0.01312255859375, 0.016876220703125, 0.0206298828125, 0.024383544921875, 0.02813720703125, 0.031890869140625, 0.03564453125, 0.039398193359375, 0.04315185546875, 0.046905517578125, 0.0506591796875, 0.054412841796875, 0.05816650390625, 0.061920166015625, 0.065673828125, 0.069427490234375, 0.07318115234375, 0.076934814453125, 0.0806884765625, 0.084442138671875, 0.08819580078125, 0.091949462890625, 0.095703125, 0.099456787109375, 0.10321044921875, 0.106964111328125, 0.1107177734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 21.0, 50.0, 123.0, 220.0, 256.0, 199.0, 85.0, 29.0, 13.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1755073070526123, -1.0989019870758057, -1.022296667098999, -0.9456912279129028, -0.8690859079360962, -0.7924805879592896, -0.7158752083778381, -0.6392698287963867, -0.5626645088195801, -0.48605915904045105, -0.409453809261322, -0.332848459482193, -0.25624310970306396, -0.17963775992393494, -0.10303241014480591, -0.026427030563354492, 0.05017828941345215, 0.12678363919258118, 0.2033889889717102, 0.27999433875083923, 0.35659968852996826, 0.4332050383090973, 0.5098103880882263, 0.5864157676696777, 0.6630210876464844, 0.739626407623291, 0.8162317872047424, 0.8928371667861938, 0.9694424867630005, 1.0460478067398071, 1.1226532459259033, 1.19925856590271, 1.2758641242980957, 1.3524694442749023, 1.429074764251709, 1.5056802034378052, 1.5822855234146118, 1.6588908433914185, 1.7354962825775146, 1.8121016025543213, 1.888706922531128, 1.9653122425079346, 2.041917562484741, 2.118522882461548, 2.1951284408569336, 2.2717337608337402, 2.348339080810547, 2.4249444007873535, 2.50154972076416, 2.578155040740967, 2.6547603607177734, 2.73136568069458, 2.8079710006713867, 2.8845765590667725, 2.961181879043579, 3.0377871990203857, 3.1143925189971924, 3.190997838973999, 3.2676031589508057, 3.3442084789276123, 3.420814037322998, 3.4974193572998047, 3.5740246772766113, 3.650629997253418, 3.7272353172302246]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 20.0, 14.0, 16.0, 24.0, 30.0, 23.0, 32.0, 25.0, 36.0, 45.0, 43.0, 44.0, 60.0, 52.0, 55.0, 45.0, 42.0, 56.0, 46.0, 41.0, 24.0, 26.0, 27.0, 20.0, 22.0, 25.0, 9.0, 15.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8387554287910461, -0.8171766996383667, -0.7955979108810425, -0.774019181728363, -0.7524404525756836, -0.7308617234230042, -0.7092829942703247, -0.6877042055130005, -0.666125476360321, -0.6445467472076416, -0.6229679584503174, -0.6013892292976379, -0.5798105001449585, -0.558231770992279, -0.5366530418395996, -0.5150742530822754, -0.49349552392959595, -0.4719167947769165, -0.4503380358219147, -0.42875927686691284, -0.4071805477142334, -0.38560181856155396, -0.3640230596065521, -0.3424443006515503, -0.32086557149887085, -0.2992868423461914, -0.2777080833911896, -0.25612932443618774, -0.2345505952835083, -0.21297185122966766, -0.19139310717582703, -0.1698143631219864, -0.14823567867279053, -0.1266569346189499, -0.10507819056510925, -0.08349944651126862, -0.06192070245742798, -0.04034195840358734, -0.018763214349746704, 0.002815529704093933, 0.02439427375793457, 0.04597301781177521, 0.06755176186561584, 0.08913050591945648, 0.11070924997329712, 0.13228799402713776, 0.1538667380809784, 0.17544548213481903, 0.19702422618865967, 0.2186029702425003, 0.24018171429634094, 0.2617604732513428, 0.2833392024040222, 0.30491793155670166, 0.3264966905117035, 0.3480754494667053, 0.36965417861938477, 0.3912329077720642, 0.41281166672706604, 0.43439042568206787, 0.4559691548347473, 0.47754788398742676, 0.4991266429424286, 0.5207054018974304, 0.5422841310501099]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 26.0, 31.0, 54.0, 100.0, 142.0, 228.0, 389.0, 709.0, 1166.0, 2143.0, 4281.0, 8755.0, 19781.0, 51008.0, 173474.0, 3005724.0, 746496.0, 112258.0, 37534.0, 15310.0, 6829.0, 3472.0, 1798.0, 980.0, 613.0, 348.0, 220.0, 137.0, 74.0, 63.0, 27.0, 21.0, 18.0, 16.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.1324300765991211, -0.1286296844482422, -0.12482929229736328, -0.12102890014648438, -0.11722850799560547, -0.11342811584472656, -0.10962772369384766, -0.10582733154296875, -0.10202693939208984, -0.09822654724121094, -0.09442615509033203, -0.09062576293945312, -0.08682537078857422, -0.08302497863769531, -0.0792245864868164, -0.0754241943359375, -0.0716238021850586, -0.06782341003417969, -0.06402301788330078, -0.060222625732421875, -0.05642223358154297, -0.05262184143066406, -0.048821449279785156, -0.04502105712890625, -0.041220664978027344, -0.03742027282714844, -0.03361988067626953, -0.029819488525390625, -0.02601909637451172, -0.022218704223632812, -0.018418312072753906, -0.014617919921875, -0.010817527770996094, -0.0070171356201171875, -0.0032167434692382812, 0.000583648681640625, 0.004384040832519531, 0.008184432983398438, 0.011984825134277344, 0.01578521728515625, 0.019585609436035156, 0.023386001586914062, 0.02718639373779297, 0.030986785888671875, 0.03478717803955078, 0.03858757019042969, 0.042387962341308594, 0.0461883544921875, 0.049988746643066406, 0.05378913879394531, 0.05758953094482422, 0.061389923095703125, 0.06519031524658203, 0.06899070739746094, 0.07279109954833984, 0.07659149169921875, 0.08039188385009766, 0.08419227600097656, 0.08799266815185547, 0.09179306030273438, 0.09559345245361328, 0.09939384460449219, 0.1031942367553711, 0.10699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 12.0, 8.0, 19.0, 20.0, 25.0, 23.0, 45.0, 40.0, 46.0, 53.0, 42.0, 56.0, 50.0, 63.0, 64.0, 52.0, 57.0, 61.0, 49.0, 42.0, 27.0, 26.0, 24.0, 19.0, 19.0, 11.0, 10.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030792236328125, -0.029666900634765625, -0.02854156494140625, -0.027416229248046875, -0.0262908935546875, -0.025165557861328125, -0.02404022216796875, -0.022914886474609375, -0.02178955078125, -0.020664215087890625, -0.01953887939453125, -0.018413543701171875, -0.0172882080078125, -0.016162872314453125, -0.01503753662109375, -0.013912200927734375, -0.012786865234375, -0.011661529541015625, -0.01053619384765625, -0.009410858154296875, -0.0082855224609375, -0.007160186767578125, -0.00603485107421875, -0.004909515380859375, -0.0037841796875, -0.002658843994140625, -0.00153350830078125, -0.000408172607421875, 0.0007171630859375, 0.001842498779296875, 0.00296783447265625, 0.004093170166015625, 0.005218505859375, 0.006343841552734375, 0.00746917724609375, 0.008594512939453125, 0.0097198486328125, 0.010845184326171875, 0.01197052001953125, 0.013095855712890625, 0.01422119140625, 0.015346527099609375, 0.01647186279296875, 0.017597198486328125, 0.0187225341796875, 0.019847869873046875, 0.02097320556640625, 0.022098541259765625, 0.023223876953125, 0.024349212646484375, 0.02547454833984375, 0.026599884033203125, 0.0277252197265625, 0.028850555419921875, 0.02997589111328125, 0.031101226806640625, 0.0322265625, 0.033351898193359375, 0.03447723388671875, 0.035602569580078125, 0.0367279052734375, 0.037853240966796875, 0.03897857666015625, 0.040103912353515625, 0.041229248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 22.0, 25.0, 27.0, 38.0, 66.0, 87.0, 109.0, 131.0, 222.0, 305.0, 570.0, 992.0, 1992.0, 4874.0, 14218.0, 54503.0, 358490.0, 3460041.0, 235746.0, 41751.0, 11720.0, 4092.0, 1743.0, 927.0, 470.0, 332.0, 195.0, 146.0, 92.0, 78.0, 69.0, 50.0, 25.0, 19.0, 20.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.224853515625, -0.21831893920898438, -0.21178436279296875, -0.20524978637695312, -0.1987152099609375, -0.19218063354492188, -0.18564605712890625, -0.17911148071289062, -0.172576904296875, -0.16604232788085938, -0.15950775146484375, -0.15297317504882812, -0.1464385986328125, -0.13990402221679688, -0.13336944580078125, -0.12683486938476562, -0.12030029296875, -0.11376571655273438, -0.10723114013671875, -0.10069656372070312, -0.0941619873046875, -0.08762741088867188, -0.08109283447265625, -0.07455825805664062, -0.068023681640625, -0.061489105224609375, -0.05495452880859375, -0.048419952392578125, -0.0418853759765625, -0.035350799560546875, -0.02881622314453125, -0.022281646728515625, -0.0157470703125, -0.009212493896484375, -0.00267791748046875, 0.003856658935546875, 0.0103912353515625, 0.016925811767578125, 0.02346038818359375, 0.029994964599609375, 0.036529541015625, 0.043064117431640625, 0.04959869384765625, 0.056133270263671875, 0.0626678466796875, 0.06920242309570312, 0.07573699951171875, 0.08227157592773438, 0.08880615234375, 0.09534072875976562, 0.10187530517578125, 0.10840988159179688, 0.1149444580078125, 0.12147903442382812, 0.12801361083984375, 0.13454818725585938, 0.141082763671875, 0.14761734008789062, 0.15415191650390625, 0.16068649291992188, 0.1672210693359375, 0.17375564575195312, 0.18029022216796875, 0.18682479858398438, 0.193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 21.0, 39.0, 75.0, 134.0, 330.0, 1568.0, 1262.0, 303.0, 141.0, 62.0, 35.0, 21.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11498737335205078, -0.11101722717285156, -0.10704708099365234, -0.10307693481445312, -0.0991067886352539, -0.09513664245605469, -0.09116649627685547, -0.08719635009765625, -0.08322620391845703, -0.07925605773925781, -0.0752859115600586, -0.07131576538085938, -0.06734561920166016, -0.06337547302246094, -0.05940532684326172, -0.0554351806640625, -0.05146503448486328, -0.04749488830566406, -0.043524742126464844, -0.039554595947265625, -0.035584449768066406, -0.03161430358886719, -0.02764415740966797, -0.02367401123046875, -0.01970386505126953, -0.015733718872070312, -0.011763572692871094, -0.007793426513671875, -0.0038232803344726562, 0.0001468658447265625, 0.004117012023925781, 0.008087158203125, 0.012057304382324219, 0.016027450561523438, 0.019997596740722656, 0.023967742919921875, 0.027937889099121094, 0.03190803527832031, 0.03587818145751953, 0.03984832763671875, 0.04381847381591797, 0.04778861999511719, 0.051758766174316406, 0.055728912353515625, 0.059699058532714844, 0.06366920471191406, 0.06763935089111328, 0.0716094970703125, 0.07557964324951172, 0.07954978942871094, 0.08351993560791016, 0.08749008178710938, 0.0914602279663086, 0.09543037414550781, 0.09940052032470703, 0.10337066650390625, 0.10734081268310547, 0.11131095886230469, 0.1152811050415039, 0.11925125122070312, 0.12322139739990234, 0.12719154357910156, 0.13116168975830078, 0.1351318359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 9.0, 24.0, 45.0, 85.0, 124.0, 184.0, 156.0, 133.0, 97.0, 55.0, 42.0, 20.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9729800820350647, -0.9513079524040222, -0.9296358227729797, -0.9079636931419373, -0.8862915635108948, -0.8646194338798523, -0.8429473638534546, -0.8212752342224121, -0.7996031045913696, -0.7779309749603271, -0.7562588453292847, -0.7345867156982422, -0.7129145860671997, -0.6912424564361572, -0.6695703268051147, -0.6478981971740723, -0.6262260675430298, -0.6045539379119873, -0.5828818082809448, -0.5612096786499023, -0.5395375490188599, -0.5178654193878174, -0.4961933195590973, -0.4745211899280548, -0.45284906029701233, -0.43117693066596985, -0.40950480103492737, -0.3878327012062073, -0.3661605715751648, -0.3444884419441223, -0.32281631231307983, -0.30114418268203735, -0.2794719934463501, -0.2577998638153076, -0.23612773418426514, -0.21445561945438385, -0.19278348982334137, -0.1711113601922989, -0.1494392454624176, -0.12776711583137512, -0.10609498620033264, -0.08442285656929016, -0.06275073438882828, -0.041078612208366394, -0.019406482577323914, 0.002265647053718567, 0.023937761783599854, 0.045609891414642334, 0.06728202104568481, 0.0889541506767273, 0.11062627285718918, 0.13229839503765106, 0.15397052466869354, 0.17564265429973602, 0.1973147690296173, 0.2189868986606598, 0.24065902829170227, 0.26233115792274475, 0.28400328755378723, 0.3056753873825073, 0.3273475170135498, 0.3490196466445923, 0.37069177627563477, 0.39236390590667725, 0.4140360355377197]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 7.0, 9.0, 8.0, 16.0, 17.0, 17.0, 18.0, 25.0, 26.0, 28.0, 23.0, 27.0, 27.0, 35.0, 36.0, 44.0, 49.0, 48.0, 34.0, 48.0, 35.0, 33.0, 29.0, 36.0, 41.0, 27.0, 23.0, 32.0, 20.0, 23.0, 23.0, 16.0, 15.0, 17.0, 8.0, 10.0, 10.0, 9.0, 12.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.26798975467681885, -0.26048341393470764, -0.25297704339027405, -0.24547070264816284, -0.23796434700489044, -0.23045799136161804, -0.22295165061950684, -0.21544529497623444, -0.20793893933296204, -0.20043258368968964, -0.19292622804641724, -0.18541988730430603, -0.17791353166103363, -0.17040717601776123, -0.16290083527565002, -0.15539447963237762, -0.14788812398910522, -0.14038176834583282, -0.13287541270256042, -0.12536907196044922, -0.11786271631717682, -0.11035636067390442, -0.10285001248121262, -0.09534366428852081, -0.08783730864524841, -0.08033095300197601, -0.07282460480928421, -0.06531825661659241, -0.05781190097332001, -0.050305549055337906, -0.042799197137355804, -0.0352928452193737, -0.0277864933013916, -0.0202801413834095, -0.012773789465427399, -0.005267437547445297, 0.002238914370536804, 0.009745266288518906, 0.017251618206501007, 0.02475797012448311, 0.03226432204246521, 0.03977067396044731, 0.04727702587842941, 0.054783377796411514, 0.062289729714393616, 0.06979608535766602, 0.07730243355035782, 0.08480878174304962, 0.09231513738632202, 0.09982149302959442, 0.10732784122228622, 0.11483418941497803, 0.12234054505825043, 0.12984690070152283, 0.13735324144363403, 0.14485959708690643, 0.15236595273017883, 0.15987230837345123, 0.16737866401672363, 0.17488500475883484, 0.18239136040210724, 0.18989771604537964, 0.19740405678749084, 0.20491041243076324, 0.21241676807403564]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 8.0, 4.0, 7.0, 10.0, 9.0, 27.0, 22.0, 29.0, 56.0, 72.0, 117.0, 163.0, 342.0, 667.0, 1390.0, 2952.0, 6621.0, 13703.0, 27959.0, 64459.0, 348127.0, 444951.0, 76440.0, 31025.0, 15369.0, 7416.0, 3417.0, 1532.0, 734.0, 371.0, 202.0, 111.0, 63.0, 42.0, 33.0, 33.0, 20.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.119140625, -0.11542606353759766, -0.11171150207519531, -0.10799694061279297, -0.10428237915039062, -0.10056781768798828, -0.09685325622558594, -0.0931386947631836, -0.08942413330078125, -0.0857095718383789, -0.08199501037597656, -0.07828044891357422, -0.07456588745117188, -0.07085132598876953, -0.06713676452636719, -0.06342220306396484, -0.0597076416015625, -0.055993080139160156, -0.05227851867675781, -0.04856395721435547, -0.044849395751953125, -0.04113483428955078, -0.03742027282714844, -0.033705711364746094, -0.02999114990234375, -0.026276588439941406, -0.022562026977539062, -0.01884746551513672, -0.015132904052734375, -0.011418342590332031, -0.0077037811279296875, -0.003989219665527344, -0.000274658203125, 0.0034399032592773438, 0.0071544647216796875, 0.010869026184082031, 0.014583587646484375, 0.01829814910888672, 0.022012710571289062, 0.025727272033691406, 0.02944183349609375, 0.033156394958496094, 0.03687095642089844, 0.04058551788330078, 0.044300079345703125, 0.04801464080810547, 0.05172920227050781, 0.055443763732910156, 0.0591583251953125, 0.06287288665771484, 0.06658744812011719, 0.07030200958251953, 0.07401657104492188, 0.07773113250732422, 0.08144569396972656, 0.0851602554321289, 0.08887481689453125, 0.0925893783569336, 0.09630393981933594, 0.10001850128173828, 0.10373306274414062, 0.10744762420654297, 0.11116218566894531, 0.11487674713134766, 0.11859130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 16.0, 10.0, 15.0, 26.0, 15.0, 21.0, 28.0, 31.0, 24.0, 40.0, 22.0, 43.0, 27.0, 39.0, 43.0, 40.0, 44.0, 47.0, 35.0, 42.0, 33.0, 30.0, 42.0, 29.0, 37.0, 36.0, 18.0, 15.0, 17.0, 15.0, 7.0, 21.0, 6.0, 8.0, 14.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0261993408203125, -0.025350570678710938, -0.024501800537109375, -0.023653030395507812, -0.02280426025390625, -0.021955490112304688, -0.021106719970703125, -0.020257949829101562, -0.0194091796875, -0.018560409545898438, -0.017711639404296875, -0.016862869262695312, -0.01601409912109375, -0.015165328979492188, -0.014316558837890625, -0.013467788696289062, -0.0126190185546875, -0.011770248413085938, -0.010921478271484375, -0.010072708129882812, -0.00922393798828125, -0.008375167846679688, -0.007526397705078125, -0.0066776275634765625, -0.005828857421875, -0.0049800872802734375, -0.004131317138671875, -0.0032825469970703125, -0.00243377685546875, -0.0015850067138671875, -0.000736236572265625, 0.0001125335693359375, 0.0009613037109375, 0.0018100738525390625, 0.002658843994140625, 0.0035076141357421875, 0.00435638427734375, 0.0052051544189453125, 0.006053924560546875, 0.0069026947021484375, 0.00775146484375, 0.008600234985351562, 0.009449005126953125, 0.010297775268554688, 0.01114654541015625, 0.011995315551757812, 0.012844085693359375, 0.013692855834960938, 0.0145416259765625, 0.015390396118164062, 0.016239166259765625, 0.017087936401367188, 0.01793670654296875, 0.018785476684570312, 0.019634246826171875, 0.020483016967773438, 0.021331787109375, 0.022180557250976562, 0.023029327392578125, 0.023878097534179688, 0.02472686767578125, 0.025575637817382812, 0.026424407958984375, 0.027273178100585938, 0.0281219482421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 6.0, 10.0, 13.0, 20.0, 21.0, 36.0, 51.0, 88.0, 162.0, 208.0, 451.0, 941.0, 2422.0, 7056.0, 22383.0, 69406.0, 767240.0, 129440.0, 32029.0, 10460.0, 3450.0, 1285.0, 586.0, 298.0, 163.0, 114.0, 60.0, 40.0, 31.0, 22.0, 9.0, 8.0, 6.0, 12.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.228271484375, -0.2220458984375, -0.2158203125, -0.2095947265625, -0.203369140625, -0.1971435546875, -0.19091796875, -0.1846923828125, -0.178466796875, -0.1722412109375, -0.166015625, -0.1597900390625, -0.153564453125, -0.1473388671875, -0.14111328125, -0.1348876953125, -0.128662109375, -0.1224365234375, -0.1162109375, -0.1099853515625, -0.103759765625, -0.0975341796875, -0.09130859375, -0.0850830078125, -0.078857421875, -0.0726318359375, -0.06640625, -0.0601806640625, -0.053955078125, -0.0477294921875, -0.04150390625, -0.0352783203125, -0.029052734375, -0.0228271484375, -0.0166015625, -0.0103759765625, -0.004150390625, 0.0020751953125, 0.00830078125, 0.0145263671875, 0.020751953125, 0.0269775390625, 0.033203125, 0.0394287109375, 0.045654296875, 0.0518798828125, 0.05810546875, 0.0643310546875, 0.070556640625, 0.0767822265625, 0.0830078125, 0.0892333984375, 0.095458984375, 0.1016845703125, 0.10791015625, 0.1141357421875, 0.120361328125, 0.1265869140625, 0.1328125, 0.1390380859375, 0.145263671875, 0.1514892578125, 0.15771484375, 0.1639404296875, 0.170166015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 6.0, 5.0, 6.0, 17.0, 19.0, 23.0, 28.0, 32.0, 45.0, 53.0, 44.0, 54.0, 61.0, 74.0, 68.0, 71.0, 63.0, 45.0, 48.0, 43.0, 40.0, 28.0, 26.0, 16.0, 14.0, 16.0, 13.0, 6.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.20047950744628906, -0.19478225708007812, -0.1890850067138672, -0.18338775634765625, -0.1776905059814453, -0.17199325561523438, -0.16629600524902344, -0.1605987548828125, -0.15490150451660156, -0.14920425415039062, -0.1435070037841797, -0.13780975341796875, -0.1321125030517578, -0.12641525268554688, -0.12071800231933594, -0.115020751953125, -0.10932350158691406, -0.10362625122070312, -0.09792900085449219, -0.09223175048828125, -0.08653450012207031, -0.08083724975585938, -0.07513999938964844, -0.0694427490234375, -0.06374549865722656, -0.058048248291015625, -0.05235099792480469, -0.04665374755859375, -0.04095649719238281, -0.035259246826171875, -0.029561996459960938, -0.02386474609375, -0.018167495727539062, -0.012470245361328125, -0.0067729949951171875, -0.00107574462890625, 0.0046215057373046875, 0.010318756103515625, 0.016016006469726562, 0.0217132568359375, 0.027410507202148438, 0.033107757568359375, 0.03880500793457031, 0.04450225830078125, 0.05019950866699219, 0.055896759033203125, 0.06159400939941406, 0.067291259765625, 0.07298851013183594, 0.07868576049804688, 0.08438301086425781, 0.09008026123046875, 0.09577751159667969, 0.10147476196289062, 0.10717201232910156, 0.1128692626953125, 0.11856651306152344, 0.12426376342773438, 0.1299610137939453, 0.13565826416015625, 0.1413555145263672, 0.14705276489257812, 0.15275001525878906, 0.158447265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 11.0, 20.0, 23.0, 25.0, 38.0, 47.0, 95.0, 133.0, 203.0, 322.0, 563.0, 922.0, 1628.0, 2963.0, 6025.0, 12620.0, 28002.0, 69142.0, 606507.0, 233118.0, 46447.0, 20245.0, 9336.0, 4541.0, 2352.0, 1279.0, 744.0, 443.0, 265.0, 179.0, 90.0, 51.0, 44.0, 28.0, 31.0, 17.0, 14.0, 7.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0716552734375, -0.0695352554321289, -0.06741523742675781, -0.06529521942138672, -0.06317520141601562, -0.06105518341064453, -0.05893516540527344, -0.056815147399902344, -0.05469512939453125, -0.052575111389160156, -0.05045509338378906, -0.04833507537841797, -0.046215057373046875, -0.04409503936767578, -0.04197502136230469, -0.039855003356933594, -0.0377349853515625, -0.035614967346191406, -0.03349494934082031, -0.03137493133544922, -0.029254913330078125, -0.02713489532470703, -0.025014877319335938, -0.022894859313964844, -0.02077484130859375, -0.018654823303222656, -0.016534805297851562, -0.014414787292480469, -0.012294769287109375, -0.010174751281738281, -0.008054733276367188, -0.005934715270996094, -0.003814697265625, -0.0016946792602539062, 0.0004253387451171875, 0.0025453567504882812, 0.004665374755859375, 0.006785392761230469, 0.008905410766601562, 0.011025428771972656, 0.01314544677734375, 0.015265464782714844, 0.017385482788085938, 0.01950550079345703, 0.021625518798828125, 0.02374553680419922, 0.025865554809570312, 0.027985572814941406, 0.0301055908203125, 0.032225608825683594, 0.03434562683105469, 0.03646564483642578, 0.038585662841796875, 0.04070568084716797, 0.04282569885253906, 0.044945716857910156, 0.04706573486328125, 0.049185752868652344, 0.05130577087402344, 0.05342578887939453, 0.055545806884765625, 0.05766582489013672, 0.05978584289550781, 0.061905860900878906, 0.06402587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 15.0, 14.0, 27.0, 38.0, 44.0, 66.0, 75.0, 93.0, 109.0, 119.0, 107.0, 81.0, 56.0, 29.0, 25.0, 17.0, 19.0, 10.0, 17.0, 1.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.645917892456055e-05, -6.464775651693344e-05, -6.283633410930634e-05, -6.102491170167923e-05, -5.9213489294052124e-05, -5.740206688642502e-05, -5.559064447879791e-05, -5.377922207117081e-05, -5.19677996635437e-05, -5.0156377255916595e-05, -4.834495484828949e-05, -4.6533532440662384e-05, -4.472211003303528e-05, -4.291068762540817e-05, -4.109926521778107e-05, -3.928784281015396e-05, -3.7476420402526855e-05, -3.566499799489975e-05, -3.3853575587272644e-05, -3.204215317964554e-05, -3.0230730772018433e-05, -2.8419308364391327e-05, -2.660788595676422e-05, -2.4796463549137115e-05, -2.298504114151001e-05, -2.1173618733882904e-05, -1.93621963262558e-05, -1.7550773918628693e-05, -1.5739351511001587e-05, -1.3927929103374481e-05, -1.2116506695747375e-05, -1.030508428812027e-05, -8.493661880493164e-06, -6.682239472866058e-06, -4.870817065238953e-06, -3.059394657611847e-06, -1.2479722499847412e-06, 5.634501576423645e-07, 2.3748725652694702e-06, 4.186294972896576e-06, 5.997717380523682e-06, 7.809139788150787e-06, 9.620562195777893e-06, 1.1431984603404999e-05, 1.3243407011032104e-05, 1.505482941865921e-05, 1.6866251826286316e-05, 1.867767423391342e-05, 2.0489096641540527e-05, 2.2300519049167633e-05, 2.411194145679474e-05, 2.5923363864421844e-05, 2.773478627204895e-05, 2.9546208679676056e-05, 3.135763108730316e-05, 3.316905349493027e-05, 3.498047590255737e-05, 3.679189831018448e-05, 3.8603320717811584e-05, 4.041474312543869e-05, 4.2226165533065796e-05, 4.40375879406929e-05, 4.584901034832001e-05, 4.766043275594711e-05, 4.947185516357422e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 9.0, 9.0, 25.0, 42.0, 69.0, 151.0, 259.0, 593.0, 1562.0, 4633.0, 16197.0, 70088.0, 812799.0, 110708.0, 21933.0, 6041.0, 1968.0, 751.0, 342.0, 159.0, 85.0, 44.0, 30.0, 13.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08701324462890625, -0.0833282470703125, -0.07964324951171875, -0.075958251953125, -0.07227325439453125, -0.0685882568359375, -0.06490325927734375, -0.06121826171875, -0.05753326416015625, -0.0538482666015625, -0.05016326904296875, -0.046478271484375, -0.04279327392578125, -0.0391082763671875, -0.03542327880859375, -0.03173828125, -0.02805328369140625, -0.0243682861328125, -0.02068328857421875, -0.016998291015625, -0.01331329345703125, -0.0096282958984375, -0.00594329833984375, -0.00225830078125, 0.00142669677734375, 0.0051116943359375, 0.00879669189453125, 0.012481689453125, 0.01616668701171875, 0.0198516845703125, 0.02353668212890625, 0.0272216796875, 0.03090667724609375, 0.0345916748046875, 0.03827667236328125, 0.041961669921875, 0.04564666748046875, 0.0493316650390625, 0.05301666259765625, 0.05670166015625, 0.06038665771484375, 0.0640716552734375, 0.06775665283203125, 0.071441650390625, 0.07512664794921875, 0.0788116455078125, 0.08249664306640625, 0.086181640625, 0.08986663818359375, 0.0935516357421875, 0.09723663330078125, 0.100921630859375, 0.10460662841796875, 0.1082916259765625, 0.11197662353515625, 0.11566162109375, 0.11934661865234375, 0.1230316162109375, 0.12671661376953125, 0.130401611328125, 0.13408660888671875, 0.1377716064453125, 0.14145660400390625, 0.1451416015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 7.0, 7.0, 6.0, 8.0, 14.0, 26.0, 26.0, 37.0, 96.0, 150.0, 203.0, 146.0, 81.0, 44.0, 25.0, 14.0, 18.0, 11.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055267333984375, -0.0530095100402832, -0.050751686096191406, -0.04849386215209961, -0.04623603820800781, -0.043978214263916016, -0.04172039031982422, -0.03946256637573242, -0.037204742431640625, -0.03494691848754883, -0.03268909454345703, -0.030431270599365234, -0.028173446655273438, -0.02591562271118164, -0.023657798767089844, -0.021399974822998047, -0.01914215087890625, -0.016884326934814453, -0.014626502990722656, -0.01236867904663086, -0.010110855102539062, -0.007853031158447266, -0.005595207214355469, -0.003337383270263672, -0.001079559326171875, 0.0011782646179199219, 0.0034360885620117188, 0.005693912506103516, 0.007951736450195312, 0.01020956039428711, 0.012467384338378906, 0.014725208282470703, 0.0169830322265625, 0.019240856170654297, 0.021498680114746094, 0.02375650405883789, 0.026014328002929688, 0.028272151947021484, 0.03052997589111328, 0.03278779983520508, 0.035045623779296875, 0.03730344772338867, 0.03956127166748047, 0.041819095611572266, 0.04407691955566406, 0.04633474349975586, 0.048592567443847656, 0.05085039138793945, 0.05310821533203125, 0.05536603927612305, 0.057623863220214844, 0.05988168716430664, 0.06213951110839844, 0.06439733505249023, 0.06665515899658203, 0.06891298294067383, 0.07117080688476562, 0.07342863082885742, 0.07568645477294922, 0.07794427871704102, 0.08020210266113281, 0.08245992660522461, 0.0847177505493164, 0.0869755744934082, 0.0892333984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 10.0, 10.0, 28.0, 40.0, 69.0, 95.0, 131.0, 152.0, 149.0, 121.0, 78.0, 47.0, 37.0, 23.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5589745044708252, -1.5216351747512817, -1.4842958450317383, -1.4469563961029053, -1.4096170663833618, -1.3722777366638184, -1.334938406944275, -1.2975990772247314, -1.2602596282958984, -1.222920298576355, -1.1855809688568115, -1.1482415199279785, -1.110902190208435, -1.0735628604888916, -1.0362235307693481, -0.9988842010498047, -0.9615448713302612, -0.9242055416107178, -0.8868661522865295, -0.8495268225669861, -0.8121874332427979, -0.7748481035232544, -0.7375087738037109, -0.7001694440841675, -0.6628300547599792, -0.6254907250404358, -0.5881513357162476, -0.5508120059967041, -0.5134726762771606, -0.4761332869529724, -0.43879395723342896, -0.4014545977115631, -0.3641153573989868, -0.32677599787712097, -0.2894366383552551, -0.25209730863571167, -0.21475794911384583, -0.17741858959197998, -0.14007924497127533, -0.10273990035057068, -0.06540054082870483, -0.028061188757419586, 0.009278163313865662, 0.04661751538515091, 0.08395686745643616, 0.121296226978302, 0.15863557159900665, 0.1959749162197113, 0.23331427574157715, 0.270653635263443, 0.30799299478530884, 0.3453323245048523, 0.38267168402671814, 0.420011043548584, 0.45735037326812744, 0.4946897327899933, 0.5320290923118591, 0.5693684220314026, 0.6067078113555908, 0.6440471410751343, 0.6813864707946777, 0.718725860118866, 0.7560651898384094, 0.7934045791625977, 0.8307439088821411]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 9.0, 8.0, 17.0, 11.0, 20.0, 15.0, 23.0, 30.0, 40.0, 18.0, 38.0, 33.0, 46.0, 47.0, 38.0, 30.0, 46.0, 50.0, 46.0, 50.0, 51.0, 45.0, 42.0, 35.0, 26.0, 22.0, 24.0, 31.0, 17.0, 15.0, 17.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.7214030623435974, -0.7007407546043396, -0.680078387260437, -0.6594160795211792, -0.6387537717819214, -0.6180914044380188, -0.597429096698761, -0.5767667293548584, -0.5561044216156006, -0.5354421138763428, -0.5147797465324402, -0.4941174387931824, -0.4734551012516022, -0.452792763710022, -0.43213045597076416, -0.41146811842918396, -0.39080578088760376, -0.37014344334602356, -0.34948110580444336, -0.32881879806518555, -0.30815646052360535, -0.28749412298202515, -0.26683181524276733, -0.24616947770118713, -0.22550714015960693, -0.20484480261802673, -0.18418247997760773, -0.16352015733718872, -0.14285781979560852, -0.12219548970460892, -0.10153315961360931, -0.08087083697319031, -0.06020849943161011, -0.039546169340610504, -0.0188838392496109, 0.0017784908413887024, 0.022440820932388306, 0.04310315102338791, 0.06376548111438751, 0.08442780375480652, 0.10509014129638672, 0.12575247883796692, 0.14641480147838593, 0.16707712411880493, 0.18773946166038513, 0.20840179920196533, 0.22906412184238434, 0.24972644448280334, 0.27038878202438354, 0.29105111956596375, 0.31171345710754395, 0.33237576484680176, 0.35303810238838196, 0.37370043992996216, 0.39436274766921997, 0.41502508521080017, 0.43568742275238037, 0.45634976029396057, 0.47701209783554077, 0.4976744055747986, 0.5183367729187012, 0.538999080657959, 0.5596613883972168, 0.5803236961364746, 0.6009860634803772]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 10.0, 16.0, 26.0, 34.0, 55.0, 77.0, 144.0, 274.0, 506.0, 865.0, 1728.0, 3601.0, 8113.0, 20184.0, 60820.0, 303292.0, 3490451.0, 221863.0, 51017.0, 17356.0, 7174.0, 3221.0, 1584.0, 820.0, 445.0, 260.0, 141.0, 72.0, 58.0, 31.0, 16.0, 8.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1959228515625, -0.19054412841796875, -0.1851654052734375, -0.17978668212890625, -0.174407958984375, -0.16902923583984375, -0.1636505126953125, -0.15827178955078125, -0.15289306640625, -0.14751434326171875, -0.1421356201171875, -0.13675689697265625, -0.131378173828125, -0.12599945068359375, -0.1206207275390625, -0.11524200439453125, -0.10986328125, -0.10448455810546875, -0.0991058349609375, -0.09372711181640625, -0.088348388671875, -0.08296966552734375, -0.0775909423828125, -0.07221221923828125, -0.06683349609375, -0.06145477294921875, -0.0560760498046875, -0.05069732666015625, -0.045318603515625, -0.03993988037109375, -0.0345611572265625, -0.02918243408203125, -0.0238037109375, -0.01842498779296875, -0.0130462646484375, -0.00766754150390625, -0.002288818359375, 0.00308990478515625, 0.0084686279296875, 0.01384735107421875, 0.01922607421875, 0.02460479736328125, 0.0299835205078125, 0.03536224365234375, 0.040740966796875, 0.04611968994140625, 0.0514984130859375, 0.05687713623046875, 0.062255859375, 0.06763458251953125, 0.0730133056640625, 0.07839202880859375, 0.083770751953125, 0.08914947509765625, 0.0945281982421875, 0.09990692138671875, 0.10528564453125, 0.11066436767578125, 0.1160430908203125, 0.12142181396484375, 0.126800537109375, 0.13217926025390625, 0.1375579833984375, 0.14293670654296875, 0.1483154296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 1.0, 6.0, 3.0, 10.0, 11.0, 11.0, 11.0, 15.0, 26.0, 35.0, 22.0, 29.0, 39.0, 49.0, 50.0, 44.0, 50.0, 60.0, 55.0, 51.0, 68.0, 51.0, 45.0, 36.0, 39.0, 39.0, 18.0, 27.0, 19.0, 28.0, 20.0, 9.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.03185272216796875, -0.0306854248046875, -0.02951812744140625, -0.028350830078125, -0.02718353271484375, -0.0260162353515625, -0.02484893798828125, -0.023681640625, -0.02251434326171875, -0.0213470458984375, -0.02017974853515625, -0.019012451171875, -0.01784515380859375, -0.0166778564453125, -0.01551055908203125, -0.01434326171875, -0.01317596435546875, -0.0120086669921875, -0.01084136962890625, -0.009674072265625, -0.00850677490234375, -0.0073394775390625, -0.00617218017578125, -0.0050048828125, -0.00383758544921875, -0.0026702880859375, -0.00150299072265625, -0.000335693359375, 0.00083160400390625, 0.0019989013671875, 0.00316619873046875, 0.00433349609375, 0.00550079345703125, 0.0066680908203125, 0.00783538818359375, 0.009002685546875, 0.01016998291015625, 0.0113372802734375, 0.01250457763671875, 0.013671875, 0.01483917236328125, 0.0160064697265625, 0.01717376708984375, 0.018341064453125, 0.01950836181640625, 0.0206756591796875, 0.02184295654296875, 0.02301025390625, 0.02417755126953125, 0.0253448486328125, 0.02651214599609375, 0.027679443359375, 0.02884674072265625, 0.0300140380859375, 0.03118133544921875, 0.0323486328125, 0.03351593017578125, 0.0346832275390625, 0.03585052490234375, 0.037017822265625, 0.03818511962890625, 0.0393524169921875, 0.04051971435546875, 0.04168701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 14.0, 19.0, 25.0, 21.0, 41.0, 45.0, 86.0, 128.0, 191.0, 274.0, 452.0, 607.0, 1046.0, 1724.0, 2981.0, 5692.0, 13342.0, 38869.0, 174722.0, 3342947.0, 497887.0, 73593.0, 21231.0, 8518.0, 3925.0, 2166.0, 1324.0, 795.0, 571.0, 345.0, 183.0, 159.0, 119.0, 67.0, 51.0, 38.0, 25.0, 13.0, 8.0, 6.0, 5.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22071266174316406, -0.21303176879882812, -0.2053508758544922, -0.19766998291015625, -0.1899890899658203, -0.18230819702148438, -0.17462730407714844, -0.1669464111328125, -0.15926551818847656, -0.15158462524414062, -0.1439037322998047, -0.13622283935546875, -0.1285419464111328, -0.12086105346679688, -0.11318016052246094, -0.105499267578125, -0.09781837463378906, -0.09013748168945312, -0.08245658874511719, -0.07477569580078125, -0.06709480285644531, -0.059413909912109375, -0.05173301696777344, -0.0440521240234375, -0.03637123107910156, -0.028690338134765625, -0.021009445190429688, -0.01332855224609375, -0.0056476593017578125, 0.002033233642578125, 0.009714126586914062, 0.01739501953125, 0.025075912475585938, 0.032756805419921875, 0.04043769836425781, 0.04811859130859375, 0.05579948425292969, 0.06348037719726562, 0.07116127014160156, 0.0788421630859375, 0.08652305603027344, 0.09420394897460938, 0.10188484191894531, 0.10956573486328125, 0.11724662780761719, 0.12492752075195312, 0.13260841369628906, 0.140289306640625, 0.14797019958496094, 0.15565109252929688, 0.1633319854736328, 0.17101287841796875, 0.1786937713623047, 0.18637466430664062, 0.19405555725097656, 0.2017364501953125, 0.20941734313964844, 0.21709823608398438, 0.2247791290283203, 0.23246002197265625, 0.2401409149169922, 0.24782180786132812, 0.25550270080566406, 0.26318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 5.0, 15.0, 18.0, 21.0, 32.0, 51.0, 101.0, 155.0, 350.0, 2153.0, 596.0, 217.0, 129.0, 71.0, 31.0, 32.0, 18.0, 18.0, 7.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12058067321777344, -0.11677169799804688, -0.11296272277832031, -0.10915374755859375, -0.10534477233886719, -0.10153579711914062, -0.09772682189941406, -0.0939178466796875, -0.09010887145996094, -0.08629989624023438, -0.08249092102050781, -0.07868194580078125, -0.07487297058105469, -0.07106399536132812, -0.06725502014160156, -0.063446044921875, -0.05963706970214844, -0.055828094482421875, -0.05201911926269531, -0.04821014404296875, -0.04440116882324219, -0.040592193603515625, -0.03678321838378906, -0.0329742431640625, -0.029165267944335938, -0.025356292724609375, -0.021547317504882812, -0.01773834228515625, -0.013929367065429688, -0.010120391845703125, -0.0063114166259765625, -0.00250244140625, 0.0013065338134765625, 0.005115509033203125, 0.008924484252929688, 0.01273345947265625, 0.016542434692382812, 0.020351409912109375, 0.024160385131835938, 0.0279693603515625, 0.03177833557128906, 0.035587310791015625, 0.03939628601074219, 0.04320526123046875, 0.04701423645019531, 0.050823211669921875, 0.05463218688964844, 0.058441162109375, 0.06225013732910156, 0.06605911254882812, 0.06986808776855469, 0.07367706298828125, 0.07748603820800781, 0.08129501342773438, 0.08510398864746094, 0.0889129638671875, 0.09272193908691406, 0.09653091430664062, 0.10033988952636719, 0.10414886474609375, 0.10795783996582031, 0.11176681518554688, 0.11557579040527344, 0.119384765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 8.0, 31.0, 69.0, 116.0, 208.0, 217.0, 148.0, 105.0, 44.0, 23.0, 20.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5500032901763916, -0.5155172944068909, -0.48103129863739014, -0.4465453028678894, -0.41205930709838867, -0.37757331132888794, -0.3430872857570648, -0.3086012899875641, -0.27411529421806335, -0.23962929844856262, -0.2051433026790619, -0.17065729200839996, -0.13617129623889923, -0.1016853004693985, -0.06719928979873657, -0.03271329402923584, 0.0017727017402648926, 0.03625870123505592, 0.07074470072984695, 0.10523070394992828, 0.13971669971942902, 0.17420269548892975, 0.20868870615959167, 0.2431747019290924, 0.27766069769859314, 0.31214669346809387, 0.3466326892375946, 0.3811187148094177, 0.41560471057891846, 0.4500907063484192, 0.4845767021179199, 0.5190626978874207, 0.5535486936569214, 0.5880346894264221, 0.6225206851959229, 0.6570066809654236, 0.6914926767349243, 0.725978672504425, 0.7604646682739258, 0.7949507236480713, 0.8294366598129272, 0.863922655582428, 0.8984086513519287, 0.9328946471214294, 0.9673806428909302, 1.0018666982650757, 1.0363526344299316, 1.0708386898040771, 1.1053247451782227, 1.1398108005523682, 1.1742967367172241, 1.2087827920913696, 1.2432687282562256, 1.277754783630371, 1.312240719795227, 1.3467267751693726, 1.3812127113342285, 1.415698766708374, 1.45018470287323, 1.4846707582473755, 1.5191566944122314, 1.553642749786377, 1.588128685951233, 1.6226147413253784, 1.6571006774902344]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 7.0, 20.0, 9.0, 14.0, 12.0, 22.0, 23.0, 31.0, 22.0, 24.0, 24.0, 22.0, 35.0, 22.0, 31.0, 35.0, 45.0, 51.0, 31.0, 41.0, 41.0, 45.0, 34.0, 31.0, 34.0, 27.0, 30.0, 31.0, 26.0, 27.0, 25.0, 20.0, 13.0, 16.0, 9.0, 4.0, 14.0, 5.0, 9.0, 7.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3495801091194153, -0.33873802423477173, -0.32789596915245056, -0.317053884267807, -0.30621182918548584, -0.2953697443008423, -0.28452765941619873, -0.2736855745315552, -0.262843519449234, -0.25200143456459045, -0.2411593794822693, -0.23031729459762573, -0.21947522461414337, -0.208633154630661, -0.19779106974601746, -0.1869489997625351, -0.17610692977905273, -0.16526485979557037, -0.154422789812088, -0.14358070492744446, -0.1327386349439621, -0.12189656496047974, -0.11105448752641678, -0.10021241009235382, -0.08937034010887146, -0.0785282701253891, -0.06768619269132614, -0.05684411898255348, -0.04600204527378082, -0.03515997156500816, -0.024317897856235504, -0.013475820422172546, -0.0026337504386901855, 0.008208323270082474, 0.019050396978855133, 0.029892470687627792, 0.04073454439640045, 0.05157661810517311, 0.06241869181394577, 0.07326076924800873, 0.08410283923149109, 0.09494490921497345, 0.10578698664903641, 0.11662906408309937, 0.12747113406658173, 0.1383132040500641, 0.14915528893470764, 0.15999735891819, 0.17083942890167236, 0.18168149888515472, 0.19252356886863708, 0.20336565375328064, 0.214207723736763, 0.22504979372024536, 0.23589187860488892, 0.24673394858837128, 0.25757601857185364, 0.2684181034564972, 0.27926015853881836, 0.2901022434234619, 0.30094432830810547, 0.31178638339042664, 0.3226284682750702, 0.33347052335739136, 0.3443126082420349]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 15.0, 31.0, 30.0, 41.0, 67.0, 97.0, 145.0, 191.0, 292.0, 469.0, 844.0, 1386.0, 2461.0, 4637.0, 8755.0, 16611.0, 30758.0, 56811.0, 104118.0, 219823.0, 296327.0, 141606.0, 74227.0, 41057.0, 22163.0, 11559.0, 6230.0, 3302.0, 1799.0, 953.0, 617.0, 364.0, 215.0, 172.0, 103.0, 71.0, 57.0, 33.0, 31.0, 25.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.109588623046875, -0.1060791015625, -0.102569580078125, -0.09906005859375, -0.095550537109375, -0.092041015625, -0.088531494140625, -0.08502197265625, -0.081512451171875, -0.0780029296875, -0.074493408203125, -0.07098388671875, -0.067474365234375, -0.06396484375, -0.060455322265625, -0.05694580078125, -0.053436279296875, -0.0499267578125, -0.046417236328125, -0.04290771484375, -0.039398193359375, -0.035888671875, -0.032379150390625, -0.02886962890625, -0.025360107421875, -0.0218505859375, -0.018341064453125, -0.01483154296875, -0.011322021484375, -0.0078125, -0.004302978515625, -0.00079345703125, 0.002716064453125, 0.0062255859375, 0.009735107421875, 0.01324462890625, 0.016754150390625, 0.020263671875, 0.023773193359375, 0.02728271484375, 0.030792236328125, 0.0343017578125, 0.037811279296875, 0.04132080078125, 0.044830322265625, 0.04833984375, 0.051849365234375, 0.05535888671875, 0.058868408203125, 0.0623779296875, 0.065887451171875, 0.06939697265625, 0.072906494140625, 0.076416015625, 0.079925537109375, 0.08343505859375, 0.086944580078125, 0.0904541015625, 0.093963623046875, 0.09747314453125, 0.100982666015625, 0.1044921875, 0.108001708984375, 0.11151123046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 11.0, 6.0, 12.0, 12.0, 8.0, 18.0, 22.0, 17.0, 23.0, 26.0, 33.0, 29.0, 27.0, 23.0, 26.0, 45.0, 55.0, 50.0, 40.0, 33.0, 39.0, 52.0, 47.0, 37.0, 30.0, 46.0, 36.0, 30.0, 15.0, 28.0, 23.0, 16.0, 13.0, 12.0, 14.0, 9.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03515625, -0.0339818000793457, -0.032807350158691406, -0.03163290023803711, -0.030458450317382812, -0.029284000396728516, -0.02810955047607422, -0.026935100555419922, -0.025760650634765625, -0.024586200714111328, -0.02341175079345703, -0.022237300872802734, -0.021062850952148438, -0.01988840103149414, -0.018713951110839844, -0.017539501190185547, -0.01636505126953125, -0.015190601348876953, -0.014016151428222656, -0.01284170150756836, -0.011667251586914062, -0.010492801666259766, -0.009318351745605469, -0.008143901824951172, -0.006969451904296875, -0.005795001983642578, -0.004620552062988281, -0.0034461021423339844, -0.0022716522216796875, -0.0010972023010253906, 7.724761962890625e-05, 0.0012516975402832031, 0.0024261474609375, 0.003600597381591797, 0.004775047302246094, 0.005949497222900391, 0.0071239471435546875, 0.008298397064208984, 0.009472846984863281, 0.010647296905517578, 0.011821746826171875, 0.012996196746826172, 0.014170646667480469, 0.015345096588134766, 0.016519546508789062, 0.01769399642944336, 0.018868446350097656, 0.020042896270751953, 0.02121734619140625, 0.022391796112060547, 0.023566246032714844, 0.02474069595336914, 0.025915145874023438, 0.027089595794677734, 0.02826404571533203, 0.029438495635986328, 0.030612945556640625, 0.03178739547729492, 0.03296184539794922, 0.034136295318603516, 0.03531074523925781, 0.03648519515991211, 0.037659645080566406, 0.0388340950012207, 0.040008544921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 6.0, 13.0, 13.0, 15.0, 17.0, 24.0, 29.0, 52.0, 54.0, 79.0, 114.0, 155.0, 201.0, 280.0, 385.0, 563.0, 947.0, 1887.0, 4643.0, 13557.0, 44187.0, 145017.0, 562026.0, 188848.0, 56891.0, 17170.0, 5752.0, 2321.0, 1138.0, 613.0, 376.0, 311.0, 190.0, 153.0, 131.0, 104.0, 68.0, 55.0, 38.0, 29.0, 26.0, 19.0, 6.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.22412109375, -0.21724700927734375, -0.2103729248046875, -0.20349884033203125, -0.196624755859375, -0.18975067138671875, -0.1828765869140625, -0.17600250244140625, -0.16912841796875, -0.16225433349609375, -0.1553802490234375, -0.14850616455078125, -0.141632080078125, -0.13475799560546875, -0.1278839111328125, -0.12100982666015625, -0.1141357421875, -0.10726165771484375, -0.1003875732421875, -0.09351348876953125, -0.086639404296875, -0.07976531982421875, -0.0728912353515625, -0.06601715087890625, -0.05914306640625, -0.05226898193359375, -0.0453948974609375, -0.03852081298828125, -0.031646728515625, -0.02477264404296875, -0.0178985595703125, -0.01102447509765625, -0.004150390625, 0.00272369384765625, 0.0095977783203125, 0.01647186279296875, 0.023345947265625, 0.03022003173828125, 0.0370941162109375, 0.04396820068359375, 0.05084228515625, 0.05771636962890625, 0.0645904541015625, 0.07146453857421875, 0.078338623046875, 0.08521270751953125, 0.0920867919921875, 0.09896087646484375, 0.1058349609375, 0.11270904541015625, 0.1195831298828125, 0.12645721435546875, 0.133331298828125, 0.14020538330078125, 0.1470794677734375, 0.15395355224609375, 0.16082763671875, 0.16770172119140625, 0.1745758056640625, 0.18144989013671875, 0.188323974609375, 0.19519805908203125, 0.2020721435546875, 0.20894622802734375, 0.2158203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 3.0, 7.0, 7.0, 7.0, 15.0, 12.0, 19.0, 17.0, 17.0, 22.0, 37.0, 33.0, 35.0, 44.0, 35.0, 47.0, 57.0, 51.0, 54.0, 39.0, 57.0, 51.0, 39.0, 40.0, 21.0, 22.0, 32.0, 23.0, 25.0, 26.0, 18.0, 9.0, 11.0, 15.0, 5.0, 12.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.2347412109375, -0.22794151306152344, -0.22114181518554688, -0.2143421173095703, -0.20754241943359375, -0.2007427215576172, -0.19394302368164062, -0.18714332580566406, -0.1803436279296875, -0.17354393005371094, -0.16674423217773438, -0.1599445343017578, -0.15314483642578125, -0.1463451385498047, -0.13954544067382812, -0.13274574279785156, -0.125946044921875, -0.11914634704589844, -0.11234664916992188, -0.10554695129394531, -0.09874725341796875, -0.09194755554199219, -0.08514785766601562, -0.07834815979003906, -0.0715484619140625, -0.06474876403808594, -0.057949066162109375, -0.05114936828613281, -0.04434967041015625, -0.03754997253417969, -0.030750274658203125, -0.023950576782226562, -0.01715087890625, -0.010351181030273438, -0.003551483154296875, 0.0032482147216796875, 0.01004791259765625, 0.016847610473632812, 0.023647308349609375, 0.030447006225585938, 0.0372467041015625, 0.04404640197753906, 0.050846099853515625, 0.05764579772949219, 0.06444549560546875, 0.07124519348144531, 0.07804489135742188, 0.08484458923339844, 0.091644287109375, 0.09844398498535156, 0.10524368286132812, 0.11204338073730469, 0.11884307861328125, 0.1256427764892578, 0.13244247436523438, 0.13924217224121094, 0.1460418701171875, 0.15284156799316406, 0.15964126586914062, 0.1664409637451172, 0.17324066162109375, 0.1800403594970703, 0.18684005737304688, 0.19363975524902344, 0.200439453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 9.0, 7.0, 10.0, 24.0, 29.0, 48.0, 65.0, 127.0, 272.0, 600.0, 1663.0, 7778.0, 111757.0, 869151.0, 49852.0, 4997.0, 1217.0, 423.0, 192.0, 106.0, 69.0, 32.0, 36.0, 30.0, 19.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.426513671875, -0.4159507751464844, -0.40538787841796875, -0.3948249816894531, -0.3842620849609375, -0.3736991882324219, -0.36313629150390625, -0.3525733947753906, -0.342010498046875, -0.3314476013183594, -0.32088470458984375, -0.3103218078613281, -0.2997589111328125, -0.2891960144042969, -0.27863311767578125, -0.2680702209472656, -0.25750732421875, -0.24694442749023438, -0.23638153076171875, -0.22581863403320312, -0.2152557373046875, -0.20469284057617188, -0.19412994384765625, -0.18356704711914062, -0.173004150390625, -0.16244125366210938, -0.15187835693359375, -0.14131546020507812, -0.1307525634765625, -0.12018966674804688, -0.10962677001953125, -0.09906387329101562, -0.0885009765625, -0.07793807983398438, -0.06737518310546875, -0.056812286376953125, -0.0462493896484375, -0.035686492919921875, -0.02512359619140625, -0.014560699462890625, -0.003997802734375, 0.006565093994140625, 0.01712799072265625, 0.027690887451171875, 0.0382537841796875, 0.048816680908203125, 0.05937957763671875, 0.06994247436523438, 0.08050537109375, 0.09106826782226562, 0.10163116455078125, 0.11219406127929688, 0.1227569580078125, 0.13331985473632812, 0.14388275146484375, 0.15444564819335938, 0.165008544921875, 0.17557144165039062, 0.18613433837890625, 0.19669723510742188, 0.2072601318359375, 0.21782302856445312, 0.22838592529296875, 0.23894882202148438, 0.24951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 8.0, 10.0, 19.0, 18.0, 31.0, 50.0, 60.0, 88.0, 102.0, 114.0, 126.0, 99.0, 68.0, 61.0, 39.0, 34.0, 12.0, 18.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.772445678710938e-05, -7.520057260990143e-05, -7.267668843269348e-05, -7.015280425548553e-05, -6.762892007827759e-05, -6.510503590106964e-05, -6.25811517238617e-05, -6.005726754665375e-05, -5.75333833694458e-05, -5.5009499192237854e-05, -5.248561501502991e-05, -4.996173083782196e-05, -4.7437846660614014e-05, -4.491396248340607e-05, -4.239007830619812e-05, -3.986619412899017e-05, -3.7342309951782227e-05, -3.481842577457428e-05, -3.229454159736633e-05, -2.9770657420158386e-05, -2.724677324295044e-05, -2.4722889065742493e-05, -2.2199004888534546e-05, -1.96751207113266e-05, -1.7151236534118652e-05, -1.4627352356910706e-05, -1.2103468179702759e-05, -9.579584002494812e-06, -7.055699825286865e-06, -4.5318156480789185e-06, -2.0079314708709717e-06, 5.159527063369751e-07, 3.039836883544922e-06, 5.563721060752869e-06, 8.087605237960815e-06, 1.0611489415168762e-05, 1.3135373592376709e-05, 1.5659257769584656e-05, 1.8183141946792603e-05, 2.070702612400055e-05, 2.3230910301208496e-05, 2.5754794478416443e-05, 2.827867865562439e-05, 3.0802562832832336e-05, 3.332644701004028e-05, 3.585033118724823e-05, 3.837421536445618e-05, 4.0898099541664124e-05, 4.342198371887207e-05, 4.594586789608002e-05, 4.8469752073287964e-05, 5.099363625049591e-05, 5.351752042770386e-05, 5.6041404604911804e-05, 5.856528878211975e-05, 6.10891729593277e-05, 6.361305713653564e-05, 6.613694131374359e-05, 6.866082549095154e-05, 7.118470966815948e-05, 7.370859384536743e-05, 7.623247802257538e-05, 7.875636219978333e-05, 8.128024637699127e-05, 8.380413055419922e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 17.0, 16.0, 19.0, 22.0, 52.0, 88.0, 121.0, 216.0, 311.0, 580.0, 1134.0, 2575.0, 6361.0, 27516.0, 310319.0, 633411.0, 50336.0, 9045.0, 3175.0, 1482.0, 749.0, 388.0, 240.0, 116.0, 82.0, 57.0, 36.0, 23.0, 11.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.2254962921142578, -0.21869277954101562, -0.21188926696777344, -0.20508575439453125, -0.19828224182128906, -0.19147872924804688, -0.1846752166748047, -0.1778717041015625, -0.1710681915283203, -0.16426467895507812, -0.15746116638183594, -0.15065765380859375, -0.14385414123535156, -0.13705062866210938, -0.1302471160888672, -0.123443603515625, -0.11664009094238281, -0.10983657836914062, -0.10303306579589844, -0.09622955322265625, -0.08942604064941406, -0.08262252807617188, -0.07581901550292969, -0.0690155029296875, -0.06221199035644531, -0.055408477783203125, -0.04860496520996094, -0.04180145263671875, -0.03499794006347656, -0.028194427490234375, -0.021390914916992188, -0.01458740234375, -0.0077838897705078125, -0.000980377197265625, 0.0058231353759765625, 0.01262664794921875, 0.019430160522460938, 0.026233673095703125, 0.03303718566894531, 0.0398406982421875, 0.04664421081542969, 0.053447723388671875, 0.06025123596191406, 0.06705474853515625, 0.07385826110839844, 0.08066177368164062, 0.08746528625488281, 0.094268798828125, 0.10107231140136719, 0.10787582397460938, 0.11467933654785156, 0.12148284912109375, 0.12828636169433594, 0.13508987426757812, 0.1418933868408203, 0.1486968994140625, 0.1555004119873047, 0.16230392456054688, 0.16910743713378906, 0.17591094970703125, 0.18271446228027344, 0.18951797485351562, 0.1963214874267578, 0.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 8.0, 5.0, 4.0, 3.0, 12.0, 15.0, 34.0, 24.0, 43.0, 72.0, 73.0, 135.0, 175.0, 112.0, 83.0, 64.0, 47.0, 30.0, 19.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.17006874084472656, -0.16496658325195312, -0.1598644256591797, -0.15476226806640625, -0.1496601104736328, -0.14455795288085938, -0.13945579528808594, -0.1343536376953125, -0.12925148010253906, -0.12414932250976562, -0.11904716491699219, -0.11394500732421875, -0.10884284973144531, -0.10374069213867188, -0.09863853454589844, -0.093536376953125, -0.08843421936035156, -0.08333206176757812, -0.07822990417480469, -0.07312774658203125, -0.06802558898925781, -0.06292343139648438, -0.05782127380371094, -0.0527191162109375, -0.04761695861816406, -0.042514801025390625, -0.03741264343261719, -0.03231048583984375, -0.027208328247070312, -0.022106170654296875, -0.017004013061523438, -0.01190185546875, -0.0067996978759765625, -0.001697540283203125, 0.0034046173095703125, 0.00850677490234375, 0.013608932495117188, 0.018711090087890625, 0.023813247680664062, 0.0289154052734375, 0.03401756286621094, 0.039119720458984375, 0.04422187805175781, 0.04932403564453125, 0.05442619323730469, 0.059528350830078125, 0.06463050842285156, 0.069732666015625, 0.07483482360839844, 0.07993698120117188, 0.08503913879394531, 0.09014129638671875, 0.09524345397949219, 0.10034561157226562, 0.10544776916503906, 0.1105499267578125, 0.11565208435058594, 0.12075424194335938, 0.1258563995361328, 0.13095855712890625, 0.1360607147216797, 0.14116287231445312, 0.14626502990722656, 0.1513671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 14.0, 38.0, 54.0, 77.0, 115.0, 150.0, 159.0, 131.0, 91.0, 68.0, 43.0, 22.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583528995513916, -1.5179442167282104, -1.4523593187332153, -1.3867745399475098, -1.3211896419525146, -1.255604863166809, -1.1900200843811035, -1.1244351863861084, -1.0588504076004028, -0.9932655692100525, -0.9276807308197021, -0.8620959520339966, -0.7965111136436462, -0.7309262752532959, -0.6653414964675903, -0.59975665807724, -0.5341718196868896, -0.4685869812965393, -0.40300217270851135, -0.3374173641204834, -0.27183252573013306, -0.20624768733978271, -0.14066287875175476, -0.0750780701637268, -0.009493231773376465, 0.05609159171581268, 0.12167641520500183, 0.18726123869419098, 0.2528460621833801, 0.31843090057373047, 0.3840157091617584, 0.4496005177497864, 0.5151851177215576, 0.580769956111908, 0.6463547945022583, 0.7119395732879639, 0.7775244116783142, 0.8431092500686646, 0.9086940288543701, 0.9742788672447205, 1.0398637056350708, 1.1054484844207764, 1.1710333824157715, 1.236618161201477, 1.3022029399871826, 1.3677878379821777, 1.4333726167678833, 1.4989573955535889, 1.564542293548584, 1.6301270723342896, 1.6957119703292847, 1.7612967491149902, 1.8268816471099854, 1.892466425895691, 1.9580512046813965, 2.0236361026763916, 2.0892210006713867, 2.154805898666382, 2.220390558242798, 2.285975456237793, 2.351560354232788, 2.417145252227783, 2.482729911804199, 2.5483148097991943, 2.6138994693756104]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 11.0, 9.0, 9.0, 11.0, 17.0, 19.0, 17.0, 17.0, 22.0, 30.0, 22.0, 29.0, 31.0, 36.0, 35.0, 31.0, 39.0, 47.0, 53.0, 48.0, 37.0, 49.0, 31.0, 43.0, 39.0, 42.0, 38.0, 28.0, 17.0, 21.0, 19.0, 15.0, 10.0, 15.0, 13.0, 8.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-1.1979303359985352, -1.1631454229354858, -1.1283605098724365, -1.0935757160186768, -1.0587908029556274, -1.0240058898925781, -0.9892209768295288, -0.9544361233711243, -0.9196512699127197, -0.8848663568496704, -0.8500815033912659, -0.8152965903282166, -0.780511736869812, -0.7457268238067627, -0.7109419107437134, -0.6761570572853088, -0.6413721442222595, -0.6065872311592102, -0.5718023777008057, -0.5370174646377563, -0.5022326111793518, -0.4674476981163025, -0.43266281485557556, -0.39787793159484863, -0.3630930483341217, -0.3283081650733948, -0.29352328181266785, -0.2587383985519409, -0.2239535003900528, -0.18916861712932587, -0.15438371896743774, -0.11959883570671082, -0.08481395244598389, -0.05002906545996666, -0.015244178473949432, 0.019540712237358093, 0.05432559549808502, 0.08911047875881195, 0.12389537692070007, 0.158680260181427, 0.19346514344215393, 0.22825002670288086, 0.2630349099636078, 0.2978197932243347, 0.33260470628738403, 0.3673895597457886, 0.4021744728088379, 0.4369593560695648, 0.47174423933029175, 0.5065291523933411, 0.5413140058517456, 0.5760989189147949, 0.6108837723731995, 0.6456686854362488, 0.6804535388946533, 0.7152384519577026, 0.750023365020752, 0.7848082780838013, 0.8195931315422058, 0.8543780446052551, 0.8891628980636597, 0.923947811126709, 0.9587327241897583, 0.9935175776481628, 1.0283024311065674]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 30.0, 35.0, 49.0, 96.0, 126.0, 171.0, 280.0, 486.0, 836.0, 1331.0, 2272.0, 4554.0, 8752.0, 18639.0, 43829.0, 125255.0, 669655.0, 2987207.0, 214559.0, 64743.0, 25998.0, 11850.0, 5945.0, 3177.0, 1764.0, 979.0, 583.0, 361.0, 219.0, 142.0, 94.0, 66.0, 42.0, 32.0, 24.0, 16.0, 3.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.1438770294189453, -0.13895034790039062, -0.13402366638183594, -0.12909698486328125, -0.12417030334472656, -0.11924362182617188, -0.11431694030761719, -0.1093902587890625, -0.10446357727050781, -0.09953689575195312, -0.09461021423339844, -0.08968353271484375, -0.08475685119628906, -0.07983016967773438, -0.07490348815917969, -0.069976806640625, -0.06505012512207031, -0.060123443603515625, -0.05519676208496094, -0.05027008056640625, -0.04534339904785156, -0.040416717529296875, -0.03549003601074219, -0.0305633544921875, -0.025636672973632812, -0.020709991455078125, -0.015783309936523438, -0.01085662841796875, -0.0059299468994140625, -0.001003265380859375, 0.0039234161376953125, 0.00885009765625, 0.013776779174804688, 0.018703460693359375, 0.023630142211914062, 0.02855682373046875, 0.03348350524902344, 0.038410186767578125, 0.04333686828613281, 0.0482635498046875, 0.05319023132324219, 0.058116912841796875, 0.06304359436035156, 0.06797027587890625, 0.07289695739746094, 0.07782363891601562, 0.08275032043457031, 0.087677001953125, 0.09260368347167969, 0.09753036499023438, 0.10245704650878906, 0.10738372802734375, 0.11231040954589844, 0.11723709106445312, 0.12216377258300781, 0.1270904541015625, 0.1320171356201172, 0.13694381713867188, 0.14187049865722656, 0.14679718017578125, 0.15172386169433594, 0.15665054321289062, 0.1615772247314453, 0.16650390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 12.0, 8.0, 9.0, 24.0, 21.0, 23.0, 26.0, 27.0, 28.0, 32.0, 40.0, 38.0, 33.0, 57.0, 46.0, 60.0, 46.0, 47.0, 40.0, 39.0, 54.0, 38.0, 31.0, 30.0, 29.0, 30.0, 21.0, 15.0, 19.0, 13.0, 11.0, 8.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.04653644561767578, -0.04512977600097656, -0.043723106384277344, -0.042316436767578125, -0.040909767150878906, -0.03950309753417969, -0.03809642791748047, -0.03668975830078125, -0.03528308868408203, -0.03387641906738281, -0.032469749450683594, -0.031063079833984375, -0.029656410217285156, -0.028249740600585938, -0.02684307098388672, -0.0254364013671875, -0.02402973175048828, -0.022623062133789062, -0.021216392517089844, -0.019809722900390625, -0.018403053283691406, -0.016996383666992188, -0.015589714050292969, -0.01418304443359375, -0.012776374816894531, -0.011369705200195312, -0.009963035583496094, -0.008556365966796875, -0.007149696350097656, -0.0057430267333984375, -0.004336357116699219, -0.0029296875, -0.0015230178833007812, -0.0001163482666015625, 0.0012903213500976562, 0.002696990966796875, 0.004103660583496094, 0.0055103302001953125, 0.006916999816894531, 0.00832366943359375, 0.009730339050292969, 0.011137008666992188, 0.012543678283691406, 0.013950347900390625, 0.015357017517089844, 0.016763687133789062, 0.01817035675048828, 0.0195770263671875, 0.02098369598388672, 0.022390365600585938, 0.023797035217285156, 0.025203704833984375, 0.026610374450683594, 0.028017044067382812, 0.02942371368408203, 0.03083038330078125, 0.03223705291748047, 0.03364372253417969, 0.035050392150878906, 0.036457061767578125, 0.037863731384277344, 0.03927040100097656, 0.04067707061767578, 0.042083740234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 8.0, 14.0, 26.0, 35.0, 31.0, 53.0, 79.0, 132.0, 168.0, 224.0, 371.0, 594.0, 1083.0, 2144.0, 5289.0, 15918.0, 64077.0, 463158.0, 3385403.0, 199435.0, 37699.0, 10504.0, 3797.0, 1637.0, 832.0, 483.0, 331.0, 252.0, 137.0, 98.0, 66.0, 57.0, 33.0, 20.0, 21.0, 16.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2672767639160156, -0.25672149658203125, -0.24616622924804688, -0.2356109619140625, -0.22505569458007812, -0.21450042724609375, -0.20394515991210938, -0.193389892578125, -0.18283462524414062, -0.17227935791015625, -0.16172409057617188, -0.1511688232421875, -0.14061355590820312, -0.13005828857421875, -0.11950302124023438, -0.10894775390625, -0.09839248657226562, -0.08783721923828125, -0.07728195190429688, -0.0667266845703125, -0.056171417236328125, -0.04561614990234375, -0.035060882568359375, -0.024505615234375, -0.013950347900390625, -0.00339508056640625, 0.007160186767578125, 0.0177154541015625, 0.028270721435546875, 0.03882598876953125, 0.049381256103515625, 0.0599365234375, 0.07049179077148438, 0.08104705810546875, 0.09160232543945312, 0.1021575927734375, 0.11271286010742188, 0.12326812744140625, 0.13382339477539062, 0.144378662109375, 0.15493392944335938, 0.16548919677734375, 0.17604446411132812, 0.1865997314453125, 0.19715499877929688, 0.20771026611328125, 0.21826553344726562, 0.22882080078125, 0.23937606811523438, 0.24993133544921875, 0.2604866027832031, 0.2710418701171875, 0.2815971374511719, 0.29215240478515625, 0.3027076721191406, 0.313262939453125, 0.3238182067871094, 0.33437347412109375, 0.3449287414550781, 0.3554840087890625, 0.3660392761230469, 0.37659454345703125, 0.3871498107910156, 0.397705078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 9.0, 9.0, 20.0, 32.0, 32.0, 75.0, 131.0, 256.0, 1021.0, 1721.0, 310.0, 207.0, 90.0, 53.0, 26.0, 27.0, 15.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2645606994628906, -0.25812530517578125, -0.2516899108886719, -0.2452545166015625, -0.23881912231445312, -0.23238372802734375, -0.22594833374023438, -0.219512939453125, -0.21307754516601562, -0.20664215087890625, -0.20020675659179688, -0.1937713623046875, -0.18733596801757812, -0.18090057373046875, -0.17446517944335938, -0.16802978515625, -0.16159439086914062, -0.15515899658203125, -0.14872360229492188, -0.1422882080078125, -0.13585281372070312, -0.12941741943359375, -0.12298202514648438, -0.116546630859375, -0.11011123657226562, -0.10367584228515625, -0.09724044799804688, -0.0908050537109375, -0.08436965942382812, -0.07793426513671875, -0.07149887084960938, -0.0650634765625, -0.058628082275390625, -0.05219268798828125, -0.045757293701171875, -0.0393218994140625, -0.032886505126953125, -0.02645111083984375, -0.020015716552734375, -0.013580322265625, -0.007144927978515625, -0.00070953369140625, 0.005725860595703125, 0.0121612548828125, 0.018596649169921875, 0.02503204345703125, 0.031467437744140625, 0.03790283203125, 0.044338226318359375, 0.05077362060546875, 0.057209014892578125, 0.0636444091796875, 0.07007980346679688, 0.07651519775390625, 0.08295059204101562, 0.089385986328125, 0.09582138061523438, 0.10225677490234375, 0.10869216918945312, 0.1151275634765625, 0.12156295776367188, 0.12799835205078125, 0.13443374633789062, 0.140869140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 13.0, 29.0, 70.0, 204.0, 324.0, 223.0, 101.0, 19.0, 13.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.812553882598877, -3.7325737476348877, -3.6525933742523193, -3.57261323928833, -3.492633104324341, -3.4126529693603516, -3.332672595977783, -3.252692461013794, -3.1727123260498047, -3.0927321910858154, -3.012751817703247, -2.932771682739258, -2.8527915477752686, -2.7728114128112793, -2.692831039428711, -2.6128509044647217, -2.5328707695007324, -2.452890634536743, -2.372910261154175, -2.2929301261901855, -2.2129499912261963, -2.132969856262207, -2.0529894828796387, -1.9730093479156494, -1.893028974533081, -1.8130487203598022, -1.733068585395813, -1.6530883312225342, -1.573108196258545, -1.4931279420852661, -1.4131476879119873, -1.333167552947998, -1.2531875371932983, -1.1732072830200195, -1.0932271480560303, -1.0132468938827515, -0.9332667589187622, -0.8532865047454834, -0.7733063101768494, -0.6933261156082153, -0.6133459210395813, -0.5333657264709473, -0.45338553190231323, -0.3734053075313568, -0.2934251129627228, -0.21344491839408875, -0.13346469402313232, -0.05348449945449829, 0.026495695114135742, 0.10647589713335037, 0.186456099152565, 0.26643630862236023, 0.34641650319099426, 0.4263966977596283, 0.5063769221305847, 0.5863571166992188, 0.6663373112678528, 0.7463175058364868, 0.8262977004051208, 0.9062778949737549, 0.9862581491470337, 1.066238284111023, 1.1462185382843018, 1.226198673248291, 1.3061789274215698]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 15.0, 13.0, 25.0, 32.0, 28.0, 44.0, 28.0, 39.0, 24.0, 37.0, 45.0, 44.0, 54.0, 56.0, 45.0, 39.0, 50.0, 42.0, 35.0, 46.0, 36.0, 36.0, 33.0, 32.0, 21.0, 13.0, 11.0, 14.0, 8.0, 10.0, 9.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5369692444801331, -0.5185194611549377, -0.5000696778297424, -0.4816198945045471, -0.4631701111793518, -0.4447203278541565, -0.4262705147266388, -0.4078207314014435, -0.38937094807624817, -0.37092116475105286, -0.35247138142585754, -0.33402159810066223, -0.31557178497314453, -0.2971220016479492, -0.2786722183227539, -0.2602224349975586, -0.24177265167236328, -0.22332286834716797, -0.20487308502197266, -0.18642328679561615, -0.16797350347042084, -0.14952372014522552, -0.13107392191886902, -0.1126241385936737, -0.0941743552684784, -0.07572457194328308, -0.05727478116750717, -0.03882499411702156, -0.02037520706653595, -0.0019254237413406372, 0.016524367034435272, 0.03497415781021118, 0.05342400074005127, 0.07187378406524658, 0.09032357484102249, 0.1087733656167984, 0.1272231489419937, 0.14567293226718903, 0.16412273049354553, 0.18257251381874084, 0.20102229714393616, 0.21947208046913147, 0.23792186379432678, 0.2563716471195221, 0.2748214602470398, 0.2932712435722351, 0.3117210268974304, 0.33017081022262573, 0.34862059354782104, 0.36707037687301636, 0.38552016019821167, 0.403969943523407, 0.4224197268486023, 0.4408695101737976, 0.4593193233013153, 0.4777691066265106, 0.49621888995170593, 0.5146687030792236, 0.533118486404419, 0.5515682697296143, 0.5700180530548096, 0.5884678363800049, 0.6069176197052002, 0.6253674030303955, 0.6438171863555908]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 1.0, 7.0, 18.0, 26.0, 29.0, 55.0, 78.0, 131.0, 187.0, 260.0, 438.0, 767.0, 1336.0, 2276.0, 4100.0, 7388.0, 14121.0, 27267.0, 53901.0, 109728.0, 213314.0, 271654.0, 169939.0, 83604.0, 41551.0, 21521.0, 10907.0, 5923.0, 3407.0, 1841.0, 1131.0, 614.0, 382.0, 234.0, 148.0, 92.0, 50.0, 42.0, 29.0, 21.0, 6.0, 12.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1276378631591797, -0.12356185913085938, -0.11948585510253906, -0.11540985107421875, -0.11133384704589844, -0.10725784301757812, -0.10318183898925781, -0.0991058349609375, -0.09502983093261719, -0.09095382690429688, -0.08687782287597656, -0.08280181884765625, -0.07872581481933594, -0.07464981079101562, -0.07057380676269531, -0.066497802734375, -0.06242179870605469, -0.058345794677734375, -0.05426979064941406, -0.05019378662109375, -0.04611778259277344, -0.042041778564453125, -0.03796577453613281, -0.0338897705078125, -0.029813766479492188, -0.025737762451171875, -0.021661758422851562, -0.01758575439453125, -0.013509750366210938, -0.009433746337890625, -0.0053577423095703125, -0.00128173828125, 0.0027942657470703125, 0.006870269775390625, 0.010946273803710938, 0.01502227783203125, 0.019098281860351562, 0.023174285888671875, 0.027250289916992188, 0.0313262939453125, 0.03540229797363281, 0.039478302001953125, 0.04355430603027344, 0.04763031005859375, 0.05170631408691406, 0.055782318115234375, 0.05985832214355469, 0.063934326171875, 0.06801033020019531, 0.07208633422851562, 0.07616233825683594, 0.08023834228515625, 0.08431434631347656, 0.08839035034179688, 0.09246635437011719, 0.0965423583984375, 0.10061836242675781, 0.10469436645507812, 0.10877037048339844, 0.11284637451171875, 0.11692237854003906, 0.12099838256835938, 0.1250743865966797, 0.129150390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 23.0, 17.0, 27.0, 11.0, 29.0, 23.0, 36.0, 32.0, 42.0, 43.0, 43.0, 52.0, 42.0, 47.0, 43.0, 41.0, 33.0, 38.0, 40.0, 37.0, 28.0, 29.0, 30.0, 34.0, 21.0, 23.0, 17.0, 12.0, 15.0, 8.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.053375244140625, -0.05192375183105469, -0.050472259521484375, -0.04902076721191406, -0.04756927490234375, -0.04611778259277344, -0.044666290283203125, -0.04321479797363281, -0.0417633056640625, -0.04031181335449219, -0.038860321044921875, -0.03740882873535156, -0.03595733642578125, -0.03450584411621094, -0.033054351806640625, -0.03160285949707031, -0.0301513671875, -0.028699874877929688, -0.027248382568359375, -0.025796890258789062, -0.02434539794921875, -0.022893905639648438, -0.021442413330078125, -0.019990921020507812, -0.0185394287109375, -0.017087936401367188, -0.015636444091796875, -0.014184951782226562, -0.01273345947265625, -0.011281967163085938, -0.009830474853515625, -0.008378982543945312, -0.006927490234375, -0.0054759979248046875, -0.004024505615234375, -0.0025730133056640625, -0.00112152099609375, 0.0003299713134765625, 0.001781463623046875, 0.0032329559326171875, 0.0046844482421875, 0.0061359405517578125, 0.007587432861328125, 0.009038925170898438, 0.01049041748046875, 0.011941909790039062, 0.013393402099609375, 0.014844894409179688, 0.01629638671875, 0.017747879028320312, 0.019199371337890625, 0.020650863647460938, 0.02210235595703125, 0.023553848266601562, 0.025005340576171875, 0.026456832885742188, 0.0279083251953125, 0.029359817504882812, 0.030811309814453125, 0.03226280212402344, 0.03371429443359375, 0.03516578674316406, 0.036617279052734375, 0.03806877136230469, 0.039520263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 6.0, 6.0, 13.0, 10.0, 23.0, 30.0, 35.0, 46.0, 65.0, 97.0, 141.0, 224.0, 377.0, 571.0, 1283.0, 2760.0, 7724.0, 28573.0, 148352.0, 596558.0, 207935.0, 37562.0, 9483.0, 3300.0, 1400.0, 697.0, 430.0, 262.0, 183.0, 139.0, 79.0, 44.0, 38.0, 36.0, 22.0, 12.0, 9.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38037109375, -0.3699760437011719, -0.35958099365234375, -0.3491859436035156, -0.3387908935546875, -0.3283958435058594, -0.31800079345703125, -0.3076057434082031, -0.297210693359375, -0.2868156433105469, -0.27642059326171875, -0.2660255432128906, -0.2556304931640625, -0.24523544311523438, -0.23484039306640625, -0.22444534301757812, -0.21405029296875, -0.20365524291992188, -0.19326019287109375, -0.18286514282226562, -0.1724700927734375, -0.16207504272460938, -0.15167999267578125, -0.14128494262695312, -0.130889892578125, -0.12049484252929688, -0.11009979248046875, -0.09970474243164062, -0.0893096923828125, -0.07891464233398438, -0.06851959228515625, -0.058124542236328125, -0.0477294921875, -0.037334442138671875, -0.02693939208984375, -0.016544342041015625, -0.0061492919921875, 0.004245758056640625, 0.01464080810546875, 0.025035858154296875, 0.035430908203125, 0.045825958251953125, 0.05622100830078125, 0.06661605834960938, 0.0770111083984375, 0.08740615844726562, 0.09780120849609375, 0.10819625854492188, 0.11859130859375, 0.12898635864257812, 0.13938140869140625, 0.14977645874023438, 0.1601715087890625, 0.17056655883789062, 0.18096160888671875, 0.19135665893554688, 0.201751708984375, 0.21214675903320312, 0.22254180908203125, 0.23293685913085938, 0.2433319091796875, 0.2537269592285156, 0.26412200927734375, 0.2745170593261719, 0.284912109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 3.0, 5.0, 5.0, 8.0, 18.0, 12.0, 12.0, 23.0, 20.0, 20.0, 17.0, 33.0, 45.0, 36.0, 37.0, 39.0, 49.0, 55.0, 55.0, 58.0, 52.0, 51.0, 46.0, 41.0, 34.0, 28.0, 33.0, 38.0, 30.0, 19.0, 17.0, 12.0, 12.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.36083984375, -0.3508110046386719, -0.34078216552734375, -0.3307533264160156, -0.3207244873046875, -0.3106956481933594, -0.30066680908203125, -0.2906379699707031, -0.280609130859375, -0.2705802917480469, -0.26055145263671875, -0.2505226135253906, -0.2404937744140625, -0.23046493530273438, -0.22043609619140625, -0.21040725708007812, -0.20037841796875, -0.19034957885742188, -0.18032073974609375, -0.17029190063476562, -0.1602630615234375, -0.15023422241210938, -0.14020538330078125, -0.13017654418945312, -0.120147705078125, -0.11011886596679688, -0.10009002685546875, -0.09006118774414062, -0.0800323486328125, -0.07000350952148438, -0.05997467041015625, -0.049945831298828125, -0.0399169921875, -0.029888153076171875, -0.01985931396484375, -0.009830474853515625, 0.0001983642578125, 0.010227203369140625, 0.02025604248046875, 0.030284881591796875, 0.040313720703125, 0.050342559814453125, 0.06037139892578125, 0.07040023803710938, 0.0804290771484375, 0.09045791625976562, 0.10048675537109375, 0.11051559448242188, 0.12054443359375, 0.13057327270507812, 0.14060211181640625, 0.15063095092773438, 0.1606597900390625, 0.17068862915039062, 0.18071746826171875, 0.19074630737304688, 0.200775146484375, 0.21080398559570312, 0.22083282470703125, 0.23086166381835938, 0.2408905029296875, 0.2509193420410156, 0.26094818115234375, 0.2709770202636719, 0.281005859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 2.0, 3.0, 7.0, 16.0, 13.0, 22.0, 26.0, 34.0, 64.0, 105.0, 176.0, 339.0, 678.0, 1296.0, 2838.0, 7585.0, 22981.0, 98642.0, 461058.0, 354430.0, 70156.0, 17373.0, 5919.0, 2413.0, 1111.0, 556.0, 265.0, 161.0, 106.0, 55.0, 34.0, 25.0, 21.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.14972496032714844, -0.14454269409179688, -0.1393604278564453, -0.13417816162109375, -0.1289958953857422, -0.12381362915039062, -0.11863136291503906, -0.1134490966796875, -0.10826683044433594, -0.10308456420898438, -0.09790229797363281, -0.09272003173828125, -0.08753776550292969, -0.08235549926757812, -0.07717323303222656, -0.071990966796875, -0.06680870056152344, -0.061626434326171875, -0.05644416809082031, -0.05126190185546875, -0.04607963562011719, -0.040897369384765625, -0.03571510314941406, -0.0305328369140625, -0.025350570678710938, -0.020168304443359375, -0.014986038208007812, -0.00980377197265625, -0.0046215057373046875, 0.000560760498046875, 0.0057430267333984375, 0.01092529296875, 0.016107559204101562, 0.021289825439453125, 0.026472091674804688, 0.03165435791015625, 0.03683662414550781, 0.042018890380859375, 0.04720115661621094, 0.0523834228515625, 0.05756568908691406, 0.06274795532226562, 0.06793022155761719, 0.07311248779296875, 0.07829475402832031, 0.08347702026367188, 0.08865928649902344, 0.093841552734375, 0.09902381896972656, 0.10420608520507812, 0.10938835144042969, 0.11457061767578125, 0.11975288391113281, 0.12493515014648438, 0.13011741638183594, 0.1352996826171875, 0.14048194885253906, 0.14566421508789062, 0.1508464813232422, 0.15602874755859375, 0.1612110137939453, 0.16639328002929688, 0.17157554626464844, 0.1767578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 17.0, 12.0, 13.0, 24.0, 33.0, 41.0, 34.0, 47.0, 50.0, 61.0, 59.0, 36.0, 63.0, 60.0, 52.0, 57.0, 44.0, 39.0, 35.0, 33.0, 38.0, 25.0, 17.0, 18.0, 11.0, 11.0, 10.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6372413635253906e-05, -4.494283348321915e-05, -4.351325333118439e-05, -4.208367317914963e-05, -4.065409302711487e-05, -3.922451287508011e-05, -3.779493272304535e-05, -3.636535257101059e-05, -3.493577241897583e-05, -3.350619226694107e-05, -3.207661211490631e-05, -3.064703196287155e-05, -2.9217451810836792e-05, -2.7787871658802032e-05, -2.6358291506767273e-05, -2.4928711354732513e-05, -2.3499131202697754e-05, -2.2069551050662994e-05, -2.0639970898628235e-05, -1.9210390746593475e-05, -1.7780810594558716e-05, -1.6351230442523956e-05, -1.4921650290489197e-05, -1.3492070138454437e-05, -1.2062489986419678e-05, -1.0632909834384918e-05, -9.203329682350159e-06, -7.7737495303154e-06, -6.34416937828064e-06, -4.91458922624588e-06, -3.4850090742111206e-06, -2.055428922176361e-06, -6.258487701416016e-07, 8.03731381893158e-07, 2.2333115339279175e-06, 3.662891685962677e-06, 5.0924718379974365e-06, 6.522051990032196e-06, 7.951632142066956e-06, 9.381212294101715e-06, 1.0810792446136475e-05, 1.2240372598171234e-05, 1.3669952750205994e-05, 1.5099532902240753e-05, 1.6529113054275513e-05, 1.7958693206310272e-05, 1.9388273358345032e-05, 2.081785351037979e-05, 2.224743366241455e-05, 2.367701381444931e-05, 2.510659396648407e-05, 2.653617411851883e-05, 2.796575427055359e-05, 2.939533442258835e-05, 3.082491457462311e-05, 3.225449472665787e-05, 3.368407487869263e-05, 3.5113655030727386e-05, 3.6543235182762146e-05, 3.7972815334796906e-05, 3.9402395486831665e-05, 4.0831975638866425e-05, 4.2261555790901184e-05, 4.3691135942935944e-05, 4.51207160949707e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 0.0, 3.0, 5.0, 6.0, 8.0, 13.0, 17.0, 36.0, 47.0, 70.0, 92.0, 129.0, 216.0, 414.0, 701.0, 1491.0, 3304.0, 8924.0, 30162.0, 142562.0, 547033.0, 244950.0, 47254.0, 12742.0, 4496.0, 1767.0, 860.0, 486.0, 284.0, 174.0, 102.0, 46.0, 55.0, 22.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1761474609375, -0.1709136962890625, -0.165679931640625, -0.1604461669921875, -0.15521240234375, -0.1499786376953125, -0.144744873046875, -0.1395111083984375, -0.13427734375, -0.1290435791015625, -0.123809814453125, -0.1185760498046875, -0.11334228515625, -0.1081085205078125, -0.102874755859375, -0.0976409912109375, -0.0924072265625, -0.0871734619140625, -0.081939697265625, -0.0767059326171875, -0.07147216796875, -0.0662384033203125, -0.061004638671875, -0.0557708740234375, -0.050537109375, -0.0453033447265625, -0.040069580078125, -0.0348358154296875, -0.02960205078125, -0.0243682861328125, -0.019134521484375, -0.0139007568359375, -0.0086669921875, -0.0034332275390625, 0.001800537109375, 0.0070343017578125, 0.01226806640625, 0.0175018310546875, 0.022735595703125, 0.0279693603515625, 0.033203125, 0.0384368896484375, 0.043670654296875, 0.0489044189453125, 0.05413818359375, 0.0593719482421875, 0.064605712890625, 0.0698394775390625, 0.0750732421875, 0.0803070068359375, 0.085540771484375, 0.0907745361328125, 0.09600830078125, 0.1012420654296875, 0.106475830078125, 0.1117095947265625, 0.116943359375, 0.1221771240234375, 0.127410888671875, 0.1326446533203125, 0.13787841796875, 0.1431121826171875, 0.148345947265625, 0.1535797119140625, 0.1588134765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 17.0, 10.0, 21.0, 32.0, 49.0, 62.0, 73.0, 98.0, 88.0, 110.0, 100.0, 93.0, 62.0, 31.0, 27.0, 29.0, 17.0, 14.0, 15.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1875, -0.18230819702148438, -0.17711639404296875, -0.17192459106445312, -0.1667327880859375, -0.16154098510742188, -0.15634918212890625, -0.15115737915039062, -0.145965576171875, -0.14077377319335938, -0.13558197021484375, -0.13039016723632812, -0.1251983642578125, -0.12000656127929688, -0.11481475830078125, -0.10962295532226562, -0.10443115234375, -0.09923934936523438, -0.09404754638671875, -0.08885574340820312, -0.0836639404296875, -0.07847213745117188, -0.07328033447265625, -0.06808853149414062, -0.062896728515625, -0.057704925537109375, -0.05251312255859375, -0.047321319580078125, -0.0421295166015625, -0.036937713623046875, -0.03174591064453125, -0.026554107666015625, -0.0213623046875, -0.016170501708984375, -0.01097869873046875, -0.005786895751953125, -0.0005950927734375, 0.004596710205078125, 0.00978851318359375, 0.014980316162109375, 0.020172119140625, 0.025363922119140625, 0.03055572509765625, 0.035747528076171875, 0.0409393310546875, 0.046131134033203125, 0.05132293701171875, 0.056514739990234375, 0.06170654296875, 0.06689834594726562, 0.07209014892578125, 0.07728195190429688, 0.0824737548828125, 0.08766555786132812, 0.09285736083984375, 0.09804916381835938, 0.103240966796875, 0.10843276977539062, 0.11362457275390625, 0.11881637573242188, 0.1240081787109375, 0.12919998168945312, 0.13439178466796875, 0.13958358764648438, 0.144775390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 16.0, 63.0, 181.0, 290.0, 263.0, 153.0, 27.0, 11.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2634855508804321, -1.082746982574463, -0.9020082950592041, -0.7212697267532349, -0.5405310988426208, -0.35979247093200684, -0.1790539026260376, 0.0016847848892211914, 0.18242335319519043, 0.36316198110580444, 0.5439006090164185, 0.7246391773223877, 0.9053778052330017, 1.0861164331436157, 1.266855001449585, 1.4475936889648438, 1.628332257270813, 1.8090708255767822, 1.989809513092041, 2.1705479621887207, 2.3512866497039795, 2.5320253372192383, 2.712763786315918, 2.893502712249756, 3.0742411613464355, 3.2549798488616943, 3.435718297958374, 3.616456985473633, 3.7971956729888916, 3.9779343605041504, 4.15867280960083, 4.339411735534668, 4.5201497077941895, 4.700888156890869, 4.881627082824707, 5.062365531921387, 5.243103981018066, 5.423842906951904, 5.604581356048584, 5.785320281982422, 5.966058731079102, 6.146797180175781, 6.327536106109619, 6.508274555206299, 6.6890130043029785, 6.869751930236816, 7.050490379333496, 7.231228828430176, 7.4119672775268555, 7.592705726623535, 7.773444652557373, 7.954183101654053, 8.13492202758789, 8.31566047668457, 8.49639892578125, 8.67713737487793, 8.857876777648926, 9.038615226745605, 9.219353675842285, 9.400093078613281, 9.580831527709961, 9.76156997680664, 9.94230842590332, 10.123046875, 10.30378532409668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 7.0, 13.0, 6.0, 24.0, 15.0, 23.0, 17.0, 32.0, 32.0, 32.0, 44.0, 62.0, 45.0, 46.0, 48.0, 47.0, 41.0, 47.0, 43.0, 47.0, 41.0, 39.0, 51.0, 34.0, 29.0, 11.0, 19.0, 16.0, 14.0, 12.0, 9.0, 4.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7388379573822021, -1.6875922679901123, -1.636346459388733, -1.585100769996643, -1.5338549613952637, -1.4826092720031738, -1.431363582611084, -1.3801178932189941, -1.3288720846176147, -1.277626395225525, -1.2263805866241455, -1.1751348972320557, -1.1238892078399658, -1.0726433992385864, -1.0213977098464966, -0.970151960849762, -0.9189062118530273, -0.8676604628562927, -0.8164147138595581, -0.7651690244674683, -0.7139232754707336, -0.662677526473999, -0.6114318370819092, -0.5601860880851746, -0.5089403390884399, -0.4576945900917053, -0.4064488708972931, -0.35520315170288086, -0.30395740270614624, -0.2527116537094116, -0.2014659345149994, -0.15022021532058716, -0.09897446632385254, -0.047728732228279114, 0.0035170018672943115, 0.05476273596286774, 0.10600847005844116, 0.15725421905517578, 0.208499938249588, 0.25974565744400024, 0.31099140644073486, 0.3622371554374695, 0.4134828746318817, 0.46472859382629395, 0.5159743428230286, 0.5672200918197632, 0.618465781211853, 0.6697115302085876, 0.7209572792053223, 0.7722030282020569, 0.8234487771987915, 0.8746944665908813, 0.925940215587616, 0.9771859645843506, 1.0284316539764404, 1.0796773433685303, 1.1309231519699097, 1.1821688413619995, 1.233414649963379, 1.2846603393554688, 1.3359060287475586, 1.387151837348938, 1.4383975267410278, 1.4896433353424072, 1.540889024734497]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 12.0, 9.0, 19.0, 20.0, 36.0, 57.0, 69.0, 85.0, 152.0, 222.0, 366.0, 669.0, 1152.0, 2123.0, 4441.0, 10911.0, 39514.0, 3783656.0, 304383.0, 28948.0, 8917.0, 3840.0, 1998.0, 1020.0, 581.0, 380.0, 232.0, 137.0, 109.0, 56.0, 61.0, 25.0, 23.0, 18.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3593330383300781, -0.34903717041015625, -0.3387413024902344, -0.3284454345703125, -0.3181495666503906, -0.30785369873046875, -0.2975578308105469, -0.287261962890625, -0.2769660949707031, -0.26667022705078125, -0.2563743591308594, -0.2460784912109375, -0.23578262329101562, -0.22548675537109375, -0.21519088745117188, -0.20489501953125, -0.19459915161132812, -0.18430328369140625, -0.17400741577148438, -0.1637115478515625, -0.15341567993164062, -0.14311981201171875, -0.13282394409179688, -0.122528076171875, -0.11223220825195312, -0.10193634033203125, -0.09164047241210938, -0.0813446044921875, -0.07104873657226562, -0.06075286865234375, -0.050457000732421875, -0.0401611328125, -0.029865264892578125, -0.01956939697265625, -0.009273529052734375, 0.0010223388671875, 0.011318206787109375, 0.02161407470703125, 0.031909942626953125, 0.042205810546875, 0.052501678466796875, 0.06279754638671875, 0.07309341430664062, 0.0833892822265625, 0.09368515014648438, 0.10398101806640625, 0.11427688598632812, 0.12457275390625, 0.13486862182617188, 0.14516448974609375, 0.15546035766601562, 0.1657562255859375, 0.17605209350585938, 0.18634796142578125, 0.19664382934570312, 0.206939697265625, 0.21723556518554688, 0.22753143310546875, 0.23782730102539062, 0.2481231689453125, 0.2584190368652344, 0.26871490478515625, 0.2790107727050781, 0.289306640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 5.0, 16.0, 14.0, 9.0, 20.0, 25.0, 20.0, 30.0, 20.0, 32.0, 25.0, 40.0, 39.0, 48.0, 51.0, 46.0, 46.0, 47.0, 50.0, 34.0, 43.0, 47.0, 42.0, 41.0, 25.0, 26.0, 25.0, 22.0, 20.0, 18.0, 17.0, 11.0, 6.0, 2.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.056915283203125, -0.055274009704589844, -0.05363273620605469, -0.05199146270751953, -0.050350189208984375, -0.04870891571044922, -0.04706764221191406, -0.045426368713378906, -0.04378509521484375, -0.042143821716308594, -0.04050254821777344, -0.03886127471923828, -0.037220001220703125, -0.03557872772216797, -0.03393745422363281, -0.032296180725097656, -0.0306549072265625, -0.029013633728027344, -0.027372360229492188, -0.02573108673095703, -0.024089813232421875, -0.02244853973388672, -0.020807266235351562, -0.019165992736816406, -0.01752471923828125, -0.015883445739746094, -0.014242172241210938, -0.012600898742675781, -0.010959625244140625, -0.009318351745605469, -0.0076770782470703125, -0.006035804748535156, -0.00439453125, -0.0027532577514648438, -0.0011119842529296875, 0.0005292892456054688, 0.002170562744140625, 0.0038118362426757812, 0.0054531097412109375, 0.007094383239746094, 0.00873565673828125, 0.010376930236816406, 0.012018203735351562, 0.013659477233886719, 0.015300750732421875, 0.01694202423095703, 0.018583297729492188, 0.020224571228027344, 0.0218658447265625, 0.023507118225097656, 0.025148391723632812, 0.02678966522216797, 0.028430938720703125, 0.03007221221923828, 0.03171348571777344, 0.033354759216308594, 0.03499603271484375, 0.036637306213378906, 0.03827857971191406, 0.03991985321044922, 0.041561126708984375, 0.04320240020751953, 0.04484367370605469, 0.046484947204589844, 0.048126220703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 9.0, 11.0, 15.0, 30.0, 25.0, 43.0, 81.0, 94.0, 184.0, 282.0, 516.0, 1263.0, 4570.0, 51646.0, 4103893.0, 25922.0, 3428.0, 1070.0, 509.0, 248.0, 175.0, 77.0, 64.0, 35.0, 31.0, 19.0, 8.0, 11.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.17449951171875, -1.1370849609375, -1.09967041015625, -1.062255859375, -1.02484130859375, -0.9874267578125, -0.95001220703125, -0.91259765625, -0.87518310546875, -0.8377685546875, -0.80035400390625, -0.762939453125, -0.72552490234375, -0.6881103515625, -0.65069580078125, -0.61328125, -0.57586669921875, -0.5384521484375, -0.50103759765625, -0.463623046875, -0.42620849609375, -0.3887939453125, -0.35137939453125, -0.31396484375, -0.27655029296875, -0.2391357421875, -0.20172119140625, -0.164306640625, -0.12689208984375, -0.0894775390625, -0.05206298828125, -0.0146484375, 0.02276611328125, 0.0601806640625, 0.09759521484375, 0.135009765625, 0.17242431640625, 0.2098388671875, 0.24725341796875, 0.28466796875, 0.32208251953125, 0.3594970703125, 0.39691162109375, 0.434326171875, 0.47174072265625, 0.5091552734375, 0.54656982421875, 0.583984375, 0.62139892578125, 0.6588134765625, 0.69622802734375, 0.733642578125, 0.77105712890625, 0.8084716796875, 0.84588623046875, 0.88330078125, 0.92071533203125, 0.9581298828125, 0.99554443359375, 1.032958984375, 1.07037353515625, 1.1077880859375, 1.14520263671875, 1.1826171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 22.0, 58.0, 114.0, 3468.0, 251.0, 76.0, 24.0, 21.0, 15.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2231426239013672, -0.21752548217773438, -0.21190834045410156, -0.20629119873046875, -0.20067405700683594, -0.19505691528320312, -0.1894397735595703, -0.1838226318359375, -0.1782054901123047, -0.17258834838867188, -0.16697120666503906, -0.16135406494140625, -0.15573692321777344, -0.15011978149414062, -0.1445026397705078, -0.138885498046875, -0.1332683563232422, -0.12765121459960938, -0.12203407287597656, -0.11641693115234375, -0.11079978942871094, -0.10518264770507812, -0.09956550598144531, -0.0939483642578125, -0.08833122253417969, -0.08271408081054688, -0.07709693908691406, -0.07147979736328125, -0.06586265563964844, -0.060245513916015625, -0.05462837219238281, -0.04901123046875, -0.04339408874511719, -0.037776947021484375, -0.03215980529785156, -0.02654266357421875, -0.020925521850585938, -0.015308380126953125, -0.009691238403320312, -0.0040740966796875, 0.0015430450439453125, 0.007160186767578125, 0.012777328491210938, 0.01839447021484375, 0.024011611938476562, 0.029628753662109375, 0.03524589538574219, 0.040863037109375, 0.04648017883300781, 0.052097320556640625, 0.05771446228027344, 0.06333160400390625, 0.06894874572753906, 0.07456588745117188, 0.08018302917480469, 0.0858001708984375, 0.09141731262207031, 0.09703445434570312, 0.10265159606933594, 0.10826873779296875, 0.11388587951660156, 0.11950302124023438, 0.1251201629638672, 0.1307373046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 5.0, 5.0, 10.0, 19.0, 28.0, 50.0, 70.0, 100.0, 137.0, 144.0, 124.0, 115.0, 64.0, 45.0, 38.0, 20.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3986055850982666, -0.38072556257247925, -0.3628455400466919, -0.34496551752090454, -0.3270854949951172, -0.30920547246932983, -0.2913254201412201, -0.27344539761543274, -0.2555653750896454, -0.23768535256385803, -0.21980533003807068, -0.20192529261112213, -0.18404527008533478, -0.16616524755954742, -0.14828521013259888, -0.13040518760681152, -0.11252516508102417, -0.09464514255523682, -0.07676511257886887, -0.058885086327791214, -0.04100506007671356, -0.02312503755092621, -0.005245007574558258, 0.012635022401809692, 0.030515044927597046, 0.0483950711786747, 0.06627509742975235, 0.0841551274061203, 0.10203514993190765, 0.11991517245769501, 0.13779520988464355, 0.1556752324104309, 0.17355531454086304, 0.1914353370666504, 0.20931535959243774, 0.2271953970193863, 0.24507541954517365, 0.2629554271697998, 0.28083547949790955, 0.2987155020236969, 0.31659552454948425, 0.3344755470752716, 0.35235556960105896, 0.3702355921268463, 0.38811564445495605, 0.4059956669807434, 0.42387568950653076, 0.4417557120323181, 0.45963573455810547, 0.4775157570838928, 0.4953957796096802, 0.5132758021354675, 0.5311558246612549, 0.5490358471870422, 0.5669158697128296, 0.5847959518432617, 0.6026759147644043, 0.6205559372901917, 0.638435959815979, 0.6563159823417664, 0.6741960048675537, 0.6920760273933411, 0.7099560499191284, 0.7278361320495605, 0.7457161545753479]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 8.0, 16.0, 16.0, 24.0, 25.0, 24.0, 27.0, 32.0, 38.0, 41.0, 33.0, 34.0, 47.0, 41.0, 48.0, 48.0, 45.0, 54.0, 49.0, 49.0, 36.0, 33.0, 25.0, 27.0, 26.0, 27.0, 14.0, 24.0, 18.0, 13.0, 9.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24449318647384644, -0.23632627725601196, -0.2281593531370163, -0.21999244391918182, -0.21182551980018616, -0.20365861058235168, -0.1954917013645172, -0.18732477724552155, -0.17915785312652588, -0.1709909439086914, -0.16282401978969574, -0.15465711057186127, -0.1464901864528656, -0.13832327723503113, -0.13015636801719666, -0.12198944389820099, -0.11382253468036652, -0.10565561801195145, -0.09748870134353638, -0.0893217921257019, -0.08115486800670624, -0.07298795878887177, -0.0648210421204567, -0.056654125452041626, -0.048487208783626556, -0.04032029211521149, -0.03215337544679642, -0.023986462503671646, -0.015819545835256577, -0.007652629166841507, 0.0005142837762832642, 0.008681200444698334, 0.016848117113113403, 0.025015033781528473, 0.03318195044994354, 0.041348863393068314, 0.04951578006148338, 0.05768269672989845, 0.06584960967302322, 0.0740165263414383, 0.08218344300985336, 0.09035035967826843, 0.0985172763466835, 0.10668419301509857, 0.11485110223293304, 0.12301802635192871, 0.13118493556976318, 0.13935184478759766, 0.14751876890659332, 0.1556856781244278, 0.16385260224342346, 0.17201951146125793, 0.1801864355802536, 0.18835334479808807, 0.19652026891708374, 0.2046871781349182, 0.21285408735275269, 0.22102099657058716, 0.22918792068958282, 0.2373548299074173, 0.24552175402641296, 0.25368866324424744, 0.2618555724620819, 0.27002251148223877, 0.27818942070007324]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 9.0, 10.0, 20.0, 18.0, 30.0, 45.0, 71.0, 116.0, 201.0, 284.0, 471.0, 897.0, 1483.0, 2951.0, 6036.0, 12721.0, 28624.0, 64834.0, 139165.0, 246519.0, 257969.0, 154013.0, 71669.0, 31886.0, 14397.0, 6790.0, 3235.0, 1777.0, 946.0, 512.0, 282.0, 210.0, 129.0, 90.0, 46.0, 40.0, 20.0, 15.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.18896484375, -0.1835765838623047, -0.17818832397460938, -0.17280006408691406, -0.16741180419921875, -0.16202354431152344, -0.15663528442382812, -0.1512470245361328, -0.1458587646484375, -0.1404705047607422, -0.13508224487304688, -0.12969398498535156, -0.12430572509765625, -0.11891746520996094, -0.11352920532226562, -0.10814094543457031, -0.102752685546875, -0.09736442565917969, -0.09197616577148438, -0.08658790588378906, -0.08119964599609375, -0.07581138610839844, -0.07042312622070312, -0.06503486633300781, -0.0596466064453125, -0.05425834655761719, -0.048870086669921875, -0.04348182678222656, -0.03809356689453125, -0.03270530700683594, -0.027317047119140625, -0.021928787231445312, -0.01654052734375, -0.011152267456054688, -0.005764007568359375, -0.0003757476806640625, 0.00501251220703125, 0.010400772094726562, 0.015789031982421875, 0.021177291870117188, 0.0265655517578125, 0.03195381164550781, 0.037342071533203125, 0.04273033142089844, 0.04811859130859375, 0.05350685119628906, 0.058895111083984375, 0.06428337097167969, 0.069671630859375, 0.07505989074707031, 0.08044815063476562, 0.08583641052246094, 0.09122467041015625, 0.09661293029785156, 0.10200119018554688, 0.10738945007324219, 0.1127777099609375, 0.11816596984863281, 0.12355422973632812, 0.12894248962402344, 0.13433074951171875, 0.13971900939941406, 0.14510726928710938, 0.1504955291748047, 0.1558837890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 8.0, 12.0, 14.0, 20.0, 19.0, 32.0, 34.0, 34.0, 31.0, 44.0, 35.0, 59.0, 53.0, 55.0, 63.0, 56.0, 56.0, 42.0, 45.0, 47.0, 43.0, 44.0, 27.0, 32.0, 17.0, 17.0, 12.0, 11.0, 2.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.0791482925415039, -0.07669258117675781, -0.07423686981201172, -0.07178115844726562, -0.06932544708251953, -0.06686973571777344, -0.06441402435302734, -0.06195831298828125, -0.059502601623535156, -0.05704689025878906, -0.05459117889404297, -0.052135467529296875, -0.04967975616455078, -0.04722404479980469, -0.044768333435058594, -0.0423126220703125, -0.039856910705566406, -0.03740119934082031, -0.03494548797607422, -0.032489776611328125, -0.03003406524658203, -0.027578353881835938, -0.025122642517089844, -0.02266693115234375, -0.020211219787597656, -0.017755508422851562, -0.015299797058105469, -0.012844085693359375, -0.010388374328613281, -0.007932662963867188, -0.005476951599121094, -0.003021240234375, -0.0005655288696289062, 0.0018901824951171875, 0.004345893859863281, 0.006801605224609375, 0.009257316589355469, 0.011713027954101562, 0.014168739318847656, 0.01662445068359375, 0.019080162048339844, 0.021535873413085938, 0.02399158477783203, 0.026447296142578125, 0.02890300750732422, 0.03135871887207031, 0.033814430236816406, 0.0362701416015625, 0.038725852966308594, 0.04118156433105469, 0.04363727569580078, 0.046092987060546875, 0.04854869842529297, 0.05100440979003906, 0.053460121154785156, 0.05591583251953125, 0.058371543884277344, 0.06082725524902344, 0.06328296661376953, 0.06573867797851562, 0.06819438934326172, 0.07065010070800781, 0.0731058120727539, 0.0755615234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 14.0, 17.0, 26.0, 42.0, 58.0, 76.0, 125.0, 156.0, 220.0, 356.0, 590.0, 1095.0, 2266.0, 6164.0, 24554.0, 139184.0, 574057.0, 243029.0, 41159.0, 9096.0, 2872.0, 1306.0, 724.0, 422.0, 288.0, 177.0, 130.0, 82.0, 66.0, 47.0, 33.0, 20.0, 20.0, 16.0, 8.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3851776123046875, -0.373382568359375, -0.3615875244140625, -0.34979248046875, -0.3379974365234375, -0.326202392578125, -0.3144073486328125, -0.3026123046875, -0.2908172607421875, -0.279022216796875, -0.2672271728515625, -0.25543212890625, -0.2436370849609375, -0.231842041015625, -0.2200469970703125, -0.208251953125, -0.1964569091796875, -0.184661865234375, -0.1728668212890625, -0.16107177734375, -0.1492767333984375, -0.137481689453125, -0.1256866455078125, -0.1138916015625, -0.1020965576171875, -0.090301513671875, -0.0785064697265625, -0.06671142578125, -0.0549163818359375, -0.043121337890625, -0.0313262939453125, -0.01953125, -0.0077362060546875, 0.004058837890625, 0.0158538818359375, 0.02764892578125, 0.0394439697265625, 0.051239013671875, 0.0630340576171875, 0.0748291015625, 0.0866241455078125, 0.098419189453125, 0.1102142333984375, 0.12200927734375, 0.1338043212890625, 0.145599365234375, 0.1573944091796875, 0.169189453125, 0.1809844970703125, 0.192779541015625, 0.2045745849609375, 0.21636962890625, 0.2281646728515625, 0.239959716796875, 0.2517547607421875, 0.2635498046875, 0.2753448486328125, 0.287139892578125, 0.2989349365234375, 0.31072998046875, 0.3225250244140625, 0.334320068359375, 0.3461151123046875, 0.35791015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 17.0, 13.0, 16.0, 14.0, 20.0, 22.0, 22.0, 31.0, 24.0, 35.0, 37.0, 46.0, 38.0, 45.0, 41.0, 43.0, 38.0, 43.0, 32.0, 43.0, 47.0, 37.0, 30.0, 24.0, 26.0, 31.0, 21.0, 23.0, 23.0, 22.0, 13.0, 11.0, 15.0, 9.0, 10.0, 7.0, 0.0, 1.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.427978515625, -0.416259765625, -0.404541015625, -0.392822265625, -0.381103515625, -0.369384765625, -0.357666015625, -0.345947265625, -0.334228515625, -0.322509765625, -0.310791015625, -0.299072265625, -0.287353515625, -0.275634765625, -0.263916015625, -0.252197265625, -0.240478515625, -0.228759765625, -0.217041015625, -0.205322265625, -0.193603515625, -0.181884765625, -0.170166015625, -0.158447265625, -0.146728515625, -0.135009765625, -0.123291015625, -0.111572265625, -0.099853515625, -0.088134765625, -0.076416015625, -0.064697265625, -0.052978515625, -0.041259765625, -0.029541015625, -0.017822265625, -0.006103515625, 0.005615234375, 0.017333984375, 0.029052734375, 0.040771484375, 0.052490234375, 0.064208984375, 0.075927734375, 0.087646484375, 0.099365234375, 0.111083984375, 0.122802734375, 0.134521484375, 0.146240234375, 0.157958984375, 0.169677734375, 0.181396484375, 0.193115234375, 0.204833984375, 0.216552734375, 0.228271484375, 0.239990234375, 0.251708984375, 0.263427734375, 0.275146484375, 0.286865234375, 0.298583984375, 0.310302734375, 0.322021484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 9.0, 15.0, 11.0, 32.0, 49.0, 75.0, 99.0, 170.0, 262.0, 430.0, 792.0, 1485.0, 3002.0, 7105.0, 19581.0, 69625.0, 310408.0, 473215.0, 114843.0, 29439.0, 9710.0, 4014.0, 1868.0, 970.0, 528.0, 288.0, 153.0, 124.0, 80.0, 54.0, 31.0, 22.0, 17.0, 2.0, 7.0, 9.0, 12.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.192138671875, -0.18696975708007812, -0.18180084228515625, -0.17663192749023438, -0.1714630126953125, -0.16629409790039062, -0.16112518310546875, -0.15595626831054688, -0.150787353515625, -0.14561843872070312, -0.14044952392578125, -0.13528060913085938, -0.1301116943359375, -0.12494277954101562, -0.11977386474609375, -0.11460494995117188, -0.10943603515625, -0.10426712036132812, -0.09909820556640625, -0.09392929077148438, -0.0887603759765625, -0.08359146118164062, -0.07842254638671875, -0.07325363159179688, -0.068084716796875, -0.06291580200195312, -0.05774688720703125, -0.052577972412109375, -0.0474090576171875, -0.042240142822265625, -0.03707122802734375, -0.031902313232421875, -0.0267333984375, -0.021564483642578125, -0.01639556884765625, -0.011226654052734375, -0.0060577392578125, -0.000888824462890625, 0.00428009033203125, 0.009449005126953125, 0.014617919921875, 0.019786834716796875, 0.02495574951171875, 0.030124664306640625, 0.0352935791015625, 0.040462493896484375, 0.04563140869140625, 0.050800323486328125, 0.05596923828125, 0.061138153076171875, 0.06630706787109375, 0.07147598266601562, 0.0766448974609375, 0.08181381225585938, 0.08698272705078125, 0.09215164184570312, 0.097320556640625, 0.10248947143554688, 0.10765838623046875, 0.11282730102539062, 0.1179962158203125, 0.12316513061523438, 0.12833404541015625, 0.13350296020507812, 0.138671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 9.0, 21.0, 15.0, 28.0, 43.0, 50.0, 48.0, 66.0, 79.0, 72.0, 72.0, 76.0, 77.0, 70.0, 50.0, 59.0, 41.0, 21.0, 26.0, 13.0, 13.0, 15.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.458427429199219e-05, -4.2698346078395844e-05, -4.08124178647995e-05, -3.8926489651203156e-05, -3.704056143760681e-05, -3.515463322401047e-05, -3.3268705010414124e-05, -3.138277679681778e-05, -2.9496848583221436e-05, -2.761092036962509e-05, -2.5724992156028748e-05, -2.3839063942432404e-05, -2.195313572883606e-05, -2.0067207515239716e-05, -1.818127930164337e-05, -1.6295351088047028e-05, -1.4409422874450684e-05, -1.252349466085434e-05, -1.0637566447257996e-05, -8.751638233661652e-06, -6.865710020065308e-06, -4.979781806468964e-06, -3.0938535928726196e-06, -1.2079253792762756e-06, 6.780028343200684e-07, 2.5639310479164124e-06, 4.449859261512756e-06, 6.3357874751091e-06, 8.221715688705444e-06, 1.0107643902301788e-05, 1.1993572115898132e-05, 1.3879500329494476e-05, 1.576542854309082e-05, 1.7651356756687164e-05, 1.9537284970283508e-05, 2.1423213183879852e-05, 2.3309141397476196e-05, 2.519506961107254e-05, 2.7080997824668884e-05, 2.8966926038265228e-05, 3.085285425186157e-05, 3.2738782465457916e-05, 3.462471067905426e-05, 3.6510638892650604e-05, 3.839656710624695e-05, 4.028249531984329e-05, 4.2168423533439636e-05, 4.405435174703598e-05, 4.5940279960632324e-05, 4.782620817422867e-05, 4.971213638782501e-05, 5.1598064601421356e-05, 5.34839928150177e-05, 5.5369921028614044e-05, 5.725584924221039e-05, 5.914177745580673e-05, 6.1027705669403076e-05, 6.291363388299942e-05, 6.479956209659576e-05, 6.668549031019211e-05, 6.857141852378845e-05, 7.04573467373848e-05, 7.234327495098114e-05, 7.422920316457748e-05, 7.611513137817383e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 14.0, 18.0, 32.0, 50.0, 78.0, 145.0, 227.0, 484.0, 1203.0, 3606.0, 16141.0, 146322.0, 730744.0, 128888.0, 15009.0, 3399.0, 1181.0, 451.0, 242.0, 128.0, 61.0, 49.0, 24.0, 26.0, 10.0, 5.0, 1.0, 0.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.34808921813964844, -0.3394889831542969, -0.3308887481689453, -0.32228851318359375, -0.3136882781982422, -0.3050880432128906, -0.29648780822753906, -0.2878875732421875, -0.27928733825683594, -0.2706871032714844, -0.2620868682861328, -0.25348663330078125, -0.2448863983154297, -0.23628616333007812, -0.22768592834472656, -0.219085693359375, -0.21048545837402344, -0.20188522338867188, -0.1932849884033203, -0.18468475341796875, -0.1760845184326172, -0.16748428344726562, -0.15888404846191406, -0.1502838134765625, -0.14168357849121094, -0.13308334350585938, -0.12448310852050781, -0.11588287353515625, -0.10728263854980469, -0.09868240356445312, -0.09008216857910156, -0.08148193359375, -0.07288169860839844, -0.06428146362304688, -0.05568122863769531, -0.04708099365234375, -0.03848075866699219, -0.029880523681640625, -0.021280288696289062, -0.0126800537109375, -0.0040798187255859375, 0.004520416259765625, 0.013120651245117188, 0.02172088623046875, 0.030321121215820312, 0.038921356201171875, 0.04752159118652344, 0.056121826171875, 0.06472206115722656, 0.07332229614257812, 0.08192253112792969, 0.09052276611328125, 0.09912300109863281, 0.10772323608398438, 0.11632347106933594, 0.1249237060546875, 0.13352394104003906, 0.14212417602539062, 0.1507244110107422, 0.15932464599609375, 0.1679248809814453, 0.17652511596679688, 0.18512535095214844, 0.1937255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 8.0, 2.0, 3.0, 6.0, 11.0, 16.0, 26.0, 46.0, 40.0, 57.0, 70.0, 113.0, 103.0, 105.0, 95.0, 77.0, 66.0, 52.0, 39.0, 28.0, 14.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3070049285888672, -0.2995567321777344, -0.29210853576660156, -0.28466033935546875, -0.27721214294433594, -0.2697639465332031, -0.2623157501220703, -0.2548675537109375, -0.2474193572998047, -0.23997116088867188, -0.23252296447753906, -0.22507476806640625, -0.21762657165527344, -0.21017837524414062, -0.2027301788330078, -0.195281982421875, -0.1878337860107422, -0.18038558959960938, -0.17293739318847656, -0.16548919677734375, -0.15804100036621094, -0.15059280395507812, -0.1431446075439453, -0.1356964111328125, -0.1282482147216797, -0.12080001831054688, -0.11335182189941406, -0.10590362548828125, -0.09845542907714844, -0.09100723266601562, -0.08355903625488281, -0.07611083984375, -0.06866264343261719, -0.061214447021484375, -0.05376625061035156, -0.04631805419921875, -0.03886985778808594, -0.031421661376953125, -0.023973464965820312, -0.0165252685546875, -0.009077072143554688, -0.001628875732421875, 0.0058193206787109375, 0.01326751708984375, 0.020715713500976562, 0.028163909912109375, 0.03561210632324219, 0.043060302734375, 0.05050849914550781, 0.057956695556640625, 0.06540489196777344, 0.07285308837890625, 0.08030128479003906, 0.08774948120117188, 0.09519767761230469, 0.1026458740234375, 0.11009407043457031, 0.11754226684570312, 0.12499046325683594, 0.13243865966796875, 0.13988685607910156, 0.14733505249023438, 0.1547832489013672, 0.1622314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 20.0, 28.0, 48.0, 101.0, 150.0, 168.0, 144.0, 132.0, 77.0, 63.0, 28.0, 15.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.422314167022705, -3.3121464252471924, -3.2019784450531006, -3.091810703277588, -2.981642961502075, -2.8714752197265625, -2.7613072395324707, -2.651139497756958, -2.5409717559814453, -2.4308040142059326, -2.320636034011841, -2.210468292236328, -2.1003005504608154, -1.9901326894760132, -1.879964828491211, -1.7697970867156982, -1.6596291065216064, -1.5494612455368042, -1.4392935037612915, -1.3291256427764893, -1.2189579010009766, -1.1087900400161743, -0.9986221790313721, -0.8884543776512146, -0.7782865762710571, -0.6681187748908997, -0.5579509735107422, -0.44778311252593994, -0.33761531114578247, -0.227447509765625, -0.11727964878082275, -0.007111847400665283, 0.10305595397949219, 0.21322377026081085, 0.3233915865421295, 0.4335594177246094, 0.5437272191047668, 0.6538950204849243, 0.7640628814697266, 0.874230682849884, 0.9843984842300415, 1.0945663452148438, 1.2047340869903564, 1.3149019479751587, 1.425069808959961, 1.5352375507354736, 1.6454054117202759, 1.7555732727050781, 1.8657410144805908, 1.975908875465393, 2.0860767364501953, 2.196244478225708, 2.3064122200012207, 2.4165802001953125, 2.526747941970825, 2.636915683746338, 2.7470836639404297, 2.8572514057159424, 2.967419385910034, 3.077587127685547, 3.1877548694610596, 3.2979226112365723, 3.408090591430664, 3.5182583332061768, 3.6284260749816895]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 4.0, 10.0, 7.0, 9.0, 11.0, 17.0, 17.0, 15.0, 17.0, 18.0, 26.0, 43.0, 36.0, 36.0, 41.0, 48.0, 37.0, 42.0, 57.0, 63.0, 68.0, 63.0, 40.0, 38.0, 28.0, 21.0, 26.0, 34.0, 25.0, 17.0, 21.0, 16.0, 11.0, 5.0, 8.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2215898036956787, -2.1516826152801514, -2.081775426864624, -2.0118682384490967, -1.9419611692428589, -1.8720539808273315, -1.8021469116210938, -1.7322397232055664, -1.662332534790039, -1.5924253463745117, -1.5225181579589844, -1.4526110887527466, -1.3827039003372192, -1.312796711921692, -1.242889642715454, -1.1729824542999268, -1.1030752658843994, -1.033168077468872, -0.9632609486579895, -0.8933538198471069, -0.8234466314315796, -0.7535394430160522, -0.6836323142051697, -0.6137251853942871, -0.5438179969787598, -0.4739108383655548, -0.40400367975234985, -0.3340965211391449, -0.26418936252593994, -0.19428220391273499, -0.12437504529953003, -0.05446788668632507, 0.015439033508300781, 0.08534619212150574, 0.1552533507347107, 0.22516050934791565, 0.2950676679611206, 0.36497482657432556, 0.4348819851875305, 0.5047891139984131, 0.5746963024139404, 0.6446034908294678, 0.7145106196403503, 0.7844177484512329, 0.8543249368667603, 0.9242321252822876, 0.9941392540931702, 1.0640463829040527, 1.13395357131958, 1.2038607597351074, 1.2737679481506348, 1.3436750173568726, 1.4135822057724, 1.4834893941879272, 1.553396463394165, 1.6233036518096924, 1.6932108402252197, 1.763118028640747, 1.8330252170562744, 1.9029322862625122, 1.9728394746780396, 2.0427465438842773, 2.1126537322998047, 2.182560920715332, 2.2524681091308594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 14.0, 17.0, 19.0, 34.0, 36.0, 54.0, 91.0, 115.0, 152.0, 171.0, 295.0, 441.0, 657.0, 1004.0, 1652.0, 2742.0, 5049.0, 10061.0, 23905.0, 93171.0, 3890199.0, 114323.0, 26172.0, 10616.0, 5372.0, 2937.0, 1732.0, 1036.0, 683.0, 410.0, 346.0, 200.0, 140.0, 105.0, 78.0, 61.0, 49.0, 23.0, 27.0, 16.0, 13.0, 6.0, 8.0, 8.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.275390625, -0.26692962646484375, -0.2584686279296875, -0.25000762939453125, -0.241546630859375, -0.23308563232421875, -0.2246246337890625, -0.21616363525390625, -0.20770263671875, -0.19924163818359375, -0.1907806396484375, -0.18231964111328125, -0.173858642578125, -0.16539764404296875, -0.1569366455078125, -0.14847564697265625, -0.1400146484375, -0.13155364990234375, -0.1230926513671875, -0.11463165283203125, -0.106170654296875, -0.09770965576171875, -0.0892486572265625, -0.08078765869140625, -0.07232666015625, -0.06386566162109375, -0.0554046630859375, -0.04694366455078125, -0.038482666015625, -0.03002166748046875, -0.0215606689453125, -0.01309967041015625, -0.004638671875, 0.00382232666015625, 0.0122833251953125, 0.02074432373046875, 0.029205322265625, 0.03766632080078125, 0.0461273193359375, 0.05458831787109375, 0.06304931640625, 0.07151031494140625, 0.0799713134765625, 0.08843231201171875, 0.096893310546875, 0.10535430908203125, 0.1138153076171875, 0.12227630615234375, 0.1307373046875, 0.13919830322265625, 0.1476593017578125, 0.15612030029296875, 0.164581298828125, 0.17304229736328125, 0.1815032958984375, 0.18996429443359375, 0.19842529296875, 0.20688629150390625, 0.2153472900390625, 0.22380828857421875, 0.232269287109375, 0.24073028564453125, 0.2491912841796875, 0.25765228271484375, 0.26611328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 11.0, 13.0, 16.0, 21.0, 20.0, 24.0, 28.0, 32.0, 45.0, 49.0, 47.0, 49.0, 65.0, 57.0, 74.0, 45.0, 50.0, 39.0, 34.0, 43.0, 44.0, 38.0, 29.0, 20.0, 19.0, 7.0, 14.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 0.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0899658203125, -0.08747100830078125, -0.0849761962890625, -0.08248138427734375, -0.079986572265625, -0.07749176025390625, -0.0749969482421875, -0.07250213623046875, -0.07000732421875, -0.06751251220703125, -0.0650177001953125, -0.06252288818359375, -0.060028076171875, -0.05753326416015625, -0.0550384521484375, -0.05254364013671875, -0.050048828125, -0.04755401611328125, -0.0450592041015625, -0.04256439208984375, -0.040069580078125, -0.03757476806640625, -0.0350799560546875, -0.03258514404296875, -0.03009033203125, -0.02759552001953125, -0.0251007080078125, -0.02260589599609375, -0.020111083984375, -0.01761627197265625, -0.0151214599609375, -0.01262664794921875, -0.0101318359375, -0.00763702392578125, -0.0051422119140625, -0.00264739990234375, -0.000152587890625, 0.00234222412109375, 0.0048370361328125, 0.00733184814453125, 0.00982666015625, 0.01232147216796875, 0.0148162841796875, 0.01731109619140625, 0.019805908203125, 0.02230072021484375, 0.0247955322265625, 0.02729034423828125, 0.02978515625, 0.03227996826171875, 0.0347747802734375, 0.03726959228515625, 0.039764404296875, 0.04225921630859375, 0.0447540283203125, 0.04724884033203125, 0.04974365234375, 0.05223846435546875, 0.0547332763671875, 0.05722808837890625, 0.059722900390625, 0.06221771240234375, 0.0647125244140625, 0.06720733642578125, 0.0697021484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 10.0, 13.0, 14.0, 10.0, 27.0, 34.0, 50.0, 66.0, 70.0, 95.0, 124.0, 184.0, 235.0, 340.0, 487.0, 688.0, 1090.0, 1788.0, 3130.0, 6214.0, 14423.0, 42087.0, 277286.0, 3728689.0, 76521.0, 21432.0, 8687.0, 4117.0, 2203.0, 1237.0, 851.0, 589.0, 371.0, 309.0, 222.0, 144.0, 98.0, 97.0, 52.0, 38.0, 36.0, 31.0, 27.0, 19.0, 7.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.393798828125, -0.38228607177734375, -0.3707733154296875, -0.35926055908203125, -0.347747802734375, -0.33623504638671875, -0.3247222900390625, -0.31320953369140625, -0.30169677734375, -0.29018402099609375, -0.2786712646484375, -0.26715850830078125, -0.255645751953125, -0.24413299560546875, -0.2326202392578125, -0.22110748291015625, -0.2095947265625, -0.19808197021484375, -0.1865692138671875, -0.17505645751953125, -0.163543701171875, -0.15203094482421875, -0.1405181884765625, -0.12900543212890625, -0.11749267578125, -0.10597991943359375, -0.0944671630859375, -0.08295440673828125, -0.071441650390625, -0.05992889404296875, -0.0484161376953125, -0.03690338134765625, -0.025390625, -0.01387786865234375, -0.0023651123046875, 0.00914764404296875, 0.020660400390625, 0.03217315673828125, 0.0436859130859375, 0.05519866943359375, 0.06671142578125, 0.07822418212890625, 0.0897369384765625, 0.10124969482421875, 0.112762451171875, 0.12427520751953125, 0.1357879638671875, 0.14730072021484375, 0.1588134765625, 0.17032623291015625, 0.1818389892578125, 0.19335174560546875, 0.204864501953125, 0.21637725830078125, 0.2278900146484375, 0.23940277099609375, 0.25091552734375, 0.26242828369140625, 0.2739410400390625, 0.28545379638671875, 0.296966552734375, 0.30847930908203125, 0.3199920654296875, 0.33150482177734375, 0.343017578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 8.0, 16.0, 47.0, 68.0, 148.0, 2850.0, 600.0, 130.0, 56.0, 38.0, 14.0, 19.0, 15.0, 8.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1231689453125, -0.1195383071899414, -0.11590766906738281, -0.11227703094482422, -0.10864639282226562, -0.10501575469970703, -0.10138511657714844, -0.09775447845458984, -0.09412384033203125, -0.09049320220947266, -0.08686256408691406, -0.08323192596435547, -0.07960128784179688, -0.07597064971923828, -0.07234001159667969, -0.0687093734741211, -0.0650787353515625, -0.061448097229003906, -0.05781745910644531, -0.05418682098388672, -0.050556182861328125, -0.04692554473876953, -0.04329490661621094, -0.039664268493652344, -0.03603363037109375, -0.032402992248535156, -0.028772354125976562, -0.02514171600341797, -0.021511077880859375, -0.01788043975830078, -0.014249801635742188, -0.010619163513183594, -0.006988525390625, -0.0033578872680664062, 0.0002727508544921875, 0.0039033889770507812, 0.007534027099609375, 0.011164665222167969, 0.014795303344726562, 0.018425941467285156, 0.02205657958984375, 0.025687217712402344, 0.029317855834960938, 0.03294849395751953, 0.036579132080078125, 0.04020977020263672, 0.04384040832519531, 0.047471046447753906, 0.0511016845703125, 0.054732322692871094, 0.05836296081542969, 0.06199359893798828, 0.06562423706054688, 0.06925487518310547, 0.07288551330566406, 0.07651615142822266, 0.08014678955078125, 0.08377742767333984, 0.08740806579589844, 0.09103870391845703, 0.09466934204101562, 0.09829998016357422, 0.10193061828613281, 0.1055612564086914, 0.10919189453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 11.0, 14.0, 22.0, 48.0, 87.0, 118.0, 132.0, 143.0, 151.0, 86.0, 74.0, 47.0, 24.0, 14.0, 13.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.664283275604248, -0.6442078351974487, -0.6241323947906494, -0.6040569543838501, -0.5839815139770508, -0.5639060735702515, -0.5438306331634521, -0.5237551927566528, -0.5036797523498535, -0.4836043119430542, -0.4635288715362549, -0.44345343112945557, -0.42337799072265625, -0.40330255031585693, -0.38322708010673523, -0.3631516396999359, -0.3430761694908142, -0.3230007290840149, -0.3029252886772156, -0.28284984827041626, -0.26277440786361694, -0.24269895255565643, -0.22262349724769592, -0.2025480568408966, -0.1824726164340973, -0.16239717602729797, -0.14232173562049866, -0.12224628031253815, -0.10217083990573883, -0.08209539949893951, -0.0620199516415596, -0.04194450378417969, -0.02186906337738037, -0.0017936192452907562, 0.01828182488679886, 0.038357269018888474, 0.05843271315097809, 0.0785081535577774, 0.09858360141515732, 0.11865904927253723, 0.13873448967933655, 0.15880993008613586, 0.17888537049293518, 0.1989608258008957, 0.219036266207695, 0.23911170661449432, 0.25918716192245483, 0.27926260232925415, 0.29933804273605347, 0.3194134831428528, 0.3394889235496521, 0.3595643639564514, 0.37963980436325073, 0.39971524477005005, 0.41979071497917175, 0.43986615538597107, 0.4599415957927704, 0.4800170361995697, 0.5000925064086914, 0.5201679468154907, 0.54024338722229, 0.5603188276290894, 0.5803942680358887, 0.600469708442688, 0.6205451488494873]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 18.0, 6.0, 17.0, 16.0, 17.0, 30.0, 30.0, 28.0, 30.0, 53.0, 46.0, 41.0, 45.0, 53.0, 40.0, 51.0, 54.0, 40.0, 34.0, 37.0, 36.0, 30.0, 36.0, 24.0, 21.0, 23.0, 19.0, 20.0, 15.0, 16.0, 8.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24712252616882324, -0.23897069692611694, -0.23081886768341064, -0.22266703844070435, -0.21451520919799805, -0.20636337995529175, -0.19821156561374664, -0.19005973637104034, -0.18190790712833405, -0.17375607788562775, -0.16560424864292145, -0.15745241940021515, -0.14930060505867004, -0.14114877581596375, -0.13299694657325745, -0.12484511733055115, -0.11669328808784485, -0.10854145884513855, -0.10038962960243225, -0.09223780781030655, -0.08408597856760025, -0.07593414932489395, -0.06778232753276825, -0.05963049829006195, -0.05147866904735565, -0.04332683980464935, -0.03517501428723335, -0.027023186907172203, -0.018871359527111053, -0.010719530284404755, -0.0025677047669887543, 0.005584120750427246, 0.013735949993133545, 0.021887777373194695, 0.030039604753255844, 0.038191430270671844, 0.04634325951337814, 0.05449508875608444, 0.06264691054821014, 0.07079873979091644, 0.07895056903362274, 0.08710239827632904, 0.09525422751903534, 0.10340604931116104, 0.11155787855386734, 0.11970970779657364, 0.12786152958869934, 0.13601335883140564, 0.14416518807411194, 0.15231701731681824, 0.16046884655952454, 0.16862067580223083, 0.17677250504493713, 0.18492433428764343, 0.19307614862918854, 0.20122797787189484, 0.20937980711460114, 0.21753163635730743, 0.22568346560001373, 0.23383529484272003, 0.24198710918426514, 0.25013893842697144, 0.25829076766967773, 0.26644259691238403, 0.27459442615509033]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 7.0, 23.0, 33.0, 45.0, 56.0, 109.0, 131.0, 215.0, 352.0, 594.0, 985.0, 1821.0, 3743.0, 7604.0, 16482.0, 38018.0, 87788.0, 197588.0, 308220.0, 211601.0, 96561.0, 41579.0, 17920.0, 8363.0, 3890.0, 2053.0, 1128.0, 612.0, 369.0, 240.0, 149.0, 85.0, 52.0, 37.0, 33.0, 21.0, 6.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13544654846191406, -0.13014602661132812, -0.12484550476074219, -0.11954498291015625, -0.11424446105957031, -0.10894393920898438, -0.10364341735839844, -0.0983428955078125, -0.09304237365722656, -0.08774185180664062, -0.08244132995605469, -0.07714080810546875, -0.07184028625488281, -0.06653976440429688, -0.06123924255371094, -0.055938720703125, -0.05063819885253906, -0.045337677001953125, -0.04003715515136719, -0.03473663330078125, -0.029436111450195312, -0.024135589599609375, -0.018835067749023438, -0.0135345458984375, -0.008234024047851562, -0.002933502197265625, 0.0023670196533203125, 0.00766754150390625, 0.012968063354492188, 0.018268585205078125, 0.023569107055664062, 0.02886962890625, 0.03417015075683594, 0.039470672607421875, 0.04477119445800781, 0.05007171630859375, 0.05537223815917969, 0.060672760009765625, 0.06597328186035156, 0.0712738037109375, 0.07657432556152344, 0.08187484741210938, 0.08717536926269531, 0.09247589111328125, 0.09777641296386719, 0.10307693481445312, 0.10837745666503906, 0.113677978515625, 0.11897850036621094, 0.12427902221679688, 0.1295795440673828, 0.13488006591796875, 0.1401805877685547, 0.14548110961914062, 0.15078163146972656, 0.1560821533203125, 0.16138267517089844, 0.16668319702148438, 0.1719837188720703, 0.17728424072265625, 0.1825847625732422, 0.18788528442382812, 0.19318580627441406, 0.198486328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 9.0, 11.0, 22.0, 14.0, 26.0, 24.0, 36.0, 33.0, 42.0, 37.0, 56.0, 52.0, 60.0, 48.0, 66.0, 54.0, 55.0, 58.0, 47.0, 49.0, 37.0, 35.0, 24.0, 28.0, 14.0, 15.0, 8.0, 5.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1072998046875, -0.10440826416015625, -0.1015167236328125, -0.09862518310546875, -0.095733642578125, -0.09284210205078125, -0.0899505615234375, -0.08705902099609375, -0.08416748046875, -0.08127593994140625, -0.0783843994140625, -0.07549285888671875, -0.072601318359375, -0.06970977783203125, -0.0668182373046875, -0.06392669677734375, -0.06103515625, -0.05814361572265625, -0.0552520751953125, -0.05236053466796875, -0.049468994140625, -0.04657745361328125, -0.0436859130859375, -0.04079437255859375, -0.03790283203125, -0.03501129150390625, -0.0321197509765625, -0.02922821044921875, -0.026336669921875, -0.02344512939453125, -0.0205535888671875, -0.01766204833984375, -0.0147705078125, -0.01187896728515625, -0.0089874267578125, -0.00609588623046875, -0.003204345703125, -0.00031280517578125, 0.0025787353515625, 0.00547027587890625, 0.00836181640625, 0.01125335693359375, 0.0141448974609375, 0.01703643798828125, 0.019927978515625, 0.02281951904296875, 0.0257110595703125, 0.02860260009765625, 0.031494140625, 0.03438568115234375, 0.0372772216796875, 0.04016876220703125, 0.043060302734375, 0.04595184326171875, 0.0488433837890625, 0.05173492431640625, 0.05462646484375, 0.05751800537109375, 0.0604095458984375, 0.06330108642578125, 0.066192626953125, 0.06908416748046875, 0.0719757080078125, 0.07486724853515625, 0.0777587890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 18.0, 19.0, 18.0, 30.0, 34.0, 81.0, 108.0, 154.0, 233.0, 378.0, 619.0, 1224.0, 2945.0, 10044.0, 59200.0, 529415.0, 388520.0, 42346.0, 7963.0, 2539.0, 1062.0, 561.0, 362.0, 215.0, 137.0, 109.0, 63.0, 47.0, 23.0, 19.0, 19.0, 11.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4365234375, -0.42436981201171875, -0.4122161865234375, -0.40006256103515625, -0.387908935546875, -0.37575531005859375, -0.3636016845703125, -0.35144805908203125, -0.33929443359375, -0.32714080810546875, -0.3149871826171875, -0.30283355712890625, -0.290679931640625, -0.27852630615234375, -0.2663726806640625, -0.25421905517578125, -0.2420654296875, -0.22991180419921875, -0.2177581787109375, -0.20560455322265625, -0.193450927734375, -0.18129730224609375, -0.1691436767578125, -0.15699005126953125, -0.14483642578125, -0.13268280029296875, -0.1205291748046875, -0.10837554931640625, -0.096221923828125, -0.08406829833984375, -0.0719146728515625, -0.05976104736328125, -0.047607421875, -0.03545379638671875, -0.0233001708984375, -0.01114654541015625, 0.001007080078125, 0.01316070556640625, 0.0253143310546875, 0.03746795654296875, 0.04962158203125, 0.06177520751953125, 0.0739288330078125, 0.08608245849609375, 0.098236083984375, 0.11038970947265625, 0.1225433349609375, 0.13469696044921875, 0.1468505859375, 0.15900421142578125, 0.1711578369140625, 0.18331146240234375, 0.195465087890625, 0.20761871337890625, 0.2197723388671875, 0.23192596435546875, 0.24407958984375, 0.25623321533203125, 0.2683868408203125, 0.28054046630859375, 0.292694091796875, 0.30484771728515625, 0.3170013427734375, 0.32915496826171875, 0.34130859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 6.0, 6.0, 5.0, 9.0, 8.0, 9.0, 16.0, 22.0, 25.0, 29.0, 24.0, 38.0, 37.0, 38.0, 48.0, 45.0, 45.0, 69.0, 58.0, 50.0, 57.0, 44.0, 43.0, 46.0, 44.0, 43.0, 30.0, 24.0, 15.0, 21.0, 6.0, 7.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373046875, -0.3598518371582031, -0.34665679931640625, -0.3334617614746094, -0.3202667236328125, -0.3070716857910156, -0.29387664794921875, -0.2806816101074219, -0.267486572265625, -0.2542915344238281, -0.24109649658203125, -0.22790145874023438, -0.2147064208984375, -0.20151138305664062, -0.18831634521484375, -0.17512130737304688, -0.16192626953125, -0.14873123168945312, -0.13553619384765625, -0.12234115600585938, -0.1091461181640625, -0.09595108032226562, -0.08275604248046875, -0.06956100463867188, -0.056365966796875, -0.043170928955078125, -0.02997589111328125, -0.016780853271484375, -0.0035858154296875, 0.009609222412109375, 0.02280426025390625, 0.035999298095703125, 0.0491943359375, 0.062389373779296875, 0.07558441162109375, 0.08877944946289062, 0.1019744873046875, 0.11516952514648438, 0.12836456298828125, 0.14155960083007812, 0.154754638671875, 0.16794967651367188, 0.18114471435546875, 0.19433975219726562, 0.2075347900390625, 0.22072982788085938, 0.23392486572265625, 0.24711990356445312, 0.26031494140625, 0.2735099792480469, 0.28670501708984375, 0.2999000549316406, 0.3130950927734375, 0.3262901306152344, 0.33948516845703125, 0.3526802062988281, 0.365875244140625, 0.3790702819824219, 0.39226531982421875, 0.4054603576660156, 0.4186553955078125, 0.4318504333496094, 0.44504547119140625, 0.4582405090332031, 0.471435546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 21.0, 47.0, 75.0, 198.0, 540.0, 2009.0, 14450.0, 642892.0, 376146.0, 9828.0, 1518.0, 471.0, 178.0, 85.0, 36.0, 15.0, 12.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.4274482727050781, -0.41446685791015625, -0.4014854431152344, -0.3885040283203125, -0.3755226135253906, -0.36254119873046875, -0.3495597839355469, -0.336578369140625, -0.3235969543457031, -0.31061553955078125, -0.2976341247558594, -0.2846527099609375, -0.2716712951660156, -0.25868988037109375, -0.24570846557617188, -0.23272705078125, -0.21974563598632812, -0.20676422119140625, -0.19378280639648438, -0.1808013916015625, -0.16781997680664062, -0.15483856201171875, -0.14185714721679688, -0.128875732421875, -0.11589431762695312, -0.10291290283203125, -0.08993148803710938, -0.0769500732421875, -0.06396865844726562, -0.05098724365234375, -0.038005828857421875, -0.0250244140625, -0.012042999267578125, 0.00093841552734375, 0.013919830322265625, 0.0269012451171875, 0.039882659912109375, 0.05286407470703125, 0.06584548950195312, 0.078826904296875, 0.09180831909179688, 0.10478973388671875, 0.11777114868164062, 0.1307525634765625, 0.14373397827148438, 0.15671539306640625, 0.16969680786132812, 0.18267822265625, 0.19565963745117188, 0.20864105224609375, 0.22162246704101562, 0.2346038818359375, 0.24758529663085938, 0.26056671142578125, 0.2735481262207031, 0.286529541015625, 0.2995109558105469, 0.31249237060546875, 0.3254737854003906, 0.3384552001953125, 0.3514366149902344, 0.36441802978515625, 0.3773994445800781, 0.390380859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 15.0, 11.0, 16.0, 16.0, 40.0, 39.0, 52.0, 68.0, 92.0, 83.0, 91.0, 86.0, 80.0, 70.0, 51.0, 55.0, 43.0, 25.0, 13.0, 15.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7147274017333984e-05, -4.5076943933963776e-05, -4.300661385059357e-05, -4.093628376722336e-05, -3.886595368385315e-05, -3.679562360048294e-05, -3.472529351711273e-05, -3.265496343374252e-05, -3.0584633350372314e-05, -2.8514303267002106e-05, -2.6443973183631897e-05, -2.4373643100261688e-05, -2.230331301689148e-05, -2.023298293352127e-05, -1.8162652850151062e-05, -1.6092322766780853e-05, -1.4021992683410645e-05, -1.1951662600040436e-05, -9.881332516670227e-06, -7.811002433300018e-06, -5.7406723499298096e-06, -3.670342266559601e-06, -1.600012183189392e-06, 4.7031790018081665e-07, 2.5406479835510254e-06, 4.610978066921234e-06, 6.681308150291443e-06, 8.751638233661652e-06, 1.082196831703186e-05, 1.2892298400402069e-05, 1.4962628483772278e-05, 1.7032958567142487e-05, 1.9103288650512695e-05, 2.1173618733882904e-05, 2.3243948817253113e-05, 2.531427890062332e-05, 2.738460898399353e-05, 2.945493906736374e-05, 3.152526915073395e-05, 3.3595599234104156e-05, 3.5665929317474365e-05, 3.7736259400844574e-05, 3.980658948421478e-05, 4.187691956758499e-05, 4.39472496509552e-05, 4.601757973432541e-05, 4.808790981769562e-05, 5.0158239901065826e-05, 5.2228569984436035e-05, 5.4298900067806244e-05, 5.636923015117645e-05, 5.843956023454666e-05, 6.050989031791687e-05, 6.258022040128708e-05, 6.465055048465729e-05, 6.67208805680275e-05, 6.87912106513977e-05, 7.086154073476791e-05, 7.293187081813812e-05, 7.500220090150833e-05, 7.707253098487854e-05, 7.914286106824875e-05, 8.121319115161896e-05, 8.328352123498917e-05, 8.535385131835938e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 12.0, 14.0, 36.0, 53.0, 101.0, 165.0, 338.0, 678.0, 1579.0, 4947.0, 23800.0, 269719.0, 667135.0, 66208.0, 9217.0, 2594.0, 984.0, 424.0, 236.0, 123.0, 66.0, 39.0, 17.0, 13.0, 8.0, 11.0, 9.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21076583862304688, -0.20302581787109375, -0.19528579711914062, -0.1875457763671875, -0.17980575561523438, -0.17206573486328125, -0.16432571411132812, -0.156585693359375, -0.14884567260742188, -0.14110565185546875, -0.13336563110351562, -0.1256256103515625, -0.11788558959960938, -0.11014556884765625, -0.10240554809570312, -0.09466552734375, -0.08692550659179688, -0.07918548583984375, -0.07144546508789062, -0.0637054443359375, -0.055965423583984375, -0.04822540283203125, -0.040485382080078125, -0.032745361328125, -0.025005340576171875, -0.01726531982421875, -0.009525299072265625, -0.0017852783203125, 0.005954742431640625, 0.01369476318359375, 0.021434783935546875, 0.0291748046875, 0.036914825439453125, 0.04465484619140625, 0.052394866943359375, 0.0601348876953125, 0.06787490844726562, 0.07561492919921875, 0.08335494995117188, 0.091094970703125, 0.09883499145507812, 0.10657501220703125, 0.11431503295898438, 0.1220550537109375, 0.12979507446289062, 0.13753509521484375, 0.14527511596679688, 0.15301513671875, 0.16075515747070312, 0.16849517822265625, 0.17623519897460938, 0.1839752197265625, 0.19171524047851562, 0.19945526123046875, 0.20719528198242188, 0.214935302734375, 0.22267532348632812, 0.23041534423828125, 0.23815536499023438, 0.2458953857421875, 0.2536354064941406, 0.26137542724609375, 0.2691154479980469, 0.27685546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 14.0, 19.0, 30.0, 38.0, 46.0, 58.0, 72.0, 85.0, 62.0, 85.0, 91.0, 72.0, 69.0, 51.0, 44.0, 32.0, 35.0, 26.0, 14.0, 8.0, 9.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.151947021484375, -0.14654541015625, -0.141143798828125, -0.1357421875, -0.130340576171875, -0.12493896484375, -0.119537353515625, -0.1141357421875, -0.108734130859375, -0.10333251953125, -0.097930908203125, -0.092529296875, -0.087127685546875, -0.08172607421875, -0.076324462890625, -0.0709228515625, -0.065521240234375, -0.06011962890625, -0.054718017578125, -0.04931640625, -0.043914794921875, -0.03851318359375, -0.033111572265625, -0.0277099609375, -0.022308349609375, -0.01690673828125, -0.011505126953125, -0.006103515625, -0.000701904296875, 0.00469970703125, 0.010101318359375, 0.0155029296875, 0.020904541015625, 0.02630615234375, 0.031707763671875, 0.037109375, 0.042510986328125, 0.04791259765625, 0.053314208984375, 0.0587158203125, 0.064117431640625, 0.06951904296875, 0.074920654296875, 0.080322265625, 0.085723876953125, 0.09112548828125, 0.096527099609375, 0.1019287109375, 0.107330322265625, 0.11273193359375, 0.118133544921875, 0.12353515625, 0.128936767578125, 0.13433837890625, 0.139739990234375, 0.1451416015625, 0.150543212890625, 0.15594482421875, 0.161346435546875, 0.166748046875, 0.172149658203125, 0.17755126953125, 0.182952880859375, 0.1883544921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 15.0, 39.0, 124.0, 237.0, 274.0, 190.0, 79.0, 29.0, 9.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.918266534805298, -2.739671468734741, -2.5610766410827637, -2.382481575012207, -2.2038865089416504, -2.025291681289673, -1.8466966152191162, -1.6681016683578491, -1.489506721496582, -1.310911774635315, -1.1323168277740479, -0.9537217617034912, -0.7751268148422241, -0.596531867980957, -0.4179368019104004, -0.2393418550491333, -0.06074690818786621, 0.11784806847572327, 0.29644304513931274, 0.4750380516052246, 0.6536329984664917, 0.8322279453277588, 1.0108230113983154, 1.1894179582595825, 1.3680129051208496, 1.5466078519821167, 1.7252027988433838, 1.9037978649139404, 2.082392692565918, 2.2609877586364746, 2.4395828247070312, 2.618177890777588, 2.7967729568481445, 2.975368022918701, 3.1539628505706787, 3.3325579166412354, 3.511152744293213, 3.6897478103637695, 3.868342876434326, 4.046937942504883, 4.225532531738281, 4.404127597808838, 4.5827226638793945, 4.761317253112793, 4.93991231918335, 5.118507385253906, 5.297102451324463, 5.4756975173950195, 5.654292583465576, 5.832887649536133, 6.0114827156066895, 6.190077781677246, 6.3686723709106445, 6.547267436981201, 6.725862503051758, 6.9044575691223145, 7.083052635192871, 7.261647701263428, 7.440242767333984, 7.618837356567383, 7.7974324226379395, 7.976027488708496, 8.154623031616211, 8.33321762084961, 8.511812210083008]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 1.0, 9.0, 3.0, 8.0, 1.0, 12.0, 17.0, 11.0, 13.0, 11.0, 16.0, 24.0, 39.0, 25.0, 39.0, 46.0, 60.0, 55.0, 68.0, 45.0, 47.0, 59.0, 57.0, 60.0, 44.0, 30.0, 25.0, 25.0, 24.0, 25.0, 25.0, 18.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0916075706481934, -2.0315911769866943, -1.9715749025344849, -1.9115585088729858, -1.8515422344207764, -1.7915258407592773, -1.7315094470977783, -1.6714931726455688, -1.6114768981933594, -1.5514605045318604, -1.4914442300796509, -1.4314278364181519, -1.3714115619659424, -1.3113951683044434, -1.2513787746429443, -1.1913625001907349, -1.1313461065292358, -1.0713297128677368, -1.0113134384155273, -0.9512970447540283, -0.8912807703018188, -0.8312643766403198, -0.7712480425834656, -0.7112317085266113, -0.6512153744697571, -0.5911990404129028, -0.5311827063560486, -0.47116634249687195, -0.4111500084400177, -0.35113367438316345, -0.2911173105239868, -0.23110097646713257, -0.17108476161956787, -0.11106842011213303, -0.05105207860469818, 0.00896427035331726, 0.06898060441017151, 0.12899693846702576, 0.1890133023262024, 0.24902963638305664, 0.3090459704399109, 0.36906230449676514, 0.4290786385536194, 0.489095002412796, 0.5491113662719727, 0.6091276407241821, 0.6691440343856812, 0.7291603684425354, 0.7891767024993896, 0.8491930365562439, 0.9092093706130981, 0.9692257642745972, 1.0292420387268066, 1.0892584323883057, 1.1492748260498047, 1.2092911005020142, 1.2693073749542236, 1.3293237686157227, 1.3893400430679321, 1.4493564367294312, 1.5093727111816406, 1.5693891048431396, 1.6294054985046387, 1.6894217729568481, 1.7494381666183472]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 7.0, 9.0, 10.0, 16.0, 29.0, 30.0, 49.0, 103.0, 143.0, 158.0, 274.0, 462.0, 736.0, 1091.0, 1945.0, 3624.0, 7609.0, 20463.0, 202115.0, 3909827.0, 26883.0, 8878.0, 4129.0, 2178.0, 1303.0, 826.0, 476.0, 278.0, 189.0, 135.0, 91.0, 50.0, 53.0, 37.0, 19.0, 20.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3446311950683594, -0.33354949951171875, -0.3224678039550781, -0.3113861083984375, -0.3003044128417969, -0.28922271728515625, -0.2781410217285156, -0.267059326171875, -0.2559776306152344, -0.24489593505859375, -0.23381423950195312, -0.2227325439453125, -0.21165084838867188, -0.20056915283203125, -0.18948745727539062, -0.17840576171875, -0.16732406616210938, -0.15624237060546875, -0.14516067504882812, -0.1340789794921875, -0.12299728393554688, -0.11191558837890625, -0.10083389282226562, -0.089752197265625, -0.07867050170898438, -0.06758880615234375, -0.056507110595703125, -0.0454254150390625, -0.034343719482421875, -0.02326202392578125, -0.012180328369140625, -0.0010986328125, 0.009983062744140625, 0.02106475830078125, 0.032146453857421875, 0.0432281494140625, 0.054309844970703125, 0.06539154052734375, 0.07647323608398438, 0.087554931640625, 0.09863662719726562, 0.10971832275390625, 0.12080001831054688, 0.1318817138671875, 0.14296340942382812, 0.15404510498046875, 0.16512680053710938, 0.17620849609375, 0.18729019165039062, 0.19837188720703125, 0.20945358276367188, 0.2205352783203125, 0.23161697387695312, 0.24269866943359375, 0.2537803649902344, 0.264862060546875, 0.2759437561035156, 0.28702545166015625, 0.2981071472167969, 0.3091888427734375, 0.3202705383300781, 0.33135223388671875, 0.3424339294433594, 0.353515625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 1.0, 9.0, 16.0, 9.0, 22.0, 22.0, 24.0, 40.0, 58.0, 51.0, 69.0, 56.0, 64.0, 83.0, 71.0, 70.0, 71.0, 63.0, 51.0, 41.0, 29.0, 22.0, 13.0, 13.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1357421875, -0.13199329376220703, -0.12824440002441406, -0.1244955062866211, -0.12074661254882812, -0.11699771881103516, -0.11324882507324219, -0.10949993133544922, -0.10575103759765625, -0.10200214385986328, -0.09825325012207031, -0.09450435638427734, -0.09075546264648438, -0.0870065689086914, -0.08325767517089844, -0.07950878143310547, -0.0757598876953125, -0.07201099395751953, -0.06826210021972656, -0.0645132064819336, -0.060764312744140625, -0.057015419006347656, -0.05326652526855469, -0.04951763153076172, -0.04576873779296875, -0.04201984405517578, -0.03827095031738281, -0.034522056579589844, -0.030773162841796875, -0.027024269104003906, -0.023275375366210938, -0.01952648162841797, -0.015777587890625, -0.012028694152832031, -0.008279800415039062, -0.004530906677246094, -0.000782012939453125, 0.0029668807983398438, 0.0067157745361328125, 0.010464668273925781, 0.01421356201171875, 0.01796245574951172, 0.021711349487304688, 0.025460243225097656, 0.029209136962890625, 0.032958030700683594, 0.03670692443847656, 0.04045581817626953, 0.0442047119140625, 0.04795360565185547, 0.05170249938964844, 0.055451393127441406, 0.059200286865234375, 0.06294918060302734, 0.06669807434082031, 0.07044696807861328, 0.07419586181640625, 0.07794475555419922, 0.08169364929199219, 0.08544254302978516, 0.08919143676757812, 0.0929403305053711, 0.09668922424316406, 0.10043811798095703, 0.10418701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 14.0, 16.0, 10.0, 14.0, 27.0, 34.0, 47.0, 63.0, 99.0, 203.0, 308.0, 623.0, 1210.0, 2920.0, 8810.0, 44650.0, 4049976.0, 67641.0, 11191.0, 3428.0, 1445.0, 644.0, 339.0, 182.0, 108.0, 69.0, 58.0, 30.0, 23.0, 15.0, 17.0, 14.0, 13.0, 8.0, 11.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50830078125, -0.48987579345703125, -0.4714508056640625, -0.45302581787109375, -0.434600830078125, -0.41617584228515625, -0.3977508544921875, -0.37932586669921875, -0.36090087890625, -0.34247589111328125, -0.3240509033203125, -0.30562591552734375, -0.287200927734375, -0.26877593994140625, -0.2503509521484375, -0.23192596435546875, -0.2135009765625, -0.19507598876953125, -0.1766510009765625, -0.15822601318359375, -0.139801025390625, -0.12137603759765625, -0.1029510498046875, -0.08452606201171875, -0.06610107421875, -0.04767608642578125, -0.0292510986328125, -0.01082611083984375, 0.007598876953125, 0.02602386474609375, 0.0444488525390625, 0.06287384033203125, 0.081298828125, 0.09972381591796875, 0.1181488037109375, 0.13657379150390625, 0.154998779296875, 0.17342376708984375, 0.1918487548828125, 0.21027374267578125, 0.22869873046875, 0.24712371826171875, 0.2655487060546875, 0.28397369384765625, 0.302398681640625, 0.32082366943359375, 0.3392486572265625, 0.35767364501953125, 0.3760986328125, 0.39452362060546875, 0.4129486083984375, 0.43137359619140625, 0.449798583984375, 0.46822357177734375, 0.4866485595703125, 0.5050735473632812, 0.52349853515625, 0.5419235229492188, 0.5603485107421875, 0.5787734985351562, 0.597198486328125, 0.6156234741210938, 0.6340484619140625, 0.6524734497070312, 0.6708984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 11.0, 14.0, 27.0, 54.0, 151.0, 3472.0, 193.0, 60.0, 20.0, 18.0, 10.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07776165008544922, -0.07379722595214844, -0.06983280181884766, -0.06586837768554688, -0.061903953552246094, -0.05793952941894531, -0.05397510528564453, -0.05001068115234375, -0.04604625701904297, -0.04208183288574219, -0.038117408752441406, -0.034152984619140625, -0.030188560485839844, -0.026224136352539062, -0.02225971221923828, -0.0182952880859375, -0.014330863952636719, -0.010366439819335938, -0.006402015686035156, -0.002437591552734375, 0.0015268325805664062, 0.0054912567138671875, 0.009455680847167969, 0.01342010498046875, 0.01738452911376953, 0.021348953247070312, 0.025313377380371094, 0.029277801513671875, 0.033242225646972656, 0.03720664978027344, 0.04117107391357422, 0.045135498046875, 0.04909992218017578, 0.05306434631347656, 0.057028770446777344, 0.060993194580078125, 0.0649576187133789, 0.06892204284667969, 0.07288646697998047, 0.07685089111328125, 0.08081531524658203, 0.08477973937988281, 0.0887441635131836, 0.09270858764648438, 0.09667301177978516, 0.10063743591308594, 0.10460186004638672, 0.1085662841796875, 0.11253070831298828, 0.11649513244628906, 0.12045955657958984, 0.12442398071289062, 0.1283884048461914, 0.1323528289794922, 0.13631725311279297, 0.14028167724609375, 0.14424610137939453, 0.1482105255126953, 0.1521749496459961, 0.15613937377929688, 0.16010379791259766, 0.16406822204589844, 0.16803264617919922, 0.1719970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 15.0, 27.0, 47.0, 73.0, 103.0, 128.0, 145.0, 133.0, 117.0, 74.0, 53.0, 33.0, 19.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5267080664634705, -0.5120776891708374, -0.49744731187820435, -0.4828169345855713, -0.4681865870952606, -0.45355620980262756, -0.4389258325099945, -0.42429545521736145, -0.4096651077270508, -0.3950347304344177, -0.38040435314178467, -0.3657739758491516, -0.35114362835884094, -0.3365132510662079, -0.32188287377357483, -0.3072524964809418, -0.2926221191883087, -0.27799174189567566, -0.2633613646030426, -0.24873100221157074, -0.23410063982009888, -0.21947026252746582, -0.20483988523483276, -0.1902095079421997, -0.17557914555072784, -0.1609487682580948, -0.14631840586662292, -0.13168802857398987, -0.11705765873193741, -0.10242728888988495, -0.08779691159725189, -0.07316654175519943, -0.05853617191314697, -0.04390580207109451, -0.029275428503751755, -0.014645054936408997, -1.4685094356536865e-05, 0.014615684747695923, 0.02924606204032898, 0.04387643188238144, 0.0585068017244339, 0.07313717156648636, 0.08776754140853882, 0.10239791870117188, 0.11702828854322433, 0.1316586583852768, 0.14628903567790985, 0.1609193980693817, 0.17554977536201477, 0.19018015265464783, 0.2048105150461197, 0.21944089233875275, 0.2340712547302246, 0.24870163202285767, 0.2633320093154907, 0.2779623866081238, 0.29259276390075684, 0.3072231411933899, 0.32185351848602295, 0.336483895778656, 0.3511142432689667, 0.36574462056159973, 0.3803749978542328, 0.39500537514686584, 0.4096357226371765]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 7.0, 7.0, 19.0, 9.0, 22.0, 20.0, 14.0, 30.0, 34.0, 31.0, 30.0, 41.0, 38.0, 35.0, 51.0, 48.0, 38.0, 40.0, 41.0, 29.0, 39.0, 41.0, 29.0, 37.0, 32.0, 30.0, 27.0, 22.0, 22.0, 20.0, 14.0, 15.0, 18.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.17311352491378784, -0.16769325733184814, -0.16227300465106964, -0.15685273706912994, -0.15143248438835144, -0.14601221680641174, -0.14059194922447205, -0.13517168164253235, -0.12975142896175385, -0.12433116883039474, -0.11891090869903564, -0.11349064111709595, -0.10807038098573685, -0.10265012085437775, -0.09722985327243805, -0.09180959314107895, -0.08638933300971985, -0.08096907287836075, -0.07554881274700165, -0.07012854516506195, -0.06470828503370285, -0.05928802490234375, -0.05386776104569435, -0.04844749718904495, -0.04302723705768585, -0.03760697692632675, -0.03218671306967735, -0.026766451075673103, -0.021346189081668854, -0.015925927087664604, -0.010505665093660355, -0.005085401237010956, 0.00033485889434814453, 0.005755120888352394, 0.011175382882356644, 0.016595644876360893, 0.022015906870365143, 0.027436168864369392, 0.03285643085837364, 0.03827669471502304, 0.04369695484638214, 0.04911721497774124, 0.05453747883439064, 0.05995774269104004, 0.06537800282239914, 0.07079826295375824, 0.07621853053569794, 0.08163879066705704, 0.08705905079841614, 0.09247931092977524, 0.09789957106113434, 0.10331983864307404, 0.10874009877443314, 0.11416035890579224, 0.11958062648773193, 0.12500089406967163, 0.13042114675045013, 0.13584141433238983, 0.14126166701316833, 0.14668193459510803, 0.15210220217704773, 0.15752245485782623, 0.16294272243976593, 0.16836297512054443, 0.17378324270248413]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 4.0, 16.0, 21.0, 38.0, 40.0, 47.0, 69.0, 100.0, 175.0, 267.0, 451.0, 734.0, 1372.0, 2626.0, 4945.0, 9900.0, 20527.0, 42985.0, 93802.0, 210456.0, 319126.0, 184503.0, 81910.0, 37977.0, 17813.0, 8854.0, 4378.0, 2205.0, 1268.0, 736.0, 437.0, 243.0, 176.0, 106.0, 77.0, 49.0, 32.0, 17.0, 17.0, 12.0, 8.0, 4.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14276695251464844, -0.13807296752929688, -0.1333789825439453, -0.12868499755859375, -0.12399101257324219, -0.11929702758789062, -0.11460304260253906, -0.1099090576171875, -0.10521507263183594, -0.10052108764648438, -0.09582710266113281, -0.09113311767578125, -0.08643913269042969, -0.08174514770507812, -0.07705116271972656, -0.072357177734375, -0.06766319274902344, -0.06296920776367188, -0.05827522277832031, -0.05358123779296875, -0.04888725280761719, -0.044193267822265625, -0.03949928283691406, -0.0348052978515625, -0.030111312866210938, -0.025417327880859375, -0.020723342895507812, -0.01602935791015625, -0.011335372924804688, -0.006641387939453125, -0.0019474029541015625, 0.00274658203125, 0.0074405670166015625, 0.012134552001953125, 0.016828536987304688, 0.02152252197265625, 0.026216506958007812, 0.030910491943359375, 0.03560447692871094, 0.0402984619140625, 0.04499244689941406, 0.049686431884765625, 0.05438041687011719, 0.05907440185546875, 0.06376838684082031, 0.06846237182617188, 0.07315635681152344, 0.077850341796875, 0.08254432678222656, 0.08723831176757812, 0.09193229675292969, 0.09662628173828125, 0.10132026672363281, 0.10601425170898438, 0.11070823669433594, 0.1154022216796875, 0.12009620666503906, 0.12479019165039062, 0.1294841766357422, 0.13417816162109375, 0.1388721466064453, 0.14356613159179688, 0.14826011657714844, 0.1529541015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 10.0, 14.0, 14.0, 20.0, 27.0, 24.0, 36.0, 52.0, 62.0, 59.0, 86.0, 83.0, 80.0, 91.0, 58.0, 55.0, 44.0, 45.0, 42.0, 30.0, 23.0, 10.0, 11.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14844894409179688, -0.14430999755859375, -0.14017105102539062, -0.1360321044921875, -0.13189315795898438, -0.12775421142578125, -0.12361526489257812, -0.119476318359375, -0.11533737182617188, -0.11119842529296875, -0.10705947875976562, -0.1029205322265625, -0.09878158569335938, -0.09464263916015625, -0.09050369262695312, -0.08636474609375, -0.08222579956054688, -0.07808685302734375, -0.07394790649414062, -0.0698089599609375, -0.06567001342773438, -0.06153106689453125, -0.057392120361328125, -0.053253173828125, -0.049114227294921875, -0.04497528076171875, -0.040836334228515625, -0.0366973876953125, -0.032558441162109375, -0.02841949462890625, -0.024280548095703125, -0.0201416015625, -0.016002655029296875, -0.01186370849609375, -0.007724761962890625, -0.0035858154296875, 0.000553131103515625, 0.00469207763671875, 0.008831024169921875, 0.012969970703125, 0.017108917236328125, 0.02124786376953125, 0.025386810302734375, 0.0295257568359375, 0.033664703369140625, 0.03780364990234375, 0.041942596435546875, 0.04608154296875, 0.050220489501953125, 0.05435943603515625, 0.058498382568359375, 0.0626373291015625, 0.06677627563476562, 0.07091522216796875, 0.07505416870117188, 0.079193115234375, 0.08333206176757812, 0.08747100830078125, 0.09160995483398438, 0.0957489013671875, 0.09988784790039062, 0.10402679443359375, 0.10816574096679688, 0.1123046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 9.0, 6.0, 5.0, 13.0, 22.0, 29.0, 40.0, 39.0, 55.0, 70.0, 107.0, 111.0, 181.0, 300.0, 422.0, 732.0, 1401.0, 3207.0, 10739.0, 52878.0, 454774.0, 453938.0, 52171.0, 10516.0, 3237.0, 1369.0, 723.0, 434.0, 294.0, 203.0, 123.0, 92.0, 86.0, 51.0, 40.0, 32.0, 33.0, 20.0, 14.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.32177734375, -0.3123130798339844, -0.30284881591796875, -0.2933845520019531, -0.2839202880859375, -0.2744560241699219, -0.26499176025390625, -0.2555274963378906, -0.246063232421875, -0.23659896850585938, -0.22713470458984375, -0.21767044067382812, -0.2082061767578125, -0.19874191284179688, -0.18927764892578125, -0.17981338500976562, -0.17034912109375, -0.16088485717773438, -0.15142059326171875, -0.14195632934570312, -0.1324920654296875, -0.12302780151367188, -0.11356353759765625, -0.10409927368164062, -0.094635009765625, -0.08517074584960938, -0.07570648193359375, -0.06624221801757812, -0.0567779541015625, -0.047313690185546875, -0.03784942626953125, -0.028385162353515625, -0.0189208984375, -0.009456634521484375, 7.62939453125e-06, 0.009471893310546875, 0.0189361572265625, 0.028400421142578125, 0.03786468505859375, 0.047328948974609375, 0.056793212890625, 0.06625747680664062, 0.07572174072265625, 0.08518600463867188, 0.0946502685546875, 0.10411453247070312, 0.11357879638671875, 0.12304306030273438, 0.13250732421875, 0.14197158813476562, 0.15143585205078125, 0.16090011596679688, 0.1703643798828125, 0.17982864379882812, 0.18929290771484375, 0.19875717163085938, 0.208221435546875, 0.21768569946289062, 0.22714996337890625, 0.23661422729492188, 0.2460784912109375, 0.2555427551269531, 0.26500701904296875, 0.2744712829589844, 0.283935546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 11.0, 10.0, 20.0, 27.0, 25.0, 34.0, 33.0, 44.0, 39.0, 50.0, 47.0, 54.0, 51.0, 49.0, 54.0, 50.0, 39.0, 41.0, 43.0, 45.0, 36.0, 32.0, 38.0, 25.0, 13.0, 9.0, 23.0, 10.0, 10.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4873046875, -0.4737281799316406, -0.46015167236328125, -0.4465751647949219, -0.4329986572265625, -0.4194221496582031, -0.40584564208984375, -0.3922691345214844, -0.378692626953125, -0.3651161193847656, -0.35153961181640625, -0.3379631042480469, -0.3243865966796875, -0.3108100891113281, -0.29723358154296875, -0.2836570739746094, -0.27008056640625, -0.2565040588378906, -0.24292755126953125, -0.22935104370117188, -0.2157745361328125, -0.20219802856445312, -0.18862152099609375, -0.17504501342773438, -0.161468505859375, -0.14789199829101562, -0.13431549072265625, -0.12073898315429688, -0.1071624755859375, -0.09358596801757812, -0.08000946044921875, -0.06643295288085938, -0.0528564453125, -0.039279937744140625, -0.02570343017578125, -0.012126922607421875, 0.0014495849609375, 0.015026092529296875, 0.02860260009765625, 0.042179107666015625, 0.055755615234375, 0.06933212280273438, 0.08290863037109375, 0.09648513793945312, 0.1100616455078125, 0.12363815307617188, 0.13721466064453125, 0.15079116821289062, 0.16436767578125, 0.17794418334960938, 0.19152069091796875, 0.20509719848632812, 0.2186737060546875, 0.23225021362304688, 0.24582672119140625, 0.2594032287597656, 0.272979736328125, 0.2865562438964844, 0.30013275146484375, 0.3137092590332031, 0.3272857666015625, 0.3408622741699219, 0.35443878173828125, 0.3680152893066406, 0.381591796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 10.0, 23.0, 71.0, 141.0, 385.0, 1476.0, 12118.0, 702824.0, 322432.0, 7437.0, 1098.0, 319.0, 101.0, 48.0, 20.0, 17.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489990234375, -0.4780120849609375, -0.466033935546875, -0.4540557861328125, -0.44207763671875, -0.4300994873046875, -0.418121337890625, -0.4061431884765625, -0.3941650390625, -0.3821868896484375, -0.370208740234375, -0.3582305908203125, -0.34625244140625, -0.3342742919921875, -0.322296142578125, -0.3103179931640625, -0.29833984375, -0.2863616943359375, -0.274383544921875, -0.2624053955078125, -0.25042724609375, -0.2384490966796875, -0.226470947265625, -0.2144927978515625, -0.2025146484375, -0.1905364990234375, -0.178558349609375, -0.1665802001953125, -0.15460205078125, -0.1426239013671875, -0.130645751953125, -0.1186676025390625, -0.106689453125, -0.0947113037109375, -0.082733154296875, -0.0707550048828125, -0.05877685546875, -0.0467987060546875, -0.034820556640625, -0.0228424072265625, -0.0108642578125, 0.0011138916015625, 0.013092041015625, 0.0250701904296875, 0.03704833984375, 0.0490264892578125, 0.061004638671875, 0.0729827880859375, 0.0849609375, 0.0969390869140625, 0.108917236328125, 0.1208953857421875, 0.13287353515625, 0.1448516845703125, 0.156829833984375, 0.1688079833984375, 0.1807861328125, 0.1927642822265625, 0.204742431640625, 0.2167205810546875, 0.22869873046875, 0.2406768798828125, 0.252655029296875, 0.2646331787109375, 0.276611328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 6.0, 4.0, 9.0, 5.0, 4.0, 6.0, 9.0, 11.0, 17.0, 13.0, 18.0, 33.0, 30.0, 60.0, 63.0, 58.0, 67.0, 97.0, 76.0, 77.0, 65.0, 57.0, 52.0, 35.0, 35.0, 20.0, 14.0, 17.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.115436553955078e-05, -5.970802158117294e-05, -5.8261677622795105e-05, -5.681533366441727e-05, -5.536898970603943e-05, -5.392264574766159e-05, -5.247630178928375e-05, -5.1029957830905914e-05, -4.9583613872528076e-05, -4.813726991415024e-05, -4.66909259557724e-05, -4.524458199739456e-05, -4.3798238039016724e-05, -4.2351894080638885e-05, -4.090555012226105e-05, -3.945920616388321e-05, -3.801286220550537e-05, -3.656651824712753e-05, -3.5120174288749695e-05, -3.367383033037186e-05, -3.222748637199402e-05, -3.078114241361618e-05, -2.9334798455238342e-05, -2.7888454496860504e-05, -2.6442110538482666e-05, -2.4995766580104828e-05, -2.354942262172699e-05, -2.210307866334915e-05, -2.0656734704971313e-05, -1.9210390746593475e-05, -1.7764046788215637e-05, -1.63177028298378e-05, -1.4871358871459961e-05, -1.3425014913082123e-05, -1.1978670954704285e-05, -1.0532326996326447e-05, -9.085983037948608e-06, -7.63963907957077e-06, -6.193295121192932e-06, -4.746951162815094e-06, -3.300607204437256e-06, -1.8542632460594177e-06, -4.079192876815796e-07, 1.0384246706962585e-06, 2.4847686290740967e-06, 3.931112587451935e-06, 5.377456545829773e-06, 6.823800504207611e-06, 8.27014446258545e-06, 9.716488420963287e-06, 1.1162832379341125e-05, 1.2609176337718964e-05, 1.4055520296096802e-05, 1.550186425447464e-05, 1.6948208212852478e-05, 1.8394552171230316e-05, 1.9840896129608154e-05, 2.1287240087985992e-05, 2.273358404636383e-05, 2.417992800474167e-05, 2.5626271963119507e-05, 2.7072615921497345e-05, 2.8518959879875183e-05, 2.996530383825302e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 12.0, 14.0, 38.0, 53.0, 78.0, 154.0, 261.0, 487.0, 1056.0, 2895.0, 10818.0, 78367.0, 701611.0, 222894.0, 22061.0, 4731.0, 1645.0, 646.0, 317.0, 176.0, 86.0, 45.0, 33.0, 18.0, 12.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2093505859375, -0.20294952392578125, -0.1965484619140625, -0.19014739990234375, -0.183746337890625, -0.17734527587890625, -0.1709442138671875, -0.16454315185546875, -0.15814208984375, -0.15174102783203125, -0.1453399658203125, -0.13893890380859375, -0.132537841796875, -0.12613677978515625, -0.1197357177734375, -0.11333465576171875, -0.10693359375, -0.10053253173828125, -0.0941314697265625, -0.08773040771484375, -0.081329345703125, -0.07492828369140625, -0.0685272216796875, -0.06212615966796875, -0.05572509765625, -0.04932403564453125, -0.0429229736328125, -0.03652191162109375, -0.030120849609375, -0.02371978759765625, -0.0173187255859375, -0.01091766357421875, -0.0045166015625, 0.00188446044921875, 0.0082855224609375, 0.01468658447265625, 0.021087646484375, 0.02748870849609375, 0.0338897705078125, 0.04029083251953125, 0.04669189453125, 0.05309295654296875, 0.0594940185546875, 0.06589508056640625, 0.072296142578125, 0.07869720458984375, 0.0850982666015625, 0.09149932861328125, 0.097900390625, 0.10430145263671875, 0.1107025146484375, 0.11710357666015625, 0.123504638671875, 0.12990570068359375, 0.1363067626953125, 0.14270782470703125, 0.14910888671875, 0.15550994873046875, 0.1619110107421875, 0.16831207275390625, 0.174713134765625, 0.18111419677734375, 0.1875152587890625, 0.19391632080078125, 0.2003173828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 15.0, 6.0, 18.0, 27.0, 26.0, 24.0, 56.0, 46.0, 57.0, 63.0, 76.0, 75.0, 77.0, 59.0, 58.0, 59.0, 39.0, 40.0, 23.0, 23.0, 20.0, 28.0, 14.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1240234375, -0.12037944793701172, -0.11673545837402344, -0.11309146881103516, -0.10944747924804688, -0.1058034896850586, -0.10215950012207031, -0.09851551055908203, -0.09487152099609375, -0.09122753143310547, -0.08758354187011719, -0.0839395523071289, -0.08029556274414062, -0.07665157318115234, -0.07300758361816406, -0.06936359405517578, -0.0657196044921875, -0.06207561492919922, -0.05843162536621094, -0.054787635803222656, -0.051143646240234375, -0.047499656677246094, -0.04385566711425781, -0.04021167755126953, -0.03656768798828125, -0.03292369842529297, -0.029279708862304688, -0.025635719299316406, -0.021991729736328125, -0.018347740173339844, -0.014703750610351562, -0.011059761047363281, -0.007415771484375, -0.0037717819213867188, -0.0001277923583984375, 0.0035161972045898438, 0.007160186767578125, 0.010804176330566406, 0.014448165893554688, 0.01809215545654297, 0.02173614501953125, 0.02538013458251953, 0.029024124145507812, 0.032668113708496094, 0.036312103271484375, 0.039956092834472656, 0.04360008239746094, 0.04724407196044922, 0.0508880615234375, 0.05453205108642578, 0.05817604064941406, 0.061820030212402344, 0.06546401977539062, 0.0691080093383789, 0.07275199890136719, 0.07639598846435547, 0.08003997802734375, 0.08368396759033203, 0.08732795715332031, 0.0909719467163086, 0.09461593627929688, 0.09825992584228516, 0.10190391540527344, 0.10554790496826172, 0.10919189453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 5.0, 1.0, 6.0, 1.0, 18.0, 27.0, 66.0, 164.0, 193.0, 235.0, 154.0, 83.0, 34.0, 15.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6376831531524658, -1.5120912790298462, -1.3864994049072266, -1.2609076499938965, -1.1353156566619873, -1.0097239017486572, -0.8841320276260376, -0.758540153503418, -0.6329482793807983, -0.5073564052581787, -0.38176456093788147, -0.25617271661758423, -0.1305808424949646, -0.004988968372344971, 0.12060284614562988, 0.2461947202682495, 0.37178659439086914, 0.49737846851348877, 0.6229703426361084, 0.7485621571540833, 0.8741540312767029, 0.9997459053993225, 1.1253377199172974, 1.250929594039917, 1.3765214681625366, 1.5021133422851562, 1.6277052164077759, 1.7532970905303955, 1.8788888454437256, 2.0044808387756348, 2.130072593688965, 2.255664348602295, 2.381256580352783, 2.5068483352661133, 2.6324403285980225, 2.7580320835113525, 2.8836240768432617, 3.009215831756592, 3.134807586669922, 3.260399580001831, 3.3859915733337402, 3.5115833282470703, 3.6371753215789795, 3.7627670764923096, 3.8883590698242188, 4.013950824737549, 4.139542579650879, 4.265134811401367, 4.390726089477539, 4.516317844390869, 4.641909599304199, 4.7675018310546875, 4.893093585968018, 5.018685340881348, 5.144277095794678, 5.269868850708008, 5.395461082458496, 5.521052837371826, 5.646644592285156, 5.7722368240356445, 5.897828578948975, 6.023420333862305, 6.149012088775635, 6.274603843688965, 6.400196075439453]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 3.0, 5.0, 13.0, 13.0, 11.0, 12.0, 24.0, 22.0, 32.0, 23.0, 27.0, 26.0, 39.0, 31.0, 43.0, 41.0, 61.0, 66.0, 57.0, 50.0, 59.0, 36.0, 51.0, 33.0, 33.0, 28.0, 25.0, 20.0, 25.0, 24.0, 13.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9483669996261597, -1.8918190002441406, -1.8352710008621216, -1.7787230014801025, -1.722175121307373, -1.665627121925354, -1.609079122543335, -1.552531123161316, -1.4959831237792969, -1.4394351243972778, -1.3828871250152588, -1.3263392448425293, -1.2697912454605103, -1.2132432460784912, -1.1566952466964722, -1.1001472473144531, -1.0435993671417236, -0.9870513677597046, -0.9305034279823303, -0.8739554286003113, -0.8174074292182922, -0.760859489440918, -0.7043114900588989, -0.6477634906768799, -0.5912154912948608, -0.5346674919128418, -0.47811952233314514, -0.4215715527534485, -0.36502355337142944, -0.3084755837917328, -0.25192761421203613, -0.1953796148300171, -0.13883161544799805, -0.0822836309671402, -0.025735653936862946, 0.030812323093414307, 0.08736030757427216, 0.14390829205513, 0.20045626163482666, 0.2570042610168457, 0.31355223059654236, 0.370100200176239, 0.42664819955825806, 0.4831961691379547, 0.5397441387176514, 0.5962921380996704, 0.6528401374816895, 0.7093881368637085, 0.7659360766410828, 0.8224840760231018, 0.8790320158004761, 0.9355800151824951, 0.9921280145645142, 1.0486760139465332, 1.1052238941192627, 1.1617720127105713, 1.2183198928833008, 1.2748678922653198, 1.3314158916473389, 1.3879637718200684, 1.4445117712020874, 1.5010597705841064, 1.5576077699661255, 1.6141557693481445, 1.6707037687301636]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 16.0, 19.0, 26.0, 38.0, 66.0, 111.0, 164.0, 253.0, 423.0, 756.0, 1319.0, 2513.0, 4931.0, 11363.0, 33761.0, 200696.0, 3822723.0, 78982.0, 20385.0, 7817.0, 3567.0, 1786.0, 957.0, 594.0, 345.0, 211.0, 165.0, 104.0, 67.0, 42.0, 21.0, 15.0, 10.0, 7.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.2677154541015625, -0.258575439453125, -0.2494354248046875, -0.24029541015625, -0.2311553955078125, -0.222015380859375, -0.2128753662109375, -0.2037353515625, -0.1945953369140625, -0.185455322265625, -0.1763153076171875, -0.16717529296875, -0.1580352783203125, -0.148895263671875, -0.1397552490234375, -0.130615234375, -0.1214752197265625, -0.112335205078125, -0.1031951904296875, -0.09405517578125, -0.0849151611328125, -0.075775146484375, -0.0666351318359375, -0.0574951171875, -0.0483551025390625, -0.039215087890625, -0.0300750732421875, -0.02093505859375, -0.0117950439453125, -0.002655029296875, 0.0064849853515625, 0.015625, 0.0247650146484375, 0.033905029296875, 0.0430450439453125, 0.05218505859375, 0.0613250732421875, 0.070465087890625, 0.0796051025390625, 0.0887451171875, 0.0978851318359375, 0.107025146484375, 0.1161651611328125, 0.12530517578125, 0.1344451904296875, 0.143585205078125, 0.1527252197265625, 0.161865234375, 0.1710052490234375, 0.180145263671875, 0.1892852783203125, 0.19842529296875, 0.2075653076171875, 0.216705322265625, 0.2258453369140625, 0.2349853515625, 0.2441253662109375, 0.253265380859375, 0.2624053955078125, 0.27154541015625, 0.2806854248046875, 0.289825439453125, 0.2989654541015625, 0.30810546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 14.0, 12.0, 15.0, 21.0, 19.0, 38.0, 56.0, 48.0, 48.0, 64.0, 62.0, 80.0, 66.0, 49.0, 45.0, 50.0, 44.0, 47.0, 40.0, 37.0, 34.0, 23.0, 14.0, 6.0, 11.0, 5.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10055828094482422, -0.09753990173339844, -0.09452152252197266, -0.09150314331054688, -0.0884847640991211, -0.08546638488769531, -0.08244800567626953, -0.07942962646484375, -0.07641124725341797, -0.07339286804199219, -0.0703744888305664, -0.06735610961914062, -0.06433773040771484, -0.06131935119628906, -0.05830097198486328, -0.0552825927734375, -0.05226421356201172, -0.04924583435058594, -0.046227455139160156, -0.043209075927734375, -0.040190696716308594, -0.03717231750488281, -0.03415393829345703, -0.03113555908203125, -0.02811717987060547, -0.025098800659179688, -0.022080421447753906, -0.019062042236328125, -0.016043663024902344, -0.013025283813476562, -0.010006904602050781, -0.006988525390625, -0.003970146179199219, -0.0009517669677734375, 0.0020666122436523438, 0.005084991455078125, 0.008103370666503906, 0.011121749877929688, 0.014140129089355469, 0.01715850830078125, 0.02017688751220703, 0.023195266723632812, 0.026213645935058594, 0.029232025146484375, 0.032250404357910156, 0.03526878356933594, 0.03828716278076172, 0.0413055419921875, 0.04432392120361328, 0.04734230041503906, 0.050360679626464844, 0.053379058837890625, 0.056397438049316406, 0.05941581726074219, 0.06243419647216797, 0.06545257568359375, 0.06847095489501953, 0.07148933410644531, 0.0745077133178711, 0.07752609252929688, 0.08054447174072266, 0.08356285095214844, 0.08658123016357422, 0.089599609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 14.0, 22.0, 28.0, 48.0, 81.0, 107.0, 150.0, 245.0, 442.0, 747.0, 1464.0, 3269.0, 8044.0, 26090.0, 154271.0, 3818326.0, 141843.0, 24830.0, 7796.0, 3115.0, 1463.0, 719.0, 406.0, 255.0, 154.0, 107.0, 78.0, 46.0, 33.0, 15.0, 19.0, 15.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3632965087890625, -0.353057861328125, -0.3428192138671875, -0.33258056640625, -0.3223419189453125, -0.312103271484375, -0.3018646240234375, -0.2916259765625, -0.2813873291015625, -0.271148681640625, -0.2609100341796875, -0.25067138671875, -0.2404327392578125, -0.230194091796875, -0.2199554443359375, -0.209716796875, -0.1994781494140625, -0.189239501953125, -0.1790008544921875, -0.16876220703125, -0.1585235595703125, -0.148284912109375, -0.1380462646484375, -0.1278076171875, -0.1175689697265625, -0.107330322265625, -0.0970916748046875, -0.08685302734375, -0.0766143798828125, -0.066375732421875, -0.0561370849609375, -0.0458984375, -0.0356597900390625, -0.025421142578125, -0.0151824951171875, -0.00494384765625, 0.0052947998046875, 0.015533447265625, 0.0257720947265625, 0.0360107421875, 0.0462493896484375, 0.056488037109375, 0.0667266845703125, 0.07696533203125, 0.0872039794921875, 0.097442626953125, 0.1076812744140625, 0.117919921875, 0.1281585693359375, 0.138397216796875, 0.1486358642578125, 0.15887451171875, 0.1691131591796875, 0.179351806640625, 0.1895904541015625, 0.1998291015625, 0.2100677490234375, 0.220306396484375, 0.2305450439453125, 0.24078369140625, 0.2510223388671875, 0.261260986328125, 0.2714996337890625, 0.28173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 11.0, 6.0, 10.0, 9.0, 25.0, 39.0, 47.0, 100.0, 219.0, 1693.0, 1439.0, 187.0, 105.0, 44.0, 42.0, 23.0, 15.0, 17.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.15771484375, -0.15345191955566406, -0.14918899536132812, -0.1449260711669922, -0.14066314697265625, -0.1364002227783203, -0.13213729858398438, -0.12787437438964844, -0.1236114501953125, -0.11934852600097656, -0.11508560180664062, -0.11082267761230469, -0.10655975341796875, -0.10229682922363281, -0.09803390502929688, -0.09377098083496094, -0.089508056640625, -0.08524513244628906, -0.08098220825195312, -0.07671928405761719, -0.07245635986328125, -0.06819343566894531, -0.06393051147460938, -0.05966758728027344, -0.0554046630859375, -0.05114173889160156, -0.046878814697265625, -0.04261589050292969, -0.03835296630859375, -0.03409004211425781, -0.029827117919921875, -0.025564193725585938, -0.02130126953125, -0.017038345336914062, -0.012775421142578125, -0.008512496948242188, -0.00424957275390625, 1.33514404296875e-05, 0.004276275634765625, 0.008539199829101562, 0.0128021240234375, 0.017065048217773438, 0.021327972412109375, 0.025590896606445312, 0.02985382080078125, 0.03411674499511719, 0.038379669189453125, 0.04264259338378906, 0.046905517578125, 0.05116844177246094, 0.055431365966796875, 0.05969429016113281, 0.06395721435546875, 0.06822013854980469, 0.07248306274414062, 0.07674598693847656, 0.0810089111328125, 0.08527183532714844, 0.08953475952148438, 0.09379768371582031, 0.09806060791015625, 0.10232353210449219, 0.10658645629882812, 0.11084938049316406, 0.1151123046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 22.0, 39.0, 81.0, 134.0, 171.0, 189.0, 135.0, 82.0, 53.0, 28.0, 21.0, 8.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8752933740615845, -0.8462796211242676, -0.8172658085823059, -0.788252055644989, -0.7592383027076721, -0.7302244901657104, -0.7012107372283936, -0.6721969842910767, -0.6431832313537598, -0.6141694784164429, -0.5851556658744812, -0.5561419129371643, -0.5271281599998474, -0.49811437726020813, -0.46910059452056885, -0.44008684158325195, -0.4110730290412903, -0.382059246301651, -0.3530454933643341, -0.3240317106246948, -0.29501795768737793, -0.26600417494773865, -0.23699039220809937, -0.20797662436962128, -0.1789628565311432, -0.1499490886926651, -0.12093531340360641, -0.09192153811454773, -0.06290777027606964, -0.03389400243759155, -0.0048802196979522705, 0.024133548140525818, 0.05314725637435913, 0.08216102421283722, 0.1111747995018959, 0.1401885747909546, 0.16920234262943268, 0.19821611046791077, 0.22722989320755005, 0.25624364614486694, 0.2852574288845062, 0.3142712116241455, 0.3432849645614624, 0.3722987473011017, 0.40131253004074097, 0.43032628297805786, 0.45934006571769714, 0.4883538484573364, 0.5173676013946533, 0.5463813543319702, 0.5753951668739319, 0.6044089198112488, 0.6334226727485657, 0.6624364852905273, 0.6914502382278442, 0.7204639911651611, 0.749477744102478, 0.7784914970397949, 0.8075053095817566, 0.8365190625190735, 0.8655328154563904, 0.894546627998352, 0.923560380935669, 0.9525741338729858, 0.9815879464149475]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 1.0, 6.0, 7.0, 10.0, 8.0, 15.0, 7.0, 16.0, 18.0, 22.0, 23.0, 25.0, 23.0, 31.0, 37.0, 50.0, 37.0, 38.0, 50.0, 48.0, 33.0, 56.0, 32.0, 38.0, 33.0, 42.0, 33.0, 34.0, 34.0, 31.0, 22.0, 16.0, 20.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2980915307998657, -0.2880476415157318, -0.2780037522315979, -0.267959862947464, -0.2579159736633301, -0.24787208437919617, -0.23782820999622345, -0.22778432071208954, -0.21774043142795563, -0.20769654214382172, -0.1976526528596878, -0.1876087635755539, -0.17756488919258118, -0.16752099990844727, -0.15747711062431335, -0.14743322134017944, -0.13738933205604553, -0.12734544277191162, -0.11730155348777771, -0.1072576716542244, -0.09721378237009048, -0.08716989308595657, -0.07712601125240326, -0.06708212196826935, -0.05703823268413544, -0.046994343400001526, -0.03695045784115791, -0.02690657041966915, -0.01686268299818039, -0.006818793714046478, 0.0032250918447971344, 0.013268977403640747, 0.023312866687774658, 0.03335675597190857, 0.04340064153075218, 0.053444527089595795, 0.0634884163737297, 0.07353230565786362, 0.08357618749141693, 0.09362007677555084, 0.10366396605968475, 0.11370785534381866, 0.12375174462795258, 0.1337956339120865, 0.1438395082950592, 0.15388339757919312, 0.16392728686332703, 0.17397117614746094, 0.18401506543159485, 0.19405895471572876, 0.20410284399986267, 0.21414673328399658, 0.2241906225681305, 0.2342345118522644, 0.24427838623523712, 0.2543222904205322, 0.26436614990234375, 0.27441003918647766, 0.2844539284706116, 0.2944978177547455, 0.3045417070388794, 0.3145855963230133, 0.3246294856071472, 0.33467334508895874, 0.34471726417541504]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 12.0, 15.0, 39.0, 45.0, 70.0, 122.0, 184.0, 309.0, 483.0, 878.0, 1368.0, 2508.0, 4486.0, 8517.0, 16076.0, 31159.0, 60061.0, 118426.0, 260561.0, 280306.0, 127671.0, 64308.0, 33176.0, 17360.0, 9053.0, 4754.0, 2757.0, 1527.0, 886.0, 503.0, 319.0, 196.0, 147.0, 99.0, 44.0, 30.0, 25.0, 13.0, 10.0, 9.0, 5.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1517333984375, -0.1466846466064453, -0.14163589477539062, -0.13658714294433594, -0.13153839111328125, -0.12648963928222656, -0.12144088745117188, -0.11639213562011719, -0.1113433837890625, -0.10629463195800781, -0.10124588012695312, -0.09619712829589844, -0.09114837646484375, -0.08609962463378906, -0.08105087280273438, -0.07600212097167969, -0.070953369140625, -0.06590461730957031, -0.060855865478515625, -0.05580711364746094, -0.05075836181640625, -0.04570960998535156, -0.040660858154296875, -0.03561210632324219, -0.0305633544921875, -0.025514602661132812, -0.020465850830078125, -0.015417098999023438, -0.01036834716796875, -0.0053195953369140625, -0.000270843505859375, 0.0047779083251953125, 0.00982666015625, 0.014875411987304688, 0.019924163818359375, 0.024972915649414062, 0.03002166748046875, 0.03507041931152344, 0.040119171142578125, 0.04516792297363281, 0.0502166748046875, 0.05526542663574219, 0.060314178466796875, 0.06536293029785156, 0.07041168212890625, 0.07546043395996094, 0.08050918579101562, 0.08555793762207031, 0.090606689453125, 0.09565544128417969, 0.10070419311523438, 0.10575294494628906, 0.11080169677734375, 0.11585044860839844, 0.12089920043945312, 0.1259479522705078, 0.1309967041015625, 0.1360454559326172, 0.14109420776367188, 0.14614295959472656, 0.15119171142578125, 0.15624046325683594, 0.16128921508789062, 0.1663379669189453, 0.17138671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 6.0, 9.0, 11.0, 18.0, 17.0, 23.0, 41.0, 44.0, 40.0, 42.0, 59.0, 55.0, 61.0, 53.0, 54.0, 54.0, 45.0, 57.0, 55.0, 41.0, 41.0, 37.0, 32.0, 23.0, 10.0, 6.0, 11.0, 8.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1025390625, -0.0994110107421875, -0.096282958984375, -0.0931549072265625, -0.09002685546875, -0.0868988037109375, -0.083770751953125, -0.0806427001953125, -0.0775146484375, -0.0743865966796875, -0.071258544921875, -0.0681304931640625, -0.06500244140625, -0.0618743896484375, -0.058746337890625, -0.0556182861328125, -0.052490234375, -0.0493621826171875, -0.046234130859375, -0.0431060791015625, -0.03997802734375, -0.0368499755859375, -0.033721923828125, -0.0305938720703125, -0.0274658203125, -0.0243377685546875, -0.021209716796875, -0.0180816650390625, -0.01495361328125, -0.0118255615234375, -0.008697509765625, -0.0055694580078125, -0.00244140625, 0.0006866455078125, 0.003814697265625, 0.0069427490234375, 0.01007080078125, 0.0131988525390625, 0.016326904296875, 0.0194549560546875, 0.0225830078125, 0.0257110595703125, 0.028839111328125, 0.0319671630859375, 0.03509521484375, 0.0382232666015625, 0.041351318359375, 0.0444793701171875, 0.047607421875, 0.0507354736328125, 0.053863525390625, 0.0569915771484375, 0.06011962890625, 0.0632476806640625, 0.066375732421875, 0.0695037841796875, 0.0726318359375, 0.0757598876953125, 0.078887939453125, 0.0820159912109375, 0.08514404296875, 0.0882720947265625, 0.091400146484375, 0.0945281982421875, 0.09765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 13.0, 17.0, 23.0, 39.0, 40.0, 59.0, 85.0, 119.0, 176.0, 245.0, 341.0, 578.0, 1024.0, 2045.0, 5511.0, 21816.0, 144577.0, 697602.0, 142365.0, 21538.0, 5594.0, 2016.0, 1026.0, 564.0, 343.0, 227.0, 169.0, 106.0, 86.0, 55.0, 52.0, 20.0, 22.0, 12.0, 10.0, 9.0, 10.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3662109375, -0.35527801513671875, -0.3443450927734375, -0.33341217041015625, -0.322479248046875, -0.31154632568359375, -0.3006134033203125, -0.28968048095703125, -0.27874755859375, -0.26781463623046875, -0.2568817138671875, -0.24594879150390625, -0.235015869140625, -0.22408294677734375, -0.2131500244140625, -0.20221710205078125, -0.1912841796875, -0.18035125732421875, -0.1694183349609375, -0.15848541259765625, -0.147552490234375, -0.13661956787109375, -0.1256866455078125, -0.11475372314453125, -0.10382080078125, -0.09288787841796875, -0.0819549560546875, -0.07102203369140625, -0.060089111328125, -0.04915618896484375, -0.0382232666015625, -0.02729034423828125, -0.016357421875, -0.00542449951171875, 0.0055084228515625, 0.01644134521484375, 0.027374267578125, 0.03830718994140625, 0.0492401123046875, 0.06017303466796875, 0.07110595703125, 0.08203887939453125, 0.0929718017578125, 0.10390472412109375, 0.114837646484375, 0.12577056884765625, 0.1367034912109375, 0.14763641357421875, 0.1585693359375, 0.16950225830078125, 0.1804351806640625, 0.19136810302734375, 0.202301025390625, 0.21323394775390625, 0.2241668701171875, 0.23509979248046875, 0.24603271484375, 0.25696563720703125, 0.2678985595703125, 0.27883148193359375, 0.289764404296875, 0.30069732666015625, 0.3116302490234375, 0.32256317138671875, 0.33349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 3.0, 8.0, 4.0, 10.0, 5.0, 14.0, 15.0, 17.0, 22.0, 18.0, 35.0, 23.0, 23.0, 27.0, 33.0, 46.0, 38.0, 48.0, 49.0, 50.0, 36.0, 51.0, 45.0, 38.0, 37.0, 33.0, 37.0, 30.0, 31.0, 16.0, 23.0, 19.0, 16.0, 20.0, 12.0, 11.0, 8.0, 6.0, 7.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.353759765625, -0.3442115783691406, -0.33466339111328125, -0.3251152038574219, -0.3155670166015625, -0.3060188293457031, -0.29647064208984375, -0.2869224548339844, -0.277374267578125, -0.2678260803222656, -0.25827789306640625, -0.24872970581054688, -0.2391815185546875, -0.22963333129882812, -0.22008514404296875, -0.21053695678710938, -0.20098876953125, -0.19144058227539062, -0.18189239501953125, -0.17234420776367188, -0.1627960205078125, -0.15324783325195312, -0.14369964599609375, -0.13415145874023438, -0.124603271484375, -0.11505508422851562, -0.10550689697265625, -0.09595870971679688, -0.0864105224609375, -0.07686233520507812, -0.06731414794921875, -0.057765960693359375, -0.0482177734375, -0.038669586181640625, -0.02912139892578125, -0.019573211669921875, -0.0100250244140625, -0.000476837158203125, 0.00907135009765625, 0.018619537353515625, 0.028167724609375, 0.037715911865234375, 0.04726409912109375, 0.056812286376953125, 0.0663604736328125, 0.07590866088867188, 0.08545684814453125, 0.09500503540039062, 0.10455322265625, 0.11410140991210938, 0.12364959716796875, 0.13319778442382812, 0.1427459716796875, 0.15229415893554688, 0.16184234619140625, 0.17139053344726562, 0.180938720703125, 0.19048690795898438, 0.20003509521484375, 0.20958328247070312, 0.2191314697265625, 0.22867965698242188, 0.23822784423828125, 0.24777603149414062, 0.25732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 7.0, 10.0, 5.0, 11.0, 16.0, 27.0, 54.0, 69.0, 99.0, 183.0, 353.0, 607.0, 1377.0, 3453.0, 10586.0, 44298.0, 245307.0, 583104.0, 123507.0, 24281.0, 6621.0, 2413.0, 1029.0, 491.0, 257.0, 134.0, 94.0, 55.0, 28.0, 24.0, 11.0, 10.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.09561920166015625, -0.0921173095703125, -0.08861541748046875, -0.085113525390625, -0.08161163330078125, -0.0781097412109375, -0.07460784912109375, -0.07110595703125, -0.06760406494140625, -0.0641021728515625, -0.06060028076171875, -0.057098388671875, -0.05359649658203125, -0.0500946044921875, -0.04659271240234375, -0.0430908203125, -0.03958892822265625, -0.0360870361328125, -0.03258514404296875, -0.029083251953125, -0.02558135986328125, -0.0220794677734375, -0.01857757568359375, -0.01507568359375, -0.01157379150390625, -0.0080718994140625, -0.00457000732421875, -0.001068115234375, 0.00243377685546875, 0.0059356689453125, 0.00943756103515625, 0.012939453125, 0.01644134521484375, 0.0199432373046875, 0.02344512939453125, 0.026947021484375, 0.03044891357421875, 0.0339508056640625, 0.03745269775390625, 0.04095458984375, 0.04445648193359375, 0.0479583740234375, 0.05146026611328125, 0.054962158203125, 0.05846405029296875, 0.0619659423828125, 0.06546783447265625, 0.0689697265625, 0.07247161865234375, 0.0759735107421875, 0.07947540283203125, 0.082977294921875, 0.08647918701171875, 0.0899810791015625, 0.09348297119140625, 0.09698486328125, 0.10048675537109375, 0.1039886474609375, 0.10749053955078125, 0.110992431640625, 0.11449432373046875, 0.1179962158203125, 0.12149810791015625, 0.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 12.0, 10.0, 14.0, 19.0, 21.0, 24.0, 30.0, 42.0, 32.0, 49.0, 54.0, 81.0, 92.0, 106.0, 88.0, 77.0, 38.0, 38.0, 29.0, 28.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 10.0, 11.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.011392593383789e-05, -3.8504600524902344e-05, -3.68952751159668e-05, -3.528594970703125e-05, -3.36766242980957e-05, -3.2067298889160156e-05, -3.045797348022461e-05, -2.8848648071289062e-05, -2.7239322662353516e-05, -2.562999725341797e-05, -2.4020671844482422e-05, -2.2411346435546875e-05, -2.0802021026611328e-05, -1.919269561767578e-05, -1.7583370208740234e-05, -1.5974044799804688e-05, -1.436471939086914e-05, -1.2755393981933594e-05, -1.1146068572998047e-05, -9.5367431640625e-06, -7.927417755126953e-06, -6.318092346191406e-06, -4.708766937255859e-06, -3.0994415283203125e-06, -1.4901161193847656e-06, 1.1920928955078125e-07, 1.7285346984863281e-06, 3.337860107421875e-06, 4.947185516357422e-06, 6.556510925292969e-06, 8.165836334228516e-06, 9.775161743164062e-06, 1.138448715209961e-05, 1.2993812561035156e-05, 1.4603137969970703e-05, 1.621246337890625e-05, 1.7821788787841797e-05, 1.9431114196777344e-05, 2.104043960571289e-05, 2.2649765014648438e-05, 2.4259090423583984e-05, 2.586841583251953e-05, 2.7477741241455078e-05, 2.9087066650390625e-05, 3.069639205932617e-05, 3.230571746826172e-05, 3.3915042877197266e-05, 3.552436828613281e-05, 3.713369369506836e-05, 3.8743019104003906e-05, 4.035234451293945e-05, 4.1961669921875e-05, 4.357099533081055e-05, 4.5180320739746094e-05, 4.678964614868164e-05, 4.839897155761719e-05, 5.0008296966552734e-05, 5.161762237548828e-05, 5.322694778442383e-05, 5.4836273193359375e-05, 5.644559860229492e-05, 5.805492401123047e-05, 5.9664249420166016e-05, 6.127357482910156e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 5.0, 12.0, 11.0, 21.0, 24.0, 27.0, 38.0, 60.0, 92.0, 129.0, 246.0, 351.0, 591.0, 1218.0, 2578.0, 6460.0, 22617.0, 114802.0, 552775.0, 279469.0, 47639.0, 11485.0, 3987.0, 1745.0, 871.0, 481.0, 287.0, 179.0, 100.0, 71.0, 55.0, 34.0, 25.0, 17.0, 10.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10421562194824219, -0.10082626342773438, -0.09743690490722656, -0.09404754638671875, -0.09065818786621094, -0.08726882934570312, -0.08387947082519531, -0.0804901123046875, -0.07710075378417969, -0.07371139526367188, -0.07032203674316406, -0.06693267822265625, -0.06354331970214844, -0.060153961181640625, -0.05676460266113281, -0.053375244140625, -0.04998588562011719, -0.046596527099609375, -0.04320716857910156, -0.03981781005859375, -0.03642845153808594, -0.033039093017578125, -0.029649734497070312, -0.0262603759765625, -0.022871017456054688, -0.019481658935546875, -0.016092300415039062, -0.01270294189453125, -0.009313583374023438, -0.005924224853515625, -0.0025348663330078125, 0.0008544921875, 0.0042438507080078125, 0.007633209228515625, 0.011022567749023438, 0.01441192626953125, 0.017801284790039062, 0.021190643310546875, 0.024580001831054688, 0.0279693603515625, 0.03135871887207031, 0.034748077392578125, 0.03813743591308594, 0.04152679443359375, 0.04491615295410156, 0.048305511474609375, 0.05169486999511719, 0.055084228515625, 0.05847358703613281, 0.061862945556640625, 0.06525230407714844, 0.06864166259765625, 0.07203102111816406, 0.07542037963867188, 0.07880973815917969, 0.0821990966796875, 0.08558845520019531, 0.08897781372070312, 0.09236717224121094, 0.09575653076171875, 0.09914588928222656, 0.10253524780273438, 0.10592460632324219, 0.10931396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 7.0, 7.0, 13.0, 14.0, 11.0, 15.0, 22.0, 25.0, 27.0, 29.0, 38.0, 47.0, 59.0, 46.0, 64.0, 72.0, 58.0, 55.0, 69.0, 46.0, 42.0, 43.0, 26.0, 28.0, 15.0, 18.0, 10.0, 14.0, 14.0, 7.0, 7.0, 13.0, 7.0, 1.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08392047882080078, -0.08135414123535156, -0.07878780364990234, -0.07622146606445312, -0.0736551284790039, -0.07108879089355469, -0.06852245330810547, -0.06595611572265625, -0.06338977813720703, -0.06082344055175781, -0.058257102966308594, -0.055690765380859375, -0.053124427795410156, -0.05055809020996094, -0.04799175262451172, -0.0454254150390625, -0.04285907745361328, -0.04029273986816406, -0.037726402282714844, -0.035160064697265625, -0.032593727111816406, -0.030027389526367188, -0.02746105194091797, -0.02489471435546875, -0.02232837677001953, -0.019762039184570312, -0.017195701599121094, -0.014629364013671875, -0.012063026428222656, -0.009496688842773438, -0.006930351257324219, -0.004364013671875, -0.0017976760864257812, 0.0007686614990234375, 0.0033349990844726562, 0.005901336669921875, 0.008467674255371094, 0.011034011840820312, 0.013600349426269531, 0.01616668701171875, 0.01873302459716797, 0.021299362182617188, 0.023865699768066406, 0.026432037353515625, 0.028998374938964844, 0.03156471252441406, 0.03413105010986328, 0.0366973876953125, 0.03926372528076172, 0.04183006286621094, 0.044396400451660156, 0.046962738037109375, 0.049529075622558594, 0.05209541320800781, 0.05466175079345703, 0.05722808837890625, 0.05979442596435547, 0.06236076354980469, 0.0649271011352539, 0.06749343872070312, 0.07005977630615234, 0.07262611389160156, 0.07519245147705078, 0.0777587890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 8.0, 23.0, 27.0, 46.0, 70.0, 89.0, 101.0, 112.0, 122.0, 113.0, 73.0, 66.0, 59.0, 36.0, 13.0, 15.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1587326526641846, -2.1010186672210693, -2.043304920196533, -1.985590934753418, -1.9278769493103027, -1.870163083076477, -1.8124492168426514, -1.7547352313995361, -1.6970213651657104, -1.6393074989318848, -1.5815935134887695, -1.5238796472549438, -1.4661657810211182, -1.408451795578003, -1.3507379293441772, -1.2930240631103516, -1.2353100776672363, -1.1775962114334106, -1.1198822259902954, -1.0621683597564697, -1.0044543743133545, -0.9467405080795288, -0.8890266418457031, -0.8313127160072327, -0.7735987901687622, -0.7158848643302917, -0.6581709384918213, -0.6004570722579956, -0.5427431464195251, -0.4850292205810547, -0.4273153245449066, -0.36960142850875854, -0.3118875026702881, -0.2541735768318176, -0.19645968079566956, -0.1387457698583603, -0.08103185892105103, -0.023317933082580566, 0.034395962953567505, 0.09210985898971558, 0.14982378482818604, 0.2075376957654953, 0.26525160670280457, 0.32296550273895264, 0.3806794285774231, 0.43839335441589355, 0.4961072504520416, 0.5538211464881897, 0.6115350723266602, 0.6692489981651306, 0.7269629240036011, 0.7846767902374268, 0.8423907160758972, 0.9001046419143677, 0.9578185081481934, 1.0155324935913086, 1.0732463598251343, 1.13096022605896, 1.1886742115020752, 1.2463880777359009, 1.3041019439697266, 1.3618159294128418, 1.4195297956466675, 1.4772436618804932, 1.5349576473236084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 15.0, 17.0, 7.0, 28.0, 17.0, 14.0, 22.0, 20.0, 33.0, 35.0, 39.0, 26.0, 39.0, 39.0, 38.0, 44.0, 50.0, 63.0, 52.0, 47.0, 52.0, 34.0, 31.0, 27.0, 34.0, 26.0, 18.0, 24.0, 13.0, 13.0, 13.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.6132254600524902, -1.5671130418777466, -1.521000623703003, -1.4748882055282593, -1.4287757873535156, -1.382663369178772, -1.3365509510040283, -1.2904385328292847, -1.244326114654541, -1.1982136964797974, -1.1521012783050537, -1.10598886013031, -1.0598764419555664, -1.0137640237808228, -0.9676516056060791, -0.9215391874313354, -0.875426709651947, -0.8293142914772034, -0.7832018733024597, -0.7370894551277161, -0.6909770369529724, -0.6448646187782288, -0.5987521409988403, -0.5526397228240967, -0.506527304649353, -0.4604148864746094, -0.4143024682998657, -0.36819005012512207, -0.3220776319503784, -0.27596521377563477, -0.22985276579856873, -0.18374034762382507, -0.1376279592514038, -0.09151554107666016, -0.04540311545133591, 0.0007093101739883423, 0.046821728348731995, 0.09293414652347565, 0.1390465795993805, 0.18515899777412415, 0.2312714159488678, 0.27738383412361145, 0.3234962522983551, 0.36960870027542114, 0.4157211184501648, 0.46183353662490845, 0.5079459547996521, 0.5540583729743958, 0.6001707911491394, 0.6462832093238831, 0.6923956274986267, 0.7385080456733704, 0.784620463848114, 0.8307328820228577, 0.8768453598022461, 0.9229577779769897, 0.9690701961517334, 1.015182614326477, 1.0612950325012207, 1.1074074506759644, 1.153519868850708, 1.1996322870254517, 1.2457447052001953, 1.291857123374939, 1.3379695415496826]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 19.0, 15.0, 31.0, 31.0, 51.0, 84.0, 134.0, 171.0, 278.0, 441.0, 699.0, 1093.0, 1910.0, 3375.0, 6021.0, 11704.0, 24240.0, 57194.0, 169165.0, 870389.0, 2393611.0, 457601.0, 112879.0, 42571.0, 19292.0, 9385.0, 4877.0, 2824.0, 1565.0, 947.0, 571.0, 415.0, 228.0, 153.0, 114.0, 60.0, 49.0, 20.0, 21.0, 17.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1444091796875, -0.14043426513671875, -0.1364593505859375, -0.13248443603515625, -0.128509521484375, -0.12453460693359375, -0.1205596923828125, -0.11658477783203125, -0.11260986328125, -0.10863494873046875, -0.1046600341796875, -0.10068511962890625, -0.096710205078125, -0.09273529052734375, -0.0887603759765625, -0.08478546142578125, -0.080810546875, -0.07683563232421875, -0.0728607177734375, -0.06888580322265625, -0.064910888671875, -0.06093597412109375, -0.0569610595703125, -0.05298614501953125, -0.04901123046875, -0.04503631591796875, -0.0410614013671875, -0.03708648681640625, -0.033111572265625, -0.02913665771484375, -0.0251617431640625, -0.02118682861328125, -0.0172119140625, -0.01323699951171875, -0.0092620849609375, -0.00528717041015625, -0.001312255859375, 0.00266265869140625, 0.0066375732421875, 0.01061248779296875, 0.01458740234375, 0.01856231689453125, 0.0225372314453125, 0.02651214599609375, 0.030487060546875, 0.03446197509765625, 0.0384368896484375, 0.04241180419921875, 0.04638671875, 0.05036163330078125, 0.0543365478515625, 0.05831146240234375, 0.062286376953125, 0.06626129150390625, 0.0702362060546875, 0.07421112060546875, 0.07818603515625, 0.08216094970703125, 0.0861358642578125, 0.09011077880859375, 0.094085693359375, 0.09806060791015625, 0.1020355224609375, 0.10601043701171875, 0.1099853515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 11.0, 11.0, 10.0, 11.0, 21.0, 23.0, 25.0, 27.0, 33.0, 33.0, 36.0, 52.0, 44.0, 53.0, 34.0, 55.0, 59.0, 48.0, 49.0, 45.0, 50.0, 34.0, 41.0, 42.0, 24.0, 27.0, 21.0, 20.0, 10.0, 8.0, 10.0, 8.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08941650390625, -0.08683586120605469, -0.08425521850585938, -0.08167457580566406, -0.07909393310546875, -0.07651329040527344, -0.07393264770507812, -0.07135200500488281, -0.0687713623046875, -0.06619071960449219, -0.06361007690429688, -0.06102943420410156, -0.05844879150390625, -0.05586814880371094, -0.053287506103515625, -0.05070686340332031, -0.048126220703125, -0.04554557800292969, -0.042964935302734375, -0.04038429260253906, -0.03780364990234375, -0.03522300720214844, -0.032642364501953125, -0.030061721801757812, -0.0274810791015625, -0.024900436401367188, -0.022319793701171875, -0.019739151000976562, -0.01715850830078125, -0.014577865600585938, -0.011997222900390625, -0.009416580200195312, -0.0068359375, -0.0042552947998046875, -0.001674652099609375, 0.0009059906005859375, 0.00348663330078125, 0.0060672760009765625, 0.008647918701171875, 0.011228561401367188, 0.0138092041015625, 0.016389846801757812, 0.018970489501953125, 0.021551132202148438, 0.02413177490234375, 0.026712417602539062, 0.029293060302734375, 0.03187370300292969, 0.034454345703125, 0.03703498840332031, 0.039615631103515625, 0.04219627380371094, 0.04477691650390625, 0.04735755920410156, 0.049938201904296875, 0.05251884460449219, 0.0550994873046875, 0.05768013000488281, 0.060260772705078125, 0.06284141540527344, 0.06542205810546875, 0.06800270080566406, 0.07058334350585938, 0.07316398620605469, 0.07574462890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 11.0, 18.0, 32.0, 68.0, 106.0, 235.0, 465.0, 1210.0, 3830.0, 14412.0, 82426.0, 1843647.0, 2137188.0, 89002.0, 15426.0, 3944.0, 1287.0, 491.0, 244.0, 100.0, 61.0, 21.0, 20.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24352264404296875, -0.2333831787109375, -0.22324371337890625, -0.213104248046875, -0.20296478271484375, -0.1928253173828125, -0.18268585205078125, -0.17254638671875, -0.16240692138671875, -0.1522674560546875, -0.14212799072265625, -0.131988525390625, -0.12184906005859375, -0.1117095947265625, -0.10157012939453125, -0.0914306640625, -0.08129119873046875, -0.0711517333984375, -0.06101226806640625, -0.050872802734375, -0.04073333740234375, -0.0305938720703125, -0.02045440673828125, -0.01031494140625, -0.00017547607421875, 0.0099639892578125, 0.02010345458984375, 0.030242919921875, 0.04038238525390625, 0.0505218505859375, 0.06066131591796875, 0.07080078125, 0.08094024658203125, 0.0910797119140625, 0.10121917724609375, 0.111358642578125, 0.12149810791015625, 0.1316375732421875, 0.14177703857421875, 0.15191650390625, 0.16205596923828125, 0.1721954345703125, 0.18233489990234375, 0.192474365234375, 0.20261383056640625, 0.2127532958984375, 0.22289276123046875, 0.2330322265625, 0.24317169189453125, 0.2533111572265625, 0.26345062255859375, 0.273590087890625, 0.28372955322265625, 0.2938690185546875, 0.30400848388671875, 0.31414794921875, 0.32428741455078125, 0.3344268798828125, 0.34456634521484375, 0.354705810546875, 0.36484527587890625, 0.3749847412109375, 0.38512420654296875, 0.395263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 8.0, 9.0, 13.0, 16.0, 18.0, 31.0, 51.0, 55.0, 84.0, 124.0, 237.0, 414.0, 753.0, 916.0, 525.0, 287.0, 160.0, 100.0, 65.0, 60.0, 40.0, 22.0, 17.0, 12.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31787109375, -0.3095550537109375, -0.301239013671875, -0.2929229736328125, -0.28460693359375, -0.2762908935546875, -0.267974853515625, -0.2596588134765625, -0.2513427734375, -0.2430267333984375, -0.234710693359375, -0.2263946533203125, -0.21807861328125, -0.2097625732421875, -0.201446533203125, -0.1931304931640625, -0.184814453125, -0.1764984130859375, -0.168182373046875, -0.1598663330078125, -0.15155029296875, -0.1432342529296875, -0.134918212890625, -0.1266021728515625, -0.1182861328125, -0.1099700927734375, -0.101654052734375, -0.0933380126953125, -0.08502197265625, -0.0767059326171875, -0.068389892578125, -0.0600738525390625, -0.0517578125, -0.0434417724609375, -0.035125732421875, -0.0268096923828125, -0.01849365234375, -0.0101776123046875, -0.001861572265625, 0.0064544677734375, 0.0147705078125, 0.0230865478515625, 0.031402587890625, 0.0397186279296875, 0.04803466796875, 0.0563507080078125, 0.064666748046875, 0.0729827880859375, 0.081298828125, 0.0896148681640625, 0.097930908203125, 0.1062469482421875, 0.11456298828125, 0.1228790283203125, 0.131195068359375, 0.1395111083984375, 0.1478271484375, 0.1561431884765625, 0.164459228515625, 0.1727752685546875, 0.18109130859375, 0.1894073486328125, 0.197723388671875, 0.2060394287109375, 0.21435546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 10.0, 22.0, 41.0, 91.0, 153.0, 227.0, 204.0, 123.0, 64.0, 30.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.057502746582031, -3.955089569091797, -3.8526766300201416, -3.7502634525299072, -3.647850513458252, -3.5454373359680176, -3.443024158477783, -3.340611219406128, -3.2381982803344727, -3.1357851028442383, -3.033372163772583, -2.9309589862823486, -2.8285460472106934, -2.726132869720459, -2.6237196922302246, -2.5213067531585693, -2.418893575668335, -2.3164803981781006, -2.2140674591064453, -2.111654281616211, -2.0092413425445557, -1.9068281650543213, -1.8044151067733765, -1.7020020484924316, -1.5995889902114868, -1.497175931930542, -1.3947628736495972, -1.2923498153686523, -1.189936637878418, -1.0875236988067627, -0.9851105213165283, -0.8826974630355835, -0.7802846431732178, -0.677871584892273, -0.5754585266113281, -0.4730454087257385, -0.3706323504447937, -0.2682192921638489, -0.16580617427825928, -0.06339311599731445, 0.03901994228363037, 0.1414330154657364, 0.2438460886478424, 0.3462591767311096, 0.44867223501205444, 0.5510852932929993, 0.6534984111785889, 0.7559114694595337, 0.8583245277404785, 0.9607375860214233, 1.0631506443023682, 1.1655638217926025, 1.2679767608642578, 1.3703899383544922, 1.472802996635437, 1.5752160549163818, 1.6776291131973267, 1.7800421714782715, 1.8824552297592163, 1.9848682880401611, 2.0872814655303955, 2.189694404602051, 2.292107582092285, 2.3945207595825195, 2.496933698654175]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 12.0, 19.0, 19.0, 24.0, 31.0, 30.0, 36.0, 40.0, 53.0, 43.0, 41.0, 62.0, 49.0, 47.0, 44.0, 44.0, 51.0, 49.0, 40.0, 42.0, 26.0, 21.0, 25.0, 15.0, 21.0, 16.0, 13.0, 12.0, 10.0, 5.0, 5.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0209617614746094, -0.9830405712127686, -0.9451194405555725, -0.9071983098983765, -0.8692771196365356, -0.8313559293746948, -0.7934347987174988, -0.7555136680603027, -0.7175924777984619, -0.6796712875366211, -0.641750156879425, -0.603829026222229, -0.5659078359603882, -0.5279866456985474, -0.4900655150413513, -0.4521443545818329, -0.41422319412231445, -0.376302033662796, -0.3383808732032776, -0.30045971274375916, -0.2625385522842407, -0.2246173918247223, -0.18669623136520386, -0.14877507090568542, -0.11085391044616699, -0.07293274998664856, -0.03501158952713013, 0.0029095709323883057, 0.04083073139190674, 0.07875189185142517, 0.1166730523109436, 0.15459421277046204, 0.19251549243927002, 0.23043665289878845, 0.2683578133583069, 0.3062789738178253, 0.34420013427734375, 0.3821212947368622, 0.4200424551963806, 0.45796361565589905, 0.4958847761154175, 0.5338059663772583, 0.5717270970344543, 0.6096482276916504, 0.6475694179534912, 0.685490608215332, 0.7234117388725281, 0.7613328695297241, 0.7992540597915649, 0.8371752500534058, 0.8750963807106018, 0.9130175113677979, 0.9509387016296387, 0.9888598918914795, 1.0267810821533203, 1.0647021532058716, 1.1026233434677124, 1.1405445337295532, 1.1784656047821045, 1.2163867950439453, 1.2543079853057861, 1.292229175567627, 1.3301503658294678, 1.368071436882019, 1.4059926271438599]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 15.0, 19.0, 43.0, 55.0, 63.0, 106.0, 166.0, 310.0, 464.0, 828.0, 1421.0, 2354.0, 4300.0, 8438.0, 16758.0, 36360.0, 89450.0, 340543.0, 372984.0, 97999.0, 38450.0, 17802.0, 8952.0, 4591.0, 2545.0, 1381.0, 824.0, 487.0, 301.0, 181.0, 130.0, 74.0, 49.0, 37.0, 27.0, 16.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185791015625, -0.17916488647460938, -0.17253875732421875, -0.16591262817382812, -0.1592864990234375, -0.15266036987304688, -0.14603424072265625, -0.13940811157226562, -0.132781982421875, -0.12615585327148438, -0.11952972412109375, -0.11290359497070312, -0.1062774658203125, -0.09965133666992188, -0.09302520751953125, -0.08639907836914062, -0.07977294921875, -0.07314682006835938, -0.06652069091796875, -0.059894561767578125, -0.0532684326171875, -0.046642303466796875, -0.04001617431640625, -0.033390045166015625, -0.026763916015625, -0.020137786865234375, -0.01351165771484375, -0.006885528564453125, -0.0002593994140625, 0.006366729736328125, 0.01299285888671875, 0.019618988037109375, 0.0262451171875, 0.032871246337890625, 0.03949737548828125, 0.046123504638671875, 0.0527496337890625, 0.059375762939453125, 0.06600189208984375, 0.07262802124023438, 0.079254150390625, 0.08588027954101562, 0.09250640869140625, 0.09913253784179688, 0.1057586669921875, 0.11238479614257812, 0.11901092529296875, 0.12563705444335938, 0.13226318359375, 0.13888931274414062, 0.14551544189453125, 0.15214157104492188, 0.1587677001953125, 0.16539382934570312, 0.17201995849609375, 0.17864608764648438, 0.185272216796875, 0.19189834594726562, 0.19852447509765625, 0.20515060424804688, 0.2117767333984375, 0.21840286254882812, 0.22502899169921875, 0.23165512084960938, 0.23828125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 10.0, 18.0, 16.0, 19.0, 31.0, 45.0, 43.0, 48.0, 48.0, 60.0, 63.0, 65.0, 55.0, 48.0, 54.0, 51.0, 52.0, 46.0, 41.0, 35.0, 31.0, 29.0, 23.0, 13.0, 8.0, 9.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07561111450195312, -0.07236480712890625, -0.06911849975585938, -0.0658721923828125, -0.06262588500976562, -0.05937957763671875, -0.056133270263671875, -0.052886962890625, -0.049640655517578125, -0.04639434814453125, -0.043148040771484375, -0.0399017333984375, -0.036655426025390625, -0.03340911865234375, -0.030162811279296875, -0.02691650390625, -0.023670196533203125, -0.02042388916015625, -0.017177581787109375, -0.0139312744140625, -0.010684967041015625, -0.00743865966796875, -0.004192352294921875, -0.000946044921875, 0.002300262451171875, 0.00554656982421875, 0.008792877197265625, 0.0120391845703125, 0.015285491943359375, 0.01853179931640625, 0.021778106689453125, 0.0250244140625, 0.028270721435546875, 0.03151702880859375, 0.034763336181640625, 0.0380096435546875, 0.041255950927734375, 0.04450225830078125, 0.047748565673828125, 0.050994873046875, 0.054241180419921875, 0.05748748779296875, 0.060733795166015625, 0.0639801025390625, 0.06722640991210938, 0.07047271728515625, 0.07371902465820312, 0.07696533203125, 0.08021163940429688, 0.08345794677734375, 0.08670425415039062, 0.0899505615234375, 0.09319686889648438, 0.09644317626953125, 0.09968948364257812, 0.102935791015625, 0.10618209838867188, 0.10942840576171875, 0.11267471313476562, 0.1159210205078125, 0.11916732788085938, 0.12241363525390625, 0.12565994262695312, 0.12890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 8.0, 20.0, 20.0, 42.0, 40.0, 72.0, 102.0, 135.0, 227.0, 390.0, 734.0, 1486.0, 4025.0, 15862.0, 128579.0, 822866.0, 58631.0, 9690.0, 2849.0, 1238.0, 608.0, 329.0, 215.0, 109.0, 77.0, 57.0, 38.0, 25.0, 13.0, 19.0, 12.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3471870422363281, -0.33231353759765625, -0.3174400329589844, -0.3025665283203125, -0.2876930236816406, -0.27281951904296875, -0.2579460144042969, -0.243072509765625, -0.22819900512695312, -0.21332550048828125, -0.19845199584960938, -0.1835784912109375, -0.16870498657226562, -0.15383148193359375, -0.13895797729492188, -0.12408447265625, -0.10921096801757812, -0.09433746337890625, -0.07946395874023438, -0.0645904541015625, -0.049716949462890625, -0.03484344482421875, -0.019969940185546875, -0.005096435546875, 0.009777069091796875, 0.02465057373046875, 0.039524078369140625, 0.0543975830078125, 0.06927108764648438, 0.08414459228515625, 0.09901809692382812, 0.1138916015625, 0.12876510620117188, 0.14363861083984375, 0.15851211547851562, 0.1733856201171875, 0.18825912475585938, 0.20313262939453125, 0.21800613403320312, 0.232879638671875, 0.24775314331054688, 0.26262664794921875, 0.2775001525878906, 0.2923736572265625, 0.3072471618652344, 0.32212066650390625, 0.3369941711425781, 0.35186767578125, 0.3667411804199219, 0.38161468505859375, 0.3964881896972656, 0.4113616943359375, 0.4262351989746094, 0.44110870361328125, 0.4559822082519531, 0.470855712890625, 0.4857292175292969, 0.5006027221679688, 0.5154762268066406, 0.5303497314453125, 0.5452232360839844, 0.5600967407226562, 0.5749702453613281, 0.58984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 4.0, 12.0, 12.0, 14.0, 21.0, 33.0, 28.0, 34.0, 36.0, 53.0, 52.0, 55.0, 63.0, 63.0, 71.0, 51.0, 59.0, 63.0, 64.0, 43.0, 31.0, 35.0, 20.0, 16.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3700599670410156, -0.35462188720703125, -0.3391838073730469, -0.3237457275390625, -0.3083076477050781, -0.29286956787109375, -0.2774314880371094, -0.261993408203125, -0.24655532836914062, -0.23111724853515625, -0.21567916870117188, -0.2002410888671875, -0.18480300903320312, -0.16936492919921875, -0.15392684936523438, -0.13848876953125, -0.12305068969726562, -0.10761260986328125, -0.09217453002929688, -0.0767364501953125, -0.061298370361328125, -0.04586029052734375, -0.030422210693359375, -0.014984130859375, 0.000453948974609375, 0.01589202880859375, 0.031330108642578125, 0.0467681884765625, 0.062206268310546875, 0.07764434814453125, 0.09308242797851562, 0.1085205078125, 0.12395858764648438, 0.13939666748046875, 0.15483474731445312, 0.1702728271484375, 0.18571090698242188, 0.20114898681640625, 0.21658706665039062, 0.232025146484375, 0.24746322631835938, 0.26290130615234375, 0.2783393859863281, 0.2937774658203125, 0.3092155456542969, 0.32465362548828125, 0.3400917053222656, 0.35552978515625, 0.3709678649902344, 0.38640594482421875, 0.4018440246582031, 0.4172821044921875, 0.4327201843261719, 0.44815826416015625, 0.4635963439941406, 0.479034423828125, 0.4944725036621094, 0.5099105834960938, 0.5253486633300781, 0.5407867431640625, 0.5562248229980469, 0.5716629028320312, 0.5871009826660156, 0.6025390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 11.0, 4.0, 15.0, 19.0, 44.0, 79.0, 113.0, 262.0, 680.0, 1761.0, 7357.0, 48873.0, 796162.0, 170779.0, 17231.0, 3375.0, 999.0, 353.0, 199.0, 87.0, 56.0, 32.0, 21.0, 15.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.2087993621826172, -0.20177841186523438, -0.19475746154785156, -0.18773651123046875, -0.18071556091308594, -0.17369461059570312, -0.1666736602783203, -0.1596527099609375, -0.1526317596435547, -0.14561080932617188, -0.13858985900878906, -0.13156890869140625, -0.12454795837402344, -0.11752700805664062, -0.11050605773925781, -0.103485107421875, -0.09646415710449219, -0.08944320678710938, -0.08242225646972656, -0.07540130615234375, -0.06838035583496094, -0.061359405517578125, -0.05433845520019531, -0.0473175048828125, -0.04029655456542969, -0.033275604248046875, -0.026254653930664062, -0.01923370361328125, -0.012212753295898438, -0.005191802978515625, 0.0018291473388671875, 0.00885009765625, 0.015871047973632812, 0.022891998291015625, 0.029912948608398438, 0.03693389892578125, 0.04395484924316406, 0.050975799560546875, 0.05799674987792969, 0.0650177001953125, 0.07203865051269531, 0.07905960083007812, 0.08608055114746094, 0.09310150146484375, 0.10012245178222656, 0.10714340209960938, 0.11416435241699219, 0.121185302734375, 0.1282062530517578, 0.13522720336914062, 0.14224815368652344, 0.14926910400390625, 0.15629005432128906, 0.16331100463867188, 0.1703319549560547, 0.1773529052734375, 0.1843738555908203, 0.19139480590820312, 0.19841575622558594, 0.20543670654296875, 0.21245765686035156, 0.21947860717773438, 0.2264995574951172, 0.2335205078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 11.0, 17.0, 29.0, 44.0, 37.0, 68.0, 103.0, 135.0, 115.0, 106.0, 76.0, 63.0, 38.0, 27.0, 20.0, 15.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.349252700805664e-05, -7.15227797627449e-05, -6.955303251743317e-05, -6.758328527212143e-05, -6.561353802680969e-05, -6.364379078149796e-05, -6.167404353618622e-05, -5.970429629087448e-05, -5.7734549045562744e-05, -5.576480180025101e-05, -5.379505455493927e-05, -5.182530730962753e-05, -4.9855560064315796e-05, -4.788581281900406e-05, -4.591606557369232e-05, -4.3946318328380585e-05, -4.197657108306885e-05, -4.000682383775711e-05, -3.8037076592445374e-05, -3.6067329347133636e-05, -3.40975821018219e-05, -3.212783485651016e-05, -3.0158087611198425e-05, -2.8188340365886688e-05, -2.621859312057495e-05, -2.4248845875263214e-05, -2.2279098629951477e-05, -2.030935138463974e-05, -1.8339604139328003e-05, -1.6369856894016266e-05, -1.4400109648704529e-05, -1.2430362403392792e-05, -1.0460615158081055e-05, -8.490867912769318e-06, -6.5211206674575806e-06, -4.5513734221458435e-06, -2.5816261768341064e-06, -6.118789315223694e-07, 1.3578683137893677e-06, 3.3276155591011047e-06, 5.297362804412842e-06, 7.267110049724579e-06, 9.236857295036316e-06, 1.1206604540348053e-05, 1.317635178565979e-05, 1.5146099030971527e-05, 1.7115846276283264e-05, 1.9085593521595e-05, 2.1055340766906738e-05, 2.3025088012218475e-05, 2.4994835257530212e-05, 2.696458250284195e-05, 2.8934329748153687e-05, 3.0904076993465424e-05, 3.287382423877716e-05, 3.48435714840889e-05, 3.6813318729400635e-05, 3.878306597471237e-05, 4.075281322002411e-05, 4.2722560465335846e-05, 4.469230771064758e-05, 4.666205495595932e-05, 4.863180220127106e-05, 5.0601549446582794e-05, 5.257129669189453e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 6.0, 12.0, 14.0, 18.0, 33.0, 34.0, 52.0, 86.0, 115.0, 176.0, 279.0, 542.0, 1003.0, 2214.0, 5789.0, 21296.0, 139227.0, 743651.0, 106656.0, 18010.0, 5080.0, 1985.0, 928.0, 480.0, 288.0, 192.0, 120.0, 79.0, 52.0, 38.0, 23.0, 14.0, 13.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.159393310546875, -0.15447998046875, -0.149566650390625, -0.1446533203125, -0.139739990234375, -0.13482666015625, -0.129913330078125, -0.125, -0.120086669921875, -0.11517333984375, -0.110260009765625, -0.1053466796875, -0.100433349609375, -0.09552001953125, -0.090606689453125, -0.085693359375, -0.080780029296875, -0.07586669921875, -0.070953369140625, -0.0660400390625, -0.061126708984375, -0.05621337890625, -0.051300048828125, -0.04638671875, -0.041473388671875, -0.03656005859375, -0.031646728515625, -0.0267333984375, -0.021820068359375, -0.01690673828125, -0.011993408203125, -0.007080078125, -0.002166748046875, 0.00274658203125, 0.007659912109375, 0.0125732421875, 0.017486572265625, 0.02239990234375, 0.027313232421875, 0.0322265625, 0.037139892578125, 0.04205322265625, 0.046966552734375, 0.0518798828125, 0.056793212890625, 0.06170654296875, 0.066619873046875, 0.071533203125, 0.076446533203125, 0.08135986328125, 0.086273193359375, 0.0911865234375, 0.096099853515625, 0.10101318359375, 0.105926513671875, 0.11083984375, 0.115753173828125, 0.12066650390625, 0.125579833984375, 0.1304931640625, 0.135406494140625, 0.14031982421875, 0.145233154296875, 0.150146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 10.0, 14.0, 12.0, 17.0, 24.0, 30.0, 47.0, 52.0, 63.0, 97.0, 105.0, 93.0, 78.0, 70.0, 53.0, 46.0, 47.0, 25.0, 20.0, 19.0, 12.0, 8.0, 6.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.1360340118408203, -0.13193130493164062, -0.12782859802246094, -0.12372589111328125, -0.11962318420410156, -0.11552047729492188, -0.11141777038574219, -0.1073150634765625, -0.10321235656738281, -0.09910964965820312, -0.09500694274902344, -0.09090423583984375, -0.08680152893066406, -0.08269882202148438, -0.07859611511230469, -0.074493408203125, -0.07039070129394531, -0.06628799438476562, -0.06218528747558594, -0.05808258056640625, -0.05397987365722656, -0.049877166748046875, -0.04577445983886719, -0.0416717529296875, -0.03756904602050781, -0.033466339111328125, -0.029363632202148438, -0.02526092529296875, -0.021158218383789062, -0.017055511474609375, -0.012952804565429688, -0.00885009765625, -0.0047473907470703125, -0.000644683837890625, 0.0034580230712890625, 0.00756072998046875, 0.011663436889648438, 0.015766143798828125, 0.019868850708007812, 0.0239715576171875, 0.028074264526367188, 0.032176971435546875, 0.03627967834472656, 0.04038238525390625, 0.04448509216308594, 0.048587799072265625, 0.05269050598144531, 0.056793212890625, 0.06089591979980469, 0.06499862670898438, 0.06910133361816406, 0.07320404052734375, 0.07730674743652344, 0.08140945434570312, 0.08551216125488281, 0.0896148681640625, 0.09371757507324219, 0.09782028198242188, 0.10192298889160156, 0.10602569580078125, 0.11012840270996094, 0.11423110961914062, 0.11833381652832031, 0.1224365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 41.0, 164.0, 335.0, 262.0, 123.0, 29.0, 17.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.136778831481934, -3.963371753692627, -3.7899646759033203, -3.6165573596954346, -3.443150281906128, -3.2697432041168213, -3.0963358879089355, -2.922928810119629, -2.7495217323303223, -2.5761146545410156, -2.402707576751709, -2.2293002605438232, -2.0558931827545166, -1.88248610496521, -1.7090789079666138, -1.5356717109680176, -1.362264633178711, -1.1888575553894043, -1.015450358390808, -0.8420432209968567, -0.6686360836029053, -0.49522894620895386, -0.32182180881500244, -0.14841461181640625, 0.02499246597290039, 0.1983996033668518, 0.3718067407608032, 0.5452138781547546, 0.718621015548706, 0.8920281529426575, 1.0654352903366089, 1.238842487335205, 1.4122495651245117, 1.5856566429138184, 1.7590638399124146, 1.9324710369110107, 2.1058781147003174, 2.279285192489624, 2.4526925086975098, 2.6260995864868164, 2.799506664276123, 2.9729137420654297, 3.1463208198547363, 3.319728136062622, 3.4931352138519287, 3.6665422916412354, 3.839949607849121, 4.013356685638428, 4.186763763427734, 4.360170841217041, 4.533577919006348, 4.706984996795654, 4.880392074584961, 5.053799629211426, 5.227206707000732, 5.400613784790039, 5.574020862579346, 5.747427940368652, 5.920835018157959, 6.094242095947266, 6.2676496505737305, 6.441056728363037, 6.614463806152344, 6.78787088394165, 6.961277961730957]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 17.0, 21.0, 21.0, 39.0, 48.0, 51.0, 65.0, 70.0, 81.0, 104.0, 113.0, 89.0, 61.0, 60.0, 44.0, 35.0, 44.0, 15.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6194236278533936, -3.528352737426758, -3.437281608581543, -3.3462107181549072, -3.2551395893096924, -3.1640686988830566, -3.072997570037842, -2.981926679611206, -2.8908557891845703, -2.7997848987579346, -2.7087137699127197, -2.617642879486084, -2.526571750640869, -2.4355008602142334, -2.3444299697875977, -2.253358840942383, -2.162287712097168, -2.0712168216705322, -1.9801456928253174, -1.8890748023986816, -1.7980036735534668, -1.706932783126831, -1.6158617734909058, -1.5247907638549805, -1.4337197542190552, -1.3426487445831299, -1.2515777349472046, -1.1605067253112793, -1.0694358348846436, -0.9783647656440735, -0.887293815612793, -0.7962228059768677, -0.7051515579223633, -0.614080548286438, -0.5230095386505127, -0.4319385886192322, -0.3408675789833069, -0.2497965693473816, -0.15872561931610107, -0.06765460968017578, 0.02341639995574951, 0.11448739469051361, 0.2055583894252777, 0.2966293692588806, 0.3877003788948059, 0.4787713885307312, 0.5698423385620117, 0.660913348197937, 0.7519843578338623, 0.8430553674697876, 0.9341263771057129, 1.0251972675323486, 1.1162683963775635, 1.2073392868041992, 1.2984102964401245, 1.3894813060760498, 1.480552315711975, 1.5716233253479004, 1.6626943349838257, 1.753765344619751, 1.8448362350463867, 1.9359073638916016, 2.0269782543182373, 2.118049144744873, 2.209120273590088]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 9.0, 6.0, 8.0, 9.0, 16.0, 25.0, 29.0, 31.0, 36.0, 62.0, 98.0, 138.0, 339.0, 1109.0, 9359.0, 325397.0, 3809270.0, 43986.0, 3117.0, 575.0, 220.0, 124.0, 77.0, 59.0, 27.0, 33.0, 24.0, 20.0, 16.0, 10.0, 16.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.611328125, -0.5953521728515625, -0.579376220703125, -0.5634002685546875, -0.54742431640625, -0.5314483642578125, -0.515472412109375, -0.4994964599609375, -0.4835205078125, -0.4675445556640625, -0.451568603515625, -0.4355926513671875, -0.41961669921875, -0.4036407470703125, -0.387664794921875, -0.3716888427734375, -0.355712890625, -0.3397369384765625, -0.323760986328125, -0.3077850341796875, -0.29180908203125, -0.2758331298828125, -0.259857177734375, -0.2438812255859375, -0.2279052734375, -0.2119293212890625, -0.195953369140625, -0.1799774169921875, -0.16400146484375, -0.1480255126953125, -0.132049560546875, -0.1160736083984375, -0.10009765625, -0.0841217041015625, -0.068145751953125, -0.0521697998046875, -0.03619384765625, -0.0202178955078125, -0.004241943359375, 0.0117340087890625, 0.0277099609375, 0.0436859130859375, 0.059661865234375, 0.0756378173828125, 0.09161376953125, 0.1075897216796875, 0.123565673828125, 0.1395416259765625, 0.155517578125, 0.1714935302734375, 0.187469482421875, 0.2034454345703125, 0.21942138671875, 0.2353973388671875, 0.251373291015625, 0.2673492431640625, 0.2833251953125, 0.2993011474609375, 0.315277099609375, 0.3312530517578125, 0.34722900390625, 0.3632049560546875, 0.379180908203125, 0.3951568603515625, 0.4111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 9.0, 21.0, 29.0, 36.0, 49.0, 57.0, 80.0, 79.0, 73.0, 89.0, 81.0, 67.0, 74.0, 74.0, 50.0, 35.0, 32.0, 27.0, 13.0, 4.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1337890625, -0.129425048828125, -0.12506103515625, -0.120697021484375, -0.1163330078125, -0.111968994140625, -0.10760498046875, -0.103240966796875, -0.098876953125, -0.094512939453125, -0.09014892578125, -0.085784912109375, -0.0814208984375, -0.077056884765625, -0.07269287109375, -0.068328857421875, -0.06396484375, -0.059600830078125, -0.05523681640625, -0.050872802734375, -0.0465087890625, -0.042144775390625, -0.03778076171875, -0.033416748046875, -0.029052734375, -0.024688720703125, -0.02032470703125, -0.015960693359375, -0.0115966796875, -0.007232666015625, -0.00286865234375, 0.001495361328125, 0.005859375, 0.010223388671875, 0.01458740234375, 0.018951416015625, 0.0233154296875, 0.027679443359375, 0.03204345703125, 0.036407470703125, 0.040771484375, 0.045135498046875, 0.04949951171875, 0.053863525390625, 0.0582275390625, 0.062591552734375, 0.06695556640625, 0.071319580078125, 0.07568359375, 0.080047607421875, 0.08441162109375, 0.088775634765625, 0.0931396484375, 0.097503662109375, 0.10186767578125, 0.106231689453125, 0.110595703125, 0.114959716796875, 0.11932373046875, 0.123687744140625, 0.1280517578125, 0.132415771484375, 0.13677978515625, 0.141143798828125, 0.1455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 13.0, 16.0, 37.0, 43.0, 66.0, 112.0, 167.0, 278.0, 505.0, 931.0, 1610.0, 3202.0, 6636.0, 15095.0, 36881.0, 108313.0, 494897.0, 2557393.0, 746880.0, 141752.0, 45020.0, 18327.0, 8134.0, 3726.0, 1904.0, 998.0, 557.0, 273.0, 186.0, 100.0, 82.0, 49.0, 30.0, 16.0, 9.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16317176818847656, -0.15800857543945312, -0.1528453826904297, -0.14768218994140625, -0.1425189971923828, -0.13735580444335938, -0.13219261169433594, -0.1270294189453125, -0.12186622619628906, -0.11670303344726562, -0.11153984069824219, -0.10637664794921875, -0.10121345520019531, -0.09605026245117188, -0.09088706970214844, -0.085723876953125, -0.08056068420410156, -0.07539749145507812, -0.07023429870605469, -0.06507110595703125, -0.05990791320800781, -0.054744720458984375, -0.04958152770996094, -0.0444183349609375, -0.03925514221191406, -0.034091949462890625, -0.028928756713867188, -0.02376556396484375, -0.018602371215820312, -0.013439178466796875, -0.008275985717773438, -0.00311279296875, 0.0020503997802734375, 0.007213592529296875, 0.012376785278320312, 0.01753997802734375, 0.022703170776367188, 0.027866363525390625, 0.03302955627441406, 0.0381927490234375, 0.04335594177246094, 0.048519134521484375, 0.05368232727050781, 0.05884552001953125, 0.06400871276855469, 0.06917190551757812, 0.07433509826660156, 0.079498291015625, 0.08466148376464844, 0.08982467651367188, 0.09498786926269531, 0.10015106201171875, 0.10531425476074219, 0.11047744750976562, 0.11564064025878906, 0.1208038330078125, 0.12596702575683594, 0.13113021850585938, 0.1362934112548828, 0.14145660400390625, 0.1466197967529297, 0.15178298950195312, 0.15694618225097656, 0.162109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 17.0, 30.0, 41.0, 44.0, 62.0, 90.0, 147.0, 281.0, 464.0, 830.0, 806.0, 434.0, 291.0, 167.0, 97.0, 86.0, 34.0, 22.0, 27.0, 18.0, 8.0, 13.0, 6.0, 12.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.3057117462158203, -0.2972145080566406, -0.28871726989746094, -0.28022003173828125, -0.27172279357910156, -0.2632255554199219, -0.2547283172607422, -0.2462310791015625, -0.2377338409423828, -0.22923660278320312, -0.22073936462402344, -0.21224212646484375, -0.20374488830566406, -0.19524765014648438, -0.1867504119873047, -0.178253173828125, -0.1697559356689453, -0.16125869750976562, -0.15276145935058594, -0.14426422119140625, -0.13576698303222656, -0.12726974487304688, -0.11877250671386719, -0.1102752685546875, -0.10177803039550781, -0.09328079223632812, -0.08478355407714844, -0.07628631591796875, -0.06778907775878906, -0.059291839599609375, -0.05079460144042969, -0.04229736328125, -0.03380012512207031, -0.025302886962890625, -0.016805648803710938, -0.00830841064453125, 0.0001888275146484375, 0.008686065673828125, 0.017183303833007812, 0.0256805419921875, 0.03417778015136719, 0.042675018310546875, 0.05117225646972656, 0.05966949462890625, 0.06816673278808594, 0.07666397094726562, 0.08516120910644531, 0.093658447265625, 0.10215568542480469, 0.11065292358398438, 0.11915016174316406, 0.12764739990234375, 0.13614463806152344, 0.14464187622070312, 0.1531391143798828, 0.1616363525390625, 0.1701335906982422, 0.17863082885742188, 0.18712806701660156, 0.19562530517578125, 0.20412254333496094, 0.21261978149414062, 0.2211170196533203, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 7.0, 17.0, 51.0, 117.0, 229.0, 268.0, 168.0, 66.0, 37.0, 12.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4222029447555542, -1.3133485317230225, -1.2044942378997803, -1.0956398248672485, -0.9867854118347168, -0.8779309988021851, -0.7690766453742981, -0.6602222919464111, -0.5513678789138794, -0.44251349568367004, -0.3336591124534607, -0.22480472922325134, -0.11595034599304199, -0.007095932960510254, 0.10175842046737671, 0.21061277389526367, 0.3194671869277954, 0.42832157015800476, 0.5371759533882141, 0.6460303068161011, 0.7548847198486328, 0.8637391328811646, 0.9725934863090515, 1.0814478397369385, 1.1903022527694702, 1.299156665802002, 1.4080109596252441, 1.5168653726577759, 1.6257197856903076, 1.7345741987228394, 1.843428611755371, 1.9522829055786133, 2.0611371994018555, 2.1699914932250977, 2.278846025466919, 2.387700319290161, 2.4965548515319824, 2.6054091453552246, 2.714263439178467, 2.823117733001709, 2.9319722652435303, 3.0408265590667725, 3.1496810913085938, 3.258535385131836, 3.367389678955078, 3.4762442111968994, 3.5850985050201416, 3.693953037261963, 3.802807331085205, 3.9116616249084473, 4.0205159187316895, 4.12937068939209, 4.238224983215332, 4.347079277038574, 4.455933570861816, 4.564787864685059, 4.673642158508301, 4.782496452331543, 4.891350746154785, 5.0002055168151855, 5.109059810638428, 5.21791410446167, 5.326768398284912, 5.435622692108154, 5.544477462768555]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 13.0, 28.0, 26.0, 23.0, 42.0, 42.0, 35.0, 37.0, 45.0, 62.0, 42.0, 53.0, 54.0, 59.0, 52.0, 45.0, 45.0, 34.0, 38.0, 31.0, 35.0, 21.0, 24.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9469990730285645, -0.9092732667922974, -0.8715474009513855, -0.8338215351104736, -0.7960957288742065, -0.7583699226379395, -0.7206440567970276, -0.6829181909561157, -0.6451923847198486, -0.6074665784835815, -0.5697407126426697, -0.5320148468017578, -0.4942890405654907, -0.45656320452690125, -0.41883736848831177, -0.3811115324497223, -0.3433856964111328, -0.30565986037254333, -0.26793402433395386, -0.23020818829536438, -0.1924823522567749, -0.15475651621818542, -0.11703068017959595, -0.07930484414100647, -0.04157900810241699, -0.0038531720638275146, 0.03387266397476196, 0.07159850001335144, 0.10932433605194092, 0.1470501720905304, 0.18477600812911987, 0.22250184416770935, 0.2602275609970093, 0.29795339703559875, 0.33567923307418823, 0.3734050691127777, 0.4111309051513672, 0.44885674118995667, 0.48658257722854614, 0.524308443069458, 0.5620342493057251, 0.5997600555419922, 0.637485921382904, 0.6752117872238159, 0.712937593460083, 0.7506633996963501, 0.788389265537262, 0.8261151313781738, 0.8638409376144409, 0.901566743850708, 0.9392926096916199, 0.9770184755325317, 1.0147442817687988, 1.052470088005066, 1.090195894241333, 1.1279218196868896, 1.1656476259231567, 1.2033734321594238, 1.2410993576049805, 1.2788251638412476, 1.3165509700775146, 1.3542767763137817, 1.3920025825500488, 1.4297285079956055, 1.4674543142318726]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 13.0, 20.0, 28.0, 26.0, 49.0, 72.0, 112.0, 144.0, 193.0, 253.0, 397.0, 576.0, 800.0, 1336.0, 2035.0, 3374.0, 5562.0, 9557.0, 17194.0, 33672.0, 77692.0, 219479.0, 377279.0, 170936.0, 62596.0, 28404.0, 14864.0, 8407.0, 4967.0, 2925.0, 1857.0, 1155.0, 805.0, 572.0, 325.0, 244.0, 176.0, 123.0, 99.0, 70.0, 42.0, 28.0, 23.0, 23.0, 12.0, 9.0, 7.0, 1.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.14599609375, -0.1413440704345703, -0.13669204711914062, -0.13204002380371094, -0.12738800048828125, -0.12273597717285156, -0.11808395385742188, -0.11343193054199219, -0.1087799072265625, -0.10412788391113281, -0.09947586059570312, -0.09482383728027344, -0.09017181396484375, -0.08551979064941406, -0.08086776733398438, -0.07621574401855469, -0.071563720703125, -0.06691169738769531, -0.062259674072265625, -0.05760765075683594, -0.05295562744140625, -0.04830360412597656, -0.043651580810546875, -0.03899955749511719, -0.0343475341796875, -0.029695510864257812, -0.025043487548828125, -0.020391464233398438, -0.01573944091796875, -0.011087417602539062, -0.006435394287109375, -0.0017833709716796875, 0.00286865234375, 0.0075206756591796875, 0.012172698974609375, 0.016824722290039062, 0.02147674560546875, 0.026128768920898438, 0.030780792236328125, 0.03543281555175781, 0.0400848388671875, 0.04473686218261719, 0.049388885498046875, 0.05404090881347656, 0.05869293212890625, 0.06334495544433594, 0.06799697875976562, 0.07264900207519531, 0.077301025390625, 0.08195304870605469, 0.08660507202148438, 0.09125709533691406, 0.09590911865234375, 0.10056114196777344, 0.10521316528320312, 0.10986518859863281, 0.1145172119140625, 0.11916923522949219, 0.12382125854492188, 0.12847328186035156, 0.13312530517578125, 0.13777732849121094, 0.14242935180664062, 0.1470813751220703, 0.1517333984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 10.0, 9.0, 14.0, 5.0, 6.0, 23.0, 22.0, 21.0, 31.0, 20.0, 27.0, 34.0, 42.0, 28.0, 38.0, 33.0, 43.0, 48.0, 33.0, 44.0, 39.0, 39.0, 33.0, 42.0, 42.0, 41.0, 22.0, 31.0, 32.0, 19.0, 18.0, 16.0, 24.0, 13.0, 9.0, 9.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07855224609375, -0.07616043090820312, -0.07376861572265625, -0.07137680053710938, -0.0689849853515625, -0.06659317016601562, -0.06420135498046875, -0.061809539794921875, -0.059417724609375, -0.057025909423828125, -0.05463409423828125, -0.052242279052734375, -0.0498504638671875, -0.047458648681640625, -0.04506683349609375, -0.042675018310546875, -0.040283203125, -0.037891387939453125, -0.03549957275390625, -0.033107757568359375, -0.0307159423828125, -0.028324127197265625, -0.02593231201171875, -0.023540496826171875, -0.021148681640625, -0.018756866455078125, -0.01636505126953125, -0.013973236083984375, -0.0115814208984375, -0.009189605712890625, -0.00679779052734375, -0.004405975341796875, -0.00201416015625, 0.000377655029296875, 0.00276947021484375, 0.005161285400390625, 0.0075531005859375, 0.009944915771484375, 0.01233673095703125, 0.014728546142578125, 0.017120361328125, 0.019512176513671875, 0.02190399169921875, 0.024295806884765625, 0.0266876220703125, 0.029079437255859375, 0.03147125244140625, 0.033863067626953125, 0.0362548828125, 0.038646697998046875, 0.04103851318359375, 0.043430328369140625, 0.0458221435546875, 0.048213958740234375, 0.05060577392578125, 0.052997589111328125, 0.055389404296875, 0.057781219482421875, 0.06017303466796875, 0.06256484985351562, 0.0649566650390625, 0.06734848022460938, 0.06974029541015625, 0.07213211059570312, 0.07452392578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 12.0, 17.0, 24.0, 39.0, 75.0, 84.0, 183.0, 268.0, 582.0, 1233.0, 3071.0, 10459.0, 54765.0, 738060.0, 206203.0, 23930.0, 5775.0, 1953.0, 790.0, 425.0, 197.0, 127.0, 84.0, 55.0, 40.0, 20.0, 16.0, 18.0, 8.0, 12.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2634391784667969, -0.25075531005859375, -0.23807144165039062, -0.2253875732421875, -0.21270370483398438, -0.20001983642578125, -0.18733596801757812, -0.174652099609375, -0.16196823120117188, -0.14928436279296875, -0.13660049438476562, -0.1239166259765625, -0.11123275756835938, -0.09854888916015625, -0.08586502075195312, -0.07318115234375, -0.060497283935546875, -0.04781341552734375, -0.035129547119140625, -0.0224456787109375, -0.009761810302734375, 0.00292205810546875, 0.015605926513671875, 0.028289794921875, 0.040973663330078125, 0.05365753173828125, 0.06634140014648438, 0.0790252685546875, 0.09170913696289062, 0.10439300537109375, 0.11707687377929688, 0.1297607421875, 0.14244461059570312, 0.15512847900390625, 0.16781234741210938, 0.1804962158203125, 0.19318008422851562, 0.20586395263671875, 0.21854782104492188, 0.231231689453125, 0.24391555786132812, 0.25659942626953125, 0.2692832946777344, 0.2819671630859375, 0.2946510314941406, 0.30733489990234375, 0.3200187683105469, 0.33270263671875, 0.3453865051269531, 0.35807037353515625, 0.3707542419433594, 0.3834381103515625, 0.3961219787597656, 0.40880584716796875, 0.4214897155761719, 0.434173583984375, 0.4468574523925781, 0.45954132080078125, 0.4722251892089844, 0.4849090576171875, 0.4975929260253906, 0.5102767944335938, 0.5229606628417969, 0.53564453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 6.0, 9.0, 15.0, 18.0, 36.0, 54.0, 66.0, 82.0, 99.0, 88.0, 90.0, 98.0, 97.0, 59.0, 53.0, 37.0, 33.0, 19.0, 12.0, 6.0, 9.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67626953125, -0.6538238525390625, -0.631378173828125, -0.6089324951171875, -0.58648681640625, -0.5640411376953125, -0.541595458984375, -0.5191497802734375, -0.4967041015625, -0.4742584228515625, -0.451812744140625, -0.4293670654296875, -0.40692138671875, -0.3844757080078125, -0.362030029296875, -0.3395843505859375, -0.317138671875, -0.2946929931640625, -0.272247314453125, -0.2498016357421875, -0.22735595703125, -0.2049102783203125, -0.182464599609375, -0.1600189208984375, -0.1375732421875, -0.1151275634765625, -0.092681884765625, -0.0702362060546875, -0.04779052734375, -0.0253448486328125, -0.002899169921875, 0.0195465087890625, 0.0419921875, 0.0644378662109375, 0.086883544921875, 0.1093292236328125, 0.13177490234375, 0.1542205810546875, 0.176666259765625, 0.1991119384765625, 0.2215576171875, 0.2440032958984375, 0.266448974609375, 0.2888946533203125, 0.31134033203125, 0.3337860107421875, 0.356231689453125, 0.3786773681640625, 0.401123046875, 0.4235687255859375, 0.446014404296875, 0.4684600830078125, 0.49090576171875, 0.5133514404296875, 0.535797119140625, 0.5582427978515625, 0.5806884765625, 0.6031341552734375, 0.625579833984375, 0.6480255126953125, 0.67047119140625, 0.6929168701171875, 0.715362548828125, 0.7378082275390625, 0.76025390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 33.0, 59.0, 185.0, 851.0, 7793.0, 598194.0, 433227.0, 7016.0, 828.0, 205.0, 66.0, 33.0, 16.0, 9.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59765625, -0.5843696594238281, -0.5710830688476562, -0.5577964782714844, -0.5445098876953125, -0.5312232971191406, -0.5179367065429688, -0.5046501159667969, -0.491363525390625, -0.4780769348144531, -0.46479034423828125, -0.4515037536621094, -0.4382171630859375, -0.4249305725097656, -0.41164398193359375, -0.3983573913574219, -0.38507080078125, -0.3717842102050781, -0.35849761962890625, -0.3452110290527344, -0.3319244384765625, -0.3186378479003906, -0.30535125732421875, -0.2920646667480469, -0.278778076171875, -0.2654914855957031, -0.25220489501953125, -0.23891830444335938, -0.2256317138671875, -0.21234512329101562, -0.19905853271484375, -0.18577194213867188, -0.1724853515625, -0.15919876098632812, -0.14591217041015625, -0.13262557983398438, -0.1193389892578125, -0.10605239868164062, -0.09276580810546875, -0.07947921752929688, -0.066192626953125, -0.052906036376953125, -0.03961944580078125, -0.026332855224609375, -0.0130462646484375, 0.000240325927734375, 0.01352691650390625, 0.026813507080078125, 0.04010009765625, 0.053386688232421875, 0.06667327880859375, 0.07995986938476562, 0.0932464599609375, 0.10653305053710938, 0.11981964111328125, 0.13310623168945312, 0.146392822265625, 0.15967941284179688, 0.17296600341796875, 0.18625259399414062, 0.1995391845703125, 0.21282577514648438, 0.22611236572265625, 0.23939895629882812, 0.252685546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 5.0, 12.0, 12.0, 14.0, 26.0, 26.0, 53.0, 56.0, 68.0, 86.0, 80.0, 111.0, 83.0, 78.0, 57.0, 53.0, 46.0, 26.0, 20.0, 16.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3752603232860565e-05, -4.2265281081199646e-05, -4.077795892953873e-05, -3.929063677787781e-05, -3.780331462621689e-05, -3.631599247455597e-05, -3.482867032289505e-05, -3.334134817123413e-05, -3.185402601957321e-05, -3.0366703867912292e-05, -2.8879381716251373e-05, -2.7392059564590454e-05, -2.5904737412929535e-05, -2.4417415261268616e-05, -2.2930093109607697e-05, -2.1442770957946777e-05, -1.9955448806285858e-05, -1.846812665462494e-05, -1.698080450296402e-05, -1.54934823513031e-05, -1.4006160199642181e-05, -1.2518838047981262e-05, -1.1031515896320343e-05, -9.544193744659424e-06, -8.056871592998505e-06, -6.5695494413375854e-06, -5.082227289676666e-06, -3.594905138015747e-06, -2.107582986354828e-06, -6.202608346939087e-07, 8.670613169670105e-07, 2.3543834686279297e-06, 3.841705620288849e-06, 5.329027771949768e-06, 6.816349923610687e-06, 8.303672075271606e-06, 9.790994226932526e-06, 1.1278316378593445e-05, 1.2765638530254364e-05, 1.4252960681915283e-05, 1.5740282833576202e-05, 1.722760498523712e-05, 1.871492713689804e-05, 2.020224928855896e-05, 2.168957144021988e-05, 2.31768935918808e-05, 2.4664215743541718e-05, 2.6151537895202637e-05, 2.7638860046863556e-05, 2.9126182198524475e-05, 3.0613504350185394e-05, 3.2100826501846313e-05, 3.358814865350723e-05, 3.507547080516815e-05, 3.656279295682907e-05, 3.805011510848999e-05, 3.953743726015091e-05, 4.102475941181183e-05, 4.251208156347275e-05, 4.399940371513367e-05, 4.5486725866794586e-05, 4.6974048018455505e-05, 4.8461370170116425e-05, 4.9948692321777344e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 15.0, 24.0, 38.0, 74.0, 151.0, 397.0, 1116.0, 4217.0, 32495.0, 750465.0, 242114.0, 13730.0, 2386.0, 768.0, 269.0, 115.0, 77.0, 39.0, 20.0, 7.0, 6.0, 6.0, 0.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.320068359375, -0.3122272491455078, -0.3043861389160156, -0.29654502868652344, -0.28870391845703125, -0.28086280822753906, -0.2730216979980469, -0.2651805877685547, -0.2573394775390625, -0.2494983673095703, -0.24165725708007812, -0.23381614685058594, -0.22597503662109375, -0.21813392639160156, -0.21029281616210938, -0.2024517059326172, -0.194610595703125, -0.1867694854736328, -0.17892837524414062, -0.17108726501464844, -0.16324615478515625, -0.15540504455566406, -0.14756393432617188, -0.1397228240966797, -0.1318817138671875, -0.12404060363769531, -0.11619949340820312, -0.10835838317871094, -0.10051727294921875, -0.09267616271972656, -0.08483505249023438, -0.07699394226074219, -0.06915283203125, -0.06131172180175781, -0.053470611572265625, -0.04562950134277344, -0.03778839111328125, -0.029947280883789062, -0.022106170654296875, -0.014265060424804688, -0.0064239501953125, 0.0014171600341796875, 0.009258270263671875, 0.017099380493164062, 0.02494049072265625, 0.03278160095214844, 0.040622711181640625, 0.04846382141113281, 0.056304931640625, 0.06414604187011719, 0.07198715209960938, 0.07982826232910156, 0.08766937255859375, 0.09551048278808594, 0.10335159301757812, 0.11119270324707031, 0.1190338134765625, 0.1268749237060547, 0.13471603393554688, 0.14255714416503906, 0.15039825439453125, 0.15823936462402344, 0.16608047485351562, 0.1739215850830078, 0.1817626953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 11.0, 19.0, 32.0, 44.0, 49.0, 98.0, 158.0, 165.0, 144.0, 104.0, 69.0, 51.0, 20.0, 15.0, 11.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.364990234375, -0.35746288299560547, -0.34993553161621094, -0.3424081802368164, -0.3348808288574219, -0.32735347747802734, -0.3198261260986328, -0.3122987747192383, -0.30477142333984375, -0.2972440719604492, -0.2897167205810547, -0.28218936920166016, -0.2746620178222656, -0.2671346664428711, -0.25960731506347656, -0.25207996368408203, -0.2445526123046875, -0.23702526092529297, -0.22949790954589844, -0.2219705581665039, -0.21444320678710938, -0.20691585540771484, -0.1993885040283203, -0.19186115264892578, -0.18433380126953125, -0.17680644989013672, -0.1692790985107422, -0.16175174713134766, -0.15422439575195312, -0.1466970443725586, -0.13916969299316406, -0.13164234161376953, -0.124114990234375, -0.11658763885498047, -0.10906028747558594, -0.1015329360961914, -0.09400558471679688, -0.08647823333740234, -0.07895088195800781, -0.07142353057861328, -0.06389617919921875, -0.05636882781982422, -0.04884147644042969, -0.041314125061035156, -0.033786773681640625, -0.026259422302246094, -0.018732070922851562, -0.011204719543457031, -0.0036773681640625, 0.0038499832153320312, 0.011377334594726562, 0.018904685974121094, 0.026432037353515625, 0.033959388732910156, 0.04148674011230469, 0.04901409149169922, 0.05654144287109375, 0.06406879425048828, 0.07159614562988281, 0.07912349700927734, 0.08665084838867188, 0.0941781997680664, 0.10170555114746094, 0.10923290252685547, 0.11676025390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 13.0, 35.0, 93.0, 210.0, 304.0, 192.0, 92.0, 27.0, 8.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023674011230469, -3.8949646949768066, -3.7662553787231445, -3.6375458240509033, -3.508836507797241, -3.380127191543579, -3.251417636871338, -3.122708320617676, -2.9939990043640137, -2.8652896881103516, -2.7365803718566895, -2.6078708171844482, -2.479161500930786, -2.350452184677124, -2.221742630004883, -2.0930333137512207, -1.9643239974975586, -1.8356146812438965, -1.7069052457809448, -1.5781958103179932, -1.449486494064331, -1.320777177810669, -1.1920677423477173, -1.0633583068847656, -0.9346489906311035, -0.8059396147727966, -0.6772302389144897, -0.5485208630561829, -0.419811487197876, -0.2911021113395691, -0.1623927354812622, -0.03368335962295532, 0.09502649307250977, 0.22373586893081665, 0.35244524478912354, 0.4811546206474304, 0.6098639965057373, 0.7385733723640442, 0.8672827482223511, 0.995992124080658, 1.1247014999389648, 1.253410816192627, 1.3821202516555786, 1.5108296871185303, 1.6395390033721924, 1.7682483196258545, 1.8969577550888062, 2.025667190551758, 2.15437650680542, 2.283085823059082, 2.411795139312744, 2.5405046939849854, 2.6692140102386475, 2.7979233264923096, 2.926632881164551, 3.055342197418213, 3.184051513671875, 3.312760829925537, 3.441470146179199, 3.5701797008514404, 3.6988890171051025, 3.8275983333587646, 3.956307888031006, 4.085017204284668, 4.21372652053833]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 15.0, 11.0, 17.0, 41.0, 50.0, 63.0, 72.0, 99.0, 130.0, 131.0, 83.0, 73.0, 61.0, 55.0, 47.0, 23.0, 16.0, 10.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6359992027282715, -4.5257887840271, -4.415578365325928, -4.305367946624756, -4.195158004760742, -4.08494758605957, -3.9747371673583984, -3.8645267486572266, -3.7543163299560547, -3.644105911254883, -3.53389573097229, -3.423685312271118, -3.3134748935699463, -3.2032647132873535, -3.0930542945861816, -2.9828438758850098, -2.872633457183838, -2.762423038482666, -2.6522128582000732, -2.5420024394989014, -2.4317920207977295, -2.3215818405151367, -2.211371421813965, -2.101161003112793, -1.9909508228302002, -1.8807405233383179, -1.770530104637146, -1.6603198051452637, -1.5501093864440918, -1.4398990869522095, -1.3296887874603271, -1.2194783687591553, -1.1092679500579834, -0.9990575909614563, -0.8888472318649292, -0.7786369323730469, -0.668426513671875, -0.5582162141799927, -0.4480058550834656, -0.3377954959869385, -0.22758513689041138, -0.11737478524446487, -0.007164433598518372, 0.10304591059684753, 0.21325626969337463, 0.32346659898757935, 0.43367695808410645, 0.5438873171806335, 0.6540976762771606, 0.7643080353736877, 0.8745183944702148, 0.9847286939620972, 1.094939112663269, 1.2051494121551514, 1.3153598308563232, 1.4255701303482056, 1.535780429840088, 1.6459907293319702, 1.756201148033142, 1.8664114475250244, 1.9766218662261963, 2.086832046508789, 2.197042465209961, 2.307252883911133, 2.4174633026123047]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 2.0, 11.0, 8.0, 6.0, 6.0, 11.0, 11.0, 24.0, 33.0, 24.0, 58.0, 113.0, 190.0, 431.0, 1113.0, 3272.0, 11563.0, 51879.0, 378248.0, 2759825.0, 863088.0, 96486.0, 19437.0, 5417.0, 1812.0, 672.0, 307.0, 123.0, 57.0, 19.0, 12.0, 6.0, 3.0, 2.0], "bins": [-0.32177734375, -0.31529903411865234, -0.3088207244873047, -0.30234241485595703, -0.2958641052246094, -0.2893857955932617, -0.28290748596191406, -0.2764291763305664, -0.26995086669921875, -0.2634725570678711, -0.25699424743652344, -0.2505159378051758, -0.24403762817382812, -0.23755931854248047, -0.2310810089111328, -0.22460269927978516, -0.2181243896484375, -0.21164608001708984, -0.2051677703857422, -0.19868946075439453, -0.19221115112304688, -0.18573284149169922, -0.17925453186035156, -0.1727762222290039, -0.16629791259765625, -0.1598196029663086, -0.15334129333496094, -0.14686298370361328, -0.14038467407226562, -0.13390636444091797, -0.1274280548095703, -0.12094974517822266, -0.114471435546875, -0.10799312591552734, -0.10151481628417969, -0.09503650665283203, -0.08855819702148438, -0.08207988739013672, -0.07560157775878906, -0.0691232681274414, -0.06264495849609375, -0.056166648864746094, -0.04968833923339844, -0.04321002960205078, -0.036731719970703125, -0.03025341033935547, -0.023775100708007812, -0.017296791076660156, -0.0108184814453125, -0.004340171813964844, 0.0021381378173828125, 0.008616447448730469, 0.015094757080078125, 0.02157306671142578, 0.028051376342773438, 0.034529685974121094, 0.04100799560546875, 0.047486305236816406, 0.05396461486816406, 0.06044292449951172, 0.06692123413085938, 0.07339954376220703, 0.07987785339355469, 0.08635616302490234, 0.09283447265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 11.0, 18.0, 40.0, 69.0, 108.0, 153.0, 153.0, 142.0, 118.0, 101.0, 47.0, 38.0, 9.0, 5.0, 3.0], "bins": [-0.47119140625, -0.46272754669189453, -0.45426368713378906, -0.4457998275756836, -0.4373359680175781, -0.42887210845947266, -0.4204082489013672, -0.4119443893432617, -0.40348052978515625, -0.3950166702270508, -0.3865528106689453, -0.37808895111083984, -0.3696250915527344, -0.3611612319946289, -0.35269737243652344, -0.34423351287841797, -0.3357696533203125, -0.32730579376220703, -0.31884193420410156, -0.3103780746459961, -0.3019142150878906, -0.29345035552978516, -0.2849864959716797, -0.2765226364135742, -0.26805877685546875, -0.2595949172973633, -0.2511310577392578, -0.24266719818115234, -0.23420333862304688, -0.2257394790649414, -0.21727561950683594, -0.20881175994873047, -0.200347900390625, -0.19188404083251953, -0.18342018127441406, -0.1749563217163086, -0.16649246215820312, -0.15802860260009766, -0.1495647430419922, -0.14110088348388672, -0.13263702392578125, -0.12417316436767578, -0.11570930480957031, -0.10724544525146484, -0.09878158569335938, -0.0903177261352539, -0.08185386657714844, -0.07339000701904297, -0.0649261474609375, -0.05646228790283203, -0.04799842834472656, -0.039534568786621094, -0.031070709228515625, -0.022606849670410156, -0.014142990112304688, -0.005679130554199219, 0.00278472900390625, 0.011248588562011719, 0.019712448120117188, 0.028176307678222656, 0.036640167236328125, 0.045104026794433594, 0.05356788635253906, 0.06203174591064453, 0.07049560546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 17.0, 13.0, 24.0, 29.0, 43.0, 55.0, 96.0, 161.0, 235.0, 414.0, 766.0, 1653.0, 3659.0, 9039.0, 24612.0, 77224.0, 302937.0, 1847317.0, 1559236.0, 260281.0, 68791.0, 22217.0, 8402.0, 3320.0, 1601.0, 830.0, 469.0, 252.0, 173.0, 129.0, 80.0, 46.0, 45.0, 26.0, 26.0, 12.0, 6.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.19482421875, -0.18924903869628906, -0.18367385864257812, -0.1780986785888672, -0.17252349853515625, -0.1669483184814453, -0.16137313842773438, -0.15579795837402344, -0.1502227783203125, -0.14464759826660156, -0.13907241821289062, -0.1334972381591797, -0.12792205810546875, -0.12234687805175781, -0.11677169799804688, -0.11119651794433594, -0.105621337890625, -0.10004615783691406, -0.09447097778320312, -0.08889579772949219, -0.08332061767578125, -0.07774543762207031, -0.07217025756835938, -0.06659507751464844, -0.0610198974609375, -0.05544471740722656, -0.049869537353515625, -0.04429435729980469, -0.03871917724609375, -0.03314399719238281, -0.027568817138671875, -0.021993637084960938, -0.01641845703125, -0.010843276977539062, -0.005268096923828125, 0.0003070831298828125, 0.00588226318359375, 0.011457443237304688, 0.017032623291015625, 0.022607803344726562, 0.0281829833984375, 0.03375816345214844, 0.039333343505859375, 0.04490852355957031, 0.05048370361328125, 0.05605888366699219, 0.061634063720703125, 0.06720924377441406, 0.072784423828125, 0.07835960388183594, 0.08393478393554688, 0.08950996398925781, 0.09508514404296875, 0.10066032409667969, 0.10623550415039062, 0.11181068420410156, 0.1173858642578125, 0.12296104431152344, 0.12853622436523438, 0.1341114044189453, 0.13968658447265625, 0.1452617645263672, 0.15083694458007812, 0.15641212463378906, 0.1619873046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 19.0, 16.0, 26.0, 29.0, 43.0, 49.0, 70.0, 102.0, 135.0, 185.0, 298.0, 434.0, 505.0, 563.0, 476.0, 322.0, 198.0, 172.0, 98.0, 89.0, 55.0, 39.0, 35.0, 30.0, 18.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.22426414489746094, -0.21598434448242188, -0.2077045440673828, -0.19942474365234375, -0.1911449432373047, -0.18286514282226562, -0.17458534240722656, -0.1663055419921875, -0.15802574157714844, -0.14974594116210938, -0.1414661407470703, -0.13318634033203125, -0.12490653991699219, -0.11662673950195312, -0.10834693908691406, -0.100067138671875, -0.09178733825683594, -0.08350753784179688, -0.07522773742675781, -0.06694793701171875, -0.05866813659667969, -0.050388336181640625, -0.04210853576660156, -0.0338287353515625, -0.025548934936523438, -0.017269134521484375, -0.008989334106445312, -0.00070953369140625, 0.0075702667236328125, 0.015850067138671875, 0.024129867553710938, 0.03240966796875, 0.04068946838378906, 0.048969268798828125, 0.05724906921386719, 0.06552886962890625, 0.07380867004394531, 0.08208847045898438, 0.09036827087402344, 0.0986480712890625, 0.10692787170410156, 0.11520767211914062, 0.12348747253417969, 0.13176727294921875, 0.1400470733642578, 0.14832687377929688, 0.15660667419433594, 0.164886474609375, 0.17316627502441406, 0.18144607543945312, 0.1897258758544922, 0.19800567626953125, 0.2062854766845703, 0.21456527709960938, 0.22284507751464844, 0.2311248779296875, 0.23940467834472656, 0.24768447875976562, 0.2559642791748047, 0.26424407958984375, 0.2725238800048828, 0.2808036804199219, 0.28908348083496094, 0.29736328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 20.0, 40.0, 181.0, 302.0, 241.0, 120.0, 40.0, 21.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.394401788711548, -2.241150379180908, -2.0878992080688477, -1.934647798538208, -1.781396508216858, -1.6281452178955078, -1.4748938083648682, -1.321642518043518, -1.168391227722168, -1.0151399374008179, -0.861888587474823, -0.7086372375488281, -0.555385947227478, -0.40213465690612793, -0.24888330698013306, -0.09563195705413818, 0.057619333267211914, 0.2108706533908844, 0.3641219735145569, 0.5173733234405518, 0.6706246137619019, 0.823875904083252, 0.9771272540092468, 1.1303786039352417, 1.2836298942565918, 1.436881184577942, 1.590132474899292, 1.7433838844299316, 1.8966351747512817, 2.049886465072632, 2.2031378746032715, 2.356389045715332, 2.509640693664551, 2.6628921031951904, 2.816143274307251, 2.9693946838378906, 3.122645854949951, 3.275897264480591, 3.4291486740112305, 3.582399845123291, 3.7356512546539307, 3.8889026641845703, 4.042153835296631, 4.195405006408691, 4.34865665435791, 4.501907825469971, 4.655158996582031, 4.80841064453125, 4.9616618156433105, 5.114912986755371, 5.26816463470459, 5.42141580581665, 5.574666976928711, 5.72791862487793, 5.88116979598999, 6.034420967102051, 6.1876726150512695, 6.34092378616333, 6.494175434112549, 6.647426605224609, 6.80067777633667, 6.9539289474487305, 7.107180595397949, 7.26043176651001, 7.41368293762207]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 13.0, 10.0, 16.0, 27.0, 42.0, 53.0, 65.0, 73.0, 76.0, 98.0, 94.0, 97.0, 70.0, 64.0, 54.0, 48.0, 39.0, 20.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4143567085266113, -1.3306742906570435, -1.2469918727874756, -1.1633094549179077, -1.0796270370483398, -0.995944619178772, -0.9122622013092041, -0.8285797834396362, -0.7448973655700684, -0.6612149477005005, -0.5775325298309326, -0.49385011196136475, -0.4101676940917969, -0.326485276222229, -0.24280285835266113, -0.15912044048309326, -0.07543802261352539, 0.00824439525604248, 0.09192681312561035, 0.17560923099517822, 0.2592916488647461, 0.34297406673431396, 0.42665648460388184, 0.5103389024734497, 0.5940213203430176, 0.6777037382125854, 0.7613861560821533, 0.8450685739517212, 0.9287509918212891, 1.012433409690857, 1.0961158275604248, 1.1797982454299927, 1.2634809017181396, 1.3471633195877075, 1.4308457374572754, 1.5145281553268433, 1.5982105731964111, 1.681892991065979, 1.7655754089355469, 1.8492578268051147, 1.9329402446746826, 2.016622543334961, 2.1003050804138184, 2.183987617492676, 2.267669916152954, 2.3513522148132324, 2.43503475189209, 2.5187172889709473, 2.6023995876312256, 2.686081886291504, 2.7697644233703613, 2.8534469604492188, 2.937129259109497, 3.0208115577697754, 3.104494094848633, 3.1881766319274902, 3.2718589305877686, 3.355541229248047, 3.4392237663269043, 3.5229063034057617, 3.60658860206604, 3.6902709007263184, 3.773953437805176, 3.857635974884033, 3.9413182735443115]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 12.0, 10.0, 22.0, 30.0, 39.0, 57.0, 106.0, 181.0, 243.0, 389.0, 549.0, 837.0, 1346.0, 2054.0, 3260.0, 5057.0, 8182.0, 13241.0, 21684.0, 36856.0, 64947.0, 128402.0, 264975.0, 239516.0, 111804.0, 58508.0, 33747.0, 19904.0, 11959.0, 7610.0, 4655.0, 2942.0, 1968.0, 1201.0, 792.0, 483.0, 369.0, 210.0, 128.0, 109.0, 52.0, 42.0, 29.0, 15.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1435546875, -0.1391925811767578, -0.13483047485351562, -0.13046836853027344, -0.12610626220703125, -0.12174415588378906, -0.11738204956054688, -0.11301994323730469, -0.1086578369140625, -0.10429573059082031, -0.09993362426757812, -0.09557151794433594, -0.09120941162109375, -0.08684730529785156, -0.08248519897460938, -0.07812309265136719, -0.073760986328125, -0.06939888000488281, -0.06503677368164062, -0.06067466735839844, -0.05631256103515625, -0.05195045471191406, -0.047588348388671875, -0.04322624206542969, -0.0388641357421875, -0.03450202941894531, -0.030139923095703125, -0.025777816772460938, -0.02141571044921875, -0.017053604125976562, -0.012691497802734375, -0.008329391479492188, -0.00396728515625, 0.0003948211669921875, 0.004756927490234375, 0.009119033813476562, 0.01348114013671875, 0.017843246459960938, 0.022205352783203125, 0.026567459106445312, 0.0309295654296875, 0.03529167175292969, 0.039653778076171875, 0.04401588439941406, 0.04837799072265625, 0.05274009704589844, 0.057102203369140625, 0.06146430969238281, 0.065826416015625, 0.07018852233886719, 0.07455062866210938, 0.07891273498535156, 0.08327484130859375, 0.08763694763183594, 0.09199905395507812, 0.09636116027832031, 0.1007232666015625, 0.10508537292480469, 0.10944747924804688, 0.11380958557128906, 0.11817169189453125, 0.12253379821777344, 0.12689590454101562, 0.1312580108642578, 0.1356201171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 11.0, 12.0, 16.0, 23.0, 33.0, 45.0, 45.0, 57.0, 62.0, 59.0, 68.0, 71.0, 68.0, 61.0, 60.0, 45.0, 55.0, 47.0, 41.0, 27.0, 26.0, 22.0, 16.0, 12.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15185260772705078, -0.14794349670410156, -0.14403438568115234, -0.14012527465820312, -0.1362161636352539, -0.1323070526123047, -0.12839794158935547, -0.12448883056640625, -0.12057971954345703, -0.11667060852050781, -0.1127614974975586, -0.10885238647460938, -0.10494327545166016, -0.10103416442871094, -0.09712505340576172, -0.0932159423828125, -0.08930683135986328, -0.08539772033691406, -0.08148860931396484, -0.07757949829101562, -0.0736703872680664, -0.06976127624511719, -0.06585216522216797, -0.06194305419921875, -0.05803394317626953, -0.05412483215332031, -0.050215721130371094, -0.046306610107421875, -0.042397499084472656, -0.03848838806152344, -0.03457927703857422, -0.030670166015625, -0.02676105499267578, -0.022851943969726562, -0.018942832946777344, -0.015033721923828125, -0.011124610900878906, -0.0072154998779296875, -0.0033063888549804688, 0.00060272216796875, 0.004511833190917969, 0.008420944213867188, 0.012330055236816406, 0.016239166259765625, 0.020148277282714844, 0.024057388305664062, 0.02796649932861328, 0.0318756103515625, 0.03578472137451172, 0.03969383239746094, 0.043602943420410156, 0.047512054443359375, 0.051421165466308594, 0.05533027648925781, 0.05923938751220703, 0.06314849853515625, 0.06705760955810547, 0.07096672058105469, 0.0748758316040039, 0.07878494262695312, 0.08269405364990234, 0.08660316467285156, 0.09051227569580078, 0.09442138671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 8.0, 10.0, 14.0, 17.0, 16.0, 18.0, 29.0, 48.0, 59.0, 83.0, 96.0, 140.0, 228.0, 374.0, 558.0, 950.0, 1706.0, 3625.0, 9569.0, 34355.0, 210116.0, 687107.0, 71763.0, 16416.0, 5414.0, 2414.0, 1234.0, 765.0, 448.0, 251.0, 189.0, 161.0, 95.0, 77.0, 56.0, 49.0, 24.0, 26.0, 12.0, 12.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.45166015625, -0.4380683898925781, -0.42447662353515625, -0.4108848571777344, -0.3972930908203125, -0.3837013244628906, -0.37010955810546875, -0.3565177917480469, -0.342926025390625, -0.3293342590332031, -0.31574249267578125, -0.3021507263183594, -0.2885589599609375, -0.2749671936035156, -0.26137542724609375, -0.24778366088867188, -0.23419189453125, -0.22060012817382812, -0.20700836181640625, -0.19341659545898438, -0.1798248291015625, -0.16623306274414062, -0.15264129638671875, -0.13904953002929688, -0.125457763671875, -0.11186599731445312, -0.09827423095703125, -0.08468246459960938, -0.0710906982421875, -0.057498931884765625, -0.04390716552734375, -0.030315399169921875, -0.0167236328125, -0.003131866455078125, 0.01045989990234375, 0.024051666259765625, 0.0376434326171875, 0.051235198974609375, 0.06482696533203125, 0.07841873168945312, 0.092010498046875, 0.10560226440429688, 0.11919403076171875, 0.13278579711914062, 0.1463775634765625, 0.15996932983398438, 0.17356109619140625, 0.18715286254882812, 0.20074462890625, 0.21433639526367188, 0.22792816162109375, 0.24151992797851562, 0.2551116943359375, 0.2687034606933594, 0.28229522705078125, 0.2958869934082031, 0.309478759765625, 0.3230705261230469, 0.33666229248046875, 0.3502540588378906, 0.3638458251953125, 0.3774375915527344, 0.39102935791015625, 0.4046211242675781, 0.418212890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 10.0, 16.0, 19.0, 21.0, 28.0, 37.0, 39.0, 35.0, 39.0, 38.0, 44.0, 57.0, 45.0, 51.0, 66.0, 54.0, 51.0, 50.0, 38.0, 33.0, 32.0, 29.0, 22.0, 23.0, 13.0, 26.0, 18.0, 10.0, 5.0, 8.0, 9.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.53515625, -0.5210113525390625, -0.506866455078125, -0.4927215576171875, -0.47857666015625, -0.4644317626953125, -0.450286865234375, -0.4361419677734375, -0.4219970703125, -0.4078521728515625, -0.393707275390625, -0.3795623779296875, -0.36541748046875, -0.3512725830078125, -0.337127685546875, -0.3229827880859375, -0.308837890625, -0.2946929931640625, -0.280548095703125, -0.2664031982421875, -0.25225830078125, -0.2381134033203125, -0.223968505859375, -0.2098236083984375, -0.1956787109375, -0.1815338134765625, -0.167388916015625, -0.1532440185546875, -0.13909912109375, -0.1249542236328125, -0.110809326171875, -0.0966644287109375, -0.08251953125, -0.0683746337890625, -0.054229736328125, -0.0400848388671875, -0.02593994140625, -0.0117950439453125, 0.002349853515625, 0.0164947509765625, 0.0306396484375, 0.0447845458984375, 0.058929443359375, 0.0730743408203125, 0.08721923828125, 0.1013641357421875, 0.115509033203125, 0.1296539306640625, 0.143798828125, 0.1579437255859375, 0.172088623046875, 0.1862335205078125, 0.20037841796875, 0.2145233154296875, 0.228668212890625, 0.2428131103515625, 0.2569580078125, 0.2711029052734375, 0.285247802734375, 0.2993927001953125, 0.31353759765625, 0.3276824951171875, 0.341827392578125, 0.3559722900390625, 0.3701171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 10.0, 20.0, 33.0, 48.0, 62.0, 137.0, 283.0, 570.0, 1442.0, 4207.0, 16318.0, 96492.0, 742118.0, 154433.0, 23484.0, 5589.0, 1825.0, 764.0, 336.0, 163.0, 86.0, 46.0, 30.0, 20.0, 7.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24821090698242188, -0.24178314208984375, -0.23535537719726562, -0.2289276123046875, -0.22249984741210938, -0.21607208251953125, -0.20964431762695312, -0.203216552734375, -0.19678878784179688, -0.19036102294921875, -0.18393325805664062, -0.1775054931640625, -0.17107772827148438, -0.16464996337890625, -0.15822219848632812, -0.15179443359375, -0.14536666870117188, -0.13893890380859375, -0.13251113891601562, -0.1260833740234375, -0.11965560913085938, -0.11322784423828125, -0.10680007934570312, -0.100372314453125, -0.09394454956054688, -0.08751678466796875, -0.08108901977539062, -0.0746612548828125, -0.06823348999023438, -0.06180572509765625, -0.055377960205078125, -0.0489501953125, -0.042522430419921875, -0.03609466552734375, -0.029666900634765625, -0.0232391357421875, -0.016811370849609375, -0.01038360595703125, -0.003955841064453125, 0.002471923828125, 0.008899688720703125, 0.01532745361328125, 0.021755218505859375, 0.0281829833984375, 0.034610748291015625, 0.04103851318359375, 0.047466278076171875, 0.05389404296875, 0.060321807861328125, 0.06674957275390625, 0.07317733764648438, 0.0796051025390625, 0.08603286743164062, 0.09246063232421875, 0.09888839721679688, 0.105316162109375, 0.11174392700195312, 0.11817169189453125, 0.12459945678710938, 0.1310272216796875, 0.13745498657226562, 0.14388275146484375, 0.15031051635742188, 0.15673828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 15.0, 16.0, 14.0, 17.0, 22.0, 30.0, 37.0, 33.0, 59.0, 70.0, 75.0, 86.0, 75.0, 84.0, 53.0, 54.0, 43.0, 26.0, 30.0, 20.0, 19.0, 13.0, 8.0, 9.0, 8.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8683414459228516e-05, -3.7243589758872986e-05, -3.5803765058517456e-05, -3.4363940358161926e-05, -3.2924115657806396e-05, -3.148429095745087e-05, -3.0044466257095337e-05, -2.8604641556739807e-05, -2.7164816856384277e-05, -2.5724992156028748e-05, -2.4285167455673218e-05, -2.2845342755317688e-05, -2.1405518054962158e-05, -1.996569335460663e-05, -1.85258686542511e-05, -1.708604395389557e-05, -1.564621925354004e-05, -1.420639455318451e-05, -1.276656985282898e-05, -1.132674515247345e-05, -9.88692045211792e-06, -8.44709575176239e-06, -7.00727105140686e-06, -5.5674463510513306e-06, -4.127621650695801e-06, -2.687796950340271e-06, -1.2479722499847412e-06, 1.9185245037078857e-07, 1.6316771507263184e-06, 3.071501851081848e-06, 4.511326551437378e-06, 5.951151251792908e-06, 7.3909759521484375e-06, 8.830800652503967e-06, 1.0270625352859497e-05, 1.1710450053215027e-05, 1.3150274753570557e-05, 1.4590099453926086e-05, 1.6029924154281616e-05, 1.7469748854637146e-05, 1.8909573554992676e-05, 2.0349398255348206e-05, 2.1789222955703735e-05, 2.3229047656059265e-05, 2.4668872356414795e-05, 2.6108697056770325e-05, 2.7548521757125854e-05, 2.8988346457481384e-05, 3.0428171157836914e-05, 3.1867995858192444e-05, 3.3307820558547974e-05, 3.4747645258903503e-05, 3.618746995925903e-05, 3.762729465961456e-05, 3.906711935997009e-05, 4.050694406032562e-05, 4.194676876068115e-05, 4.338659346103668e-05, 4.482641816139221e-05, 4.626624286174774e-05, 4.770606756210327e-05, 4.91458922624588e-05, 5.058571696281433e-05, 5.202554166316986e-05, 5.346536636352539e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 13.0, 14.0, 13.0, 27.0, 29.0, 40.0, 59.0, 87.0, 129.0, 198.0, 310.0, 499.0, 864.0, 1625.0, 3577.0, 9314.0, 35639.0, 205126.0, 663780.0, 95898.0, 19752.0, 5879.0, 2490.0, 1211.0, 749.0, 425.0, 253.0, 172.0, 101.0, 78.0, 57.0, 38.0, 20.0, 19.0, 12.0, 12.0, 9.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.14892578125, -0.1441669464111328, -0.13940811157226562, -0.13464927673339844, -0.12989044189453125, -0.12513160705566406, -0.12037277221679688, -0.11561393737792969, -0.1108551025390625, -0.10609626770019531, -0.10133743286132812, -0.09657859802246094, -0.09181976318359375, -0.08706092834472656, -0.08230209350585938, -0.07754325866699219, -0.072784423828125, -0.06802558898925781, -0.06326675415039062, -0.05850791931152344, -0.05374908447265625, -0.04899024963378906, -0.044231414794921875, -0.03947257995605469, -0.0347137451171875, -0.029954910278320312, -0.025196075439453125, -0.020437240600585938, -0.01567840576171875, -0.010919570922851562, -0.006160736083984375, -0.0014019012451171875, 0.00335693359375, 0.008115768432617188, 0.012874603271484375, 0.017633438110351562, 0.02239227294921875, 0.027151107788085938, 0.031909942626953125, 0.03666877746582031, 0.0414276123046875, 0.04618644714355469, 0.050945281982421875, 0.05570411682128906, 0.06046295166015625, 0.06522178649902344, 0.06998062133789062, 0.07473945617675781, 0.079498291015625, 0.08425712585449219, 0.08901596069335938, 0.09377479553222656, 0.09853363037109375, 0.10329246520996094, 0.10805130004882812, 0.11281013488769531, 0.1175689697265625, 0.12232780456542969, 0.12708663940429688, 0.13184547424316406, 0.13660430908203125, 0.14136314392089844, 0.14612197875976562, 0.1508808135986328, 0.1556396484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 15.0, 16.0, 20.0, 16.0, 15.0, 38.0, 31.0, 37.0, 59.0, 45.0, 64.0, 75.0, 71.0, 66.0, 69.0, 57.0, 57.0, 38.0, 42.0, 31.0, 17.0, 20.0, 15.0, 17.0, 8.0, 6.0, 8.0, 3.0, 3.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12138748168945312, -0.11728668212890625, -0.11318588256835938, -0.1090850830078125, -0.10498428344726562, -0.10088348388671875, -0.09678268432617188, -0.092681884765625, -0.08858108520507812, -0.08448028564453125, -0.08037948608398438, -0.0762786865234375, -0.07217788696289062, -0.06807708740234375, -0.06397628784179688, -0.05987548828125, -0.055774688720703125, -0.05167388916015625, -0.047573089599609375, -0.0434722900390625, -0.039371490478515625, -0.03527069091796875, -0.031169891357421875, -0.027069091796875, -0.022968292236328125, -0.01886749267578125, -0.014766693115234375, -0.0106658935546875, -0.006565093994140625, -0.00246429443359375, 0.001636505126953125, 0.0057373046875, 0.009838104248046875, 0.01393890380859375, 0.018039703369140625, 0.0221405029296875, 0.026241302490234375, 0.03034210205078125, 0.034442901611328125, 0.038543701171875, 0.042644500732421875, 0.04674530029296875, 0.050846099853515625, 0.0549468994140625, 0.059047698974609375, 0.06314849853515625, 0.06724929809570312, 0.07135009765625, 0.07545089721679688, 0.07955169677734375, 0.08365249633789062, 0.0877532958984375, 0.09185409545898438, 0.09595489501953125, 0.10005569458007812, 0.104156494140625, 0.10825729370117188, 0.11235809326171875, 0.11645889282226562, 0.1205596923828125, 0.12466049194335938, 0.12876129150390625, 0.13286209106445312, 0.136962890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 17.0, 40.0, 78.0, 124.0, 279.0, 205.0, 109.0, 64.0, 27.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.352621555328369, -3.210792303085327, -3.068963050842285, -2.927133798599243, -2.785304546356201, -2.643475294113159, -2.501646041870117, -2.359816789627075, -2.217987537384033, -2.076158285140991, -1.9343290328979492, -1.7924997806549072, -1.6506705284118652, -1.5088412761688232, -1.3670120239257812, -1.2251827716827393, -1.0833535194396973, -0.9415242671966553, -0.7996950149536133, -0.6578657627105713, -0.5160365104675293, -0.3742072582244873, -0.2323780059814453, -0.09054875373840332, 0.05128049850463867, 0.19310975074768066, 0.33493900299072266, 0.47676825523376465, 0.6185975074768066, 0.7604267597198486, 0.9022560119628906, 1.0440852642059326, 1.1859140396118164, 1.3277432918548584, 1.4695725440979004, 1.6114017963409424, 1.7532310485839844, 1.8950603008270264, 2.0368895530700684, 2.1787188053131104, 2.3205480575561523, 2.4623773097991943, 2.6042065620422363, 2.7460358142852783, 2.8878650665283203, 3.0296943187713623, 3.1715235710144043, 3.3133528232574463, 3.4551820755004883, 3.5970113277435303, 3.7388405799865723, 3.8806698322296143, 4.022499084472656, 4.164328575134277, 4.30615758895874, 4.447986602783203, 4.589816093444824, 4.731645584106445, 4.873474597930908, 5.015303611755371, 5.157133102416992, 5.298962593078613, 5.440791606903076, 5.582620620727539, 5.72445011138916]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 8.0, 1.0, 18.0, 12.0, 12.0, 21.0, 19.0, 24.0, 26.0, 22.0, 23.0, 30.0, 39.0, 38.0, 52.0, 53.0, 63.0, 50.0, 62.0, 46.0, 45.0, 32.0, 37.0, 38.0, 28.0, 23.0, 27.0, 24.0, 14.0, 22.0, 13.0, 22.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6170198917388916, -1.5671344995498657, -1.5172491073608398, -1.4673638343811035, -1.4174784421920776, -1.3675930500030518, -1.3177076578140259, -1.267822265625, -1.2179369926452637, -1.1680516004562378, -1.118166208267212, -1.0682809352874756, -1.0183955430984497, -0.9685101509094238, -0.918624758720398, -0.8687393665313721, -0.8188539743423462, -0.7689685821533203, -0.7190832495689392, -0.6691978573799133, -0.6193125247955322, -0.5694271326065063, -0.5195417404174805, -0.469656378030777, -0.4197710156440735, -0.36988565325737, -0.3200002908706665, -0.2701148986816406, -0.22022953629493713, -0.17034417390823364, -0.12045878171920776, -0.07057341933250427, -0.02068793773651123, 0.029197432100772858, 0.07908280193805695, 0.12896817922592163, 0.17885354161262512, 0.2287389039993286, 0.2786242961883545, 0.328509658575058, 0.3783950209617615, 0.42828038334846497, 0.47816574573516846, 0.5280511379241943, 0.5779365301132202, 0.6278218626976013, 0.6777072548866272, 0.7275925874710083, 0.7774779796600342, 0.8273633718490601, 0.8772487044334412, 0.927134096622467, 0.9770194292068481, 1.026904821395874, 1.0767902135849, 1.1266756057739258, 1.176560878753662, 1.226446270942688, 1.2763316631317139, 1.3262169361114502, 1.376102328300476, 1.425987720489502, 1.4758731126785278, 1.5257585048675537, 1.5756438970565796]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 7.0, 16.0, 18.0, 13.0, 43.0, 54.0, 78.0, 110.0, 178.0, 274.0, 448.0, 767.0, 1300.0, 2189.0, 3901.0, 7173.0, 13792.0, 28199.0, 61542.0, 157710.0, 478225.0, 1372458.0, 1336529.0, 457310.0, 153234.0, 60513.0, 27780.0, 13703.0, 7208.0, 3969.0, 2220.0, 1279.0, 723.0, 471.0, 285.0, 204.0, 116.0, 83.0, 47.0, 31.0, 26.0, 16.0, 19.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.08682632446289062, -0.08393096923828125, -0.08103561401367188, -0.0781402587890625, -0.07524490356445312, -0.07234954833984375, -0.06945419311523438, -0.066558837890625, -0.06366348266601562, -0.06076812744140625, -0.057872772216796875, -0.0549774169921875, -0.052082061767578125, -0.04918670654296875, -0.046291351318359375, -0.04339599609375, -0.040500640869140625, -0.03760528564453125, -0.034709930419921875, -0.0318145751953125, -0.028919219970703125, -0.02602386474609375, -0.023128509521484375, -0.020233154296875, -0.017337799072265625, -0.01444244384765625, -0.011547088623046875, -0.0086517333984375, -0.005756378173828125, -0.00286102294921875, 3.4332275390625e-05, 0.0029296875, 0.005825042724609375, 0.00872039794921875, 0.011615753173828125, 0.0145111083984375, 0.017406463623046875, 0.02030181884765625, 0.023197174072265625, 0.026092529296875, 0.028987884521484375, 0.03188323974609375, 0.034778594970703125, 0.0376739501953125, 0.040569305419921875, 0.04346466064453125, 0.046360015869140625, 0.04925537109375, 0.052150726318359375, 0.05504608154296875, 0.057941436767578125, 0.0608367919921875, 0.06373214721679688, 0.06662750244140625, 0.06952285766601562, 0.072418212890625, 0.07531356811523438, 0.07820892333984375, 0.08110427856445312, 0.0839996337890625, 0.08689498901367188, 0.08979034423828125, 0.09268569946289062, 0.0955810546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 10.0, 9.0, 14.0, 17.0, 19.0, 26.0, 30.0, 37.0, 37.0, 37.0, 41.0, 52.0, 40.0, 51.0, 40.0, 45.0, 38.0, 49.0, 48.0, 50.0, 34.0, 35.0, 35.0, 24.0, 18.0, 21.0, 16.0, 16.0, 16.0, 11.0, 5.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0731201171875, -0.07046890258789062, -0.06781768798828125, -0.06516647338867188, -0.0625152587890625, -0.059864044189453125, -0.05721282958984375, -0.054561614990234375, -0.051910400390625, -0.049259185791015625, -0.04660797119140625, -0.043956756591796875, -0.0413055419921875, -0.038654327392578125, -0.03600311279296875, -0.033351898193359375, -0.03070068359375, -0.028049468994140625, -0.02539825439453125, -0.022747039794921875, -0.0200958251953125, -0.017444610595703125, -0.01479339599609375, -0.012142181396484375, -0.009490966796875, -0.006839752197265625, -0.00418853759765625, -0.001537322998046875, 0.0011138916015625, 0.003765106201171875, 0.00641632080078125, 0.009067535400390625, 0.01171875, 0.014369964599609375, 0.01702117919921875, 0.019672393798828125, 0.0223236083984375, 0.024974822998046875, 0.02762603759765625, 0.030277252197265625, 0.032928466796875, 0.035579681396484375, 0.03823089599609375, 0.040882110595703125, 0.0435333251953125, 0.046184539794921875, 0.04883575439453125, 0.051486968994140625, 0.05413818359375, 0.056789398193359375, 0.05944061279296875, 0.062091827392578125, 0.0647430419921875, 0.06739425659179688, 0.07004547119140625, 0.07269668579101562, 0.075347900390625, 0.07799911499023438, 0.08065032958984375, 0.08330154418945312, 0.0859527587890625, 0.08860397338867188, 0.09125518798828125, 0.09390640258789062, 0.0965576171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 10.0, 21.0, 27.0, 46.0, 71.0, 109.0, 207.0, 457.0, 1202.0, 3765.0, 15801.0, 99486.0, 1393468.0, 2477906.0, 167879.0, 24936.0, 5796.0, 1823.0, 621.0, 265.0, 156.0, 90.0, 54.0, 32.0, 12.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.26617431640625, -0.2559814453125, -0.24578857421875, -0.235595703125, -0.22540283203125, -0.2152099609375, -0.20501708984375, -0.19482421875, -0.18463134765625, -0.1744384765625, -0.16424560546875, -0.154052734375, -0.14385986328125, -0.1336669921875, -0.12347412109375, -0.11328125, -0.10308837890625, -0.0928955078125, -0.08270263671875, -0.072509765625, -0.06231689453125, -0.0521240234375, -0.04193115234375, -0.03173828125, -0.02154541015625, -0.0113525390625, -0.00115966796875, 0.009033203125, 0.01922607421875, 0.0294189453125, 0.03961181640625, 0.0498046875, 0.05999755859375, 0.0701904296875, 0.08038330078125, 0.090576171875, 0.10076904296875, 0.1109619140625, 0.12115478515625, 0.13134765625, 0.14154052734375, 0.1517333984375, 0.16192626953125, 0.172119140625, 0.18231201171875, 0.1925048828125, 0.20269775390625, 0.212890625, 0.22308349609375, 0.2332763671875, 0.24346923828125, 0.253662109375, 0.26385498046875, 0.2740478515625, 0.28424072265625, 0.29443359375, 0.30462646484375, 0.3148193359375, 0.32501220703125, 0.335205078125, 0.34539794921875, 0.3555908203125, 0.36578369140625, 0.3759765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 10.0, 13.0, 3.0, 11.0, 20.0, 20.0, 23.0, 37.0, 60.0, 60.0, 109.0, 148.0, 251.0, 325.0, 421.0, 504.0, 588.0, 409.0, 294.0, 213.0, 142.0, 98.0, 79.0, 58.0, 45.0, 40.0, 22.0, 15.0, 23.0, 9.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.27581024169921875, -0.2671966552734375, -0.25858306884765625, -0.249969482421875, -0.24135589599609375, -0.2327423095703125, -0.22412872314453125, -0.21551513671875, -0.20690155029296875, -0.1982879638671875, -0.18967437744140625, -0.181060791015625, -0.17244720458984375, -0.1638336181640625, -0.15522003173828125, -0.1466064453125, -0.13799285888671875, -0.1293792724609375, -0.12076568603515625, -0.112152099609375, -0.10353851318359375, -0.0949249267578125, -0.08631134033203125, -0.07769775390625, -0.06908416748046875, -0.0604705810546875, -0.05185699462890625, -0.043243408203125, -0.03462982177734375, -0.0260162353515625, -0.01740264892578125, -0.0087890625, -0.00017547607421875, 0.0084381103515625, 0.01705169677734375, 0.025665283203125, 0.03427886962890625, 0.0428924560546875, 0.05150604248046875, 0.06011962890625, 0.06873321533203125, 0.0773468017578125, 0.08596038818359375, 0.094573974609375, 0.10318756103515625, 0.1118011474609375, 0.12041473388671875, 0.1290283203125, 0.13764190673828125, 0.1462554931640625, 0.15486907958984375, 0.163482666015625, 0.17209625244140625, 0.1807098388671875, 0.18932342529296875, 0.19793701171875, 0.20655059814453125, 0.2151641845703125, 0.22377777099609375, 0.232391357421875, 0.24100494384765625, 0.2496185302734375, 0.25823211669921875, 0.266845703125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 33.0, 119.0, 305.0, 334.0, 141.0, 37.0, 8.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.593810081481934, -4.385926246643066, -4.178042411804199, -3.970158576965332, -3.762274742126465, -3.5543909072875977, -3.3465073108673096, -3.1386234760284424, -2.930739641189575, -2.722855806350708, -2.514971971511841, -2.3070883750915527, -2.0992045402526855, -1.8913205862045288, -1.6834368705749512, -1.475553035736084, -1.2676692008972168, -1.0597853660583496, -0.8519015908241272, -0.6440178155899048, -0.4361339807510376, -0.2282501459121704, -0.020366430282592773, 0.18751740455627441, 0.3954012393951416, 0.6032850742340088, 0.8111688494682312, 1.0190526247024536, 1.2269364595413208, 1.434820294380188, 1.6427040100097656, 1.8505878448486328, 2.0584716796875, 2.266355514526367, 2.4742393493652344, 2.6821231842041016, 2.8900070190429688, 3.097890853881836, 3.305774450302124, 3.513658285140991, 3.7215421199798584, 3.9294259548187256, 4.137309551239014, 4.345193386077881, 4.553077220916748, 4.760961055755615, 4.968844890594482, 5.17672872543335, 5.384612560272217, 5.592496395111084, 5.800380229949951, 6.008264064788818, 6.2161478996276855, 6.424031734466553, 6.631915092468262, 6.839798927307129, 7.047682762145996, 7.255566596984863, 7.4634504318237305, 7.671334266662598, 7.879218101501465, 8.087101936340332, 8.2949857711792, 8.502869606018066, 8.710753440856934]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 5.0, 18.0, 11.0, 9.0, 18.0, 21.0, 27.0, 37.0, 26.0, 30.0, 50.0, 47.0, 50.0, 54.0, 58.0, 52.0, 65.0, 50.0, 44.0, 37.0, 42.0, 32.0, 37.0, 34.0, 28.0, 27.0, 18.0, 15.0, 14.0, 4.0, 9.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7327477931976318, -1.6812776327133179, -1.6298075914382935, -1.5783374309539795, -1.526867389678955, -1.4753972291946411, -1.4239270687103271, -1.3724570274353027, -1.3209868669509888, -1.2695167064666748, -1.2180466651916504, -1.1665765047073364, -1.1151063442230225, -1.063636302947998, -1.012166142463684, -0.9606960415840149, -0.9092259407043457, -0.8577558398246765, -0.8062857389450073, -0.7548155784606934, -0.7033454775810242, -0.651875376701355, -0.600405216217041, -0.5489351153373718, -0.49746501445770264, -0.44599491357803345, -0.39452478289604187, -0.3430546522140503, -0.2915845513343811, -0.24011445045471191, -0.18864431977272034, -0.13717418909072876, -0.08570408821105957, -0.03423397243022919, 0.017236143350601196, 0.06870625913143158, 0.12017637491226196, 0.17164647579193115, 0.22311660647392273, 0.2745867371559143, 0.3260568380355835, 0.3775269389152527, 0.42899706959724426, 0.48046720027923584, 0.531937301158905, 0.5834074020385742, 0.6348775625228882, 0.6863476634025574, 0.7378177642822266, 0.7892878651618958, 0.8407579660415649, 0.8922281265258789, 0.9436982274055481, 0.9951683282852173, 1.0466384887695312, 1.0981085300445557, 1.1495786905288696, 1.2010488510131836, 1.252518892288208, 1.303989052772522, 1.355459213256836, 1.4069292545318604, 1.4583994150161743, 1.5098695755004883, 1.5613396167755127]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 6.0, 15.0, 19.0, 24.0, 37.0, 58.0, 72.0, 132.0, 197.0, 304.0, 417.0, 660.0, 1026.0, 1609.0, 2544.0, 4038.0, 6968.0, 12157.0, 22698.0, 47008.0, 116031.0, 306390.0, 308740.0, 116705.0, 47094.0, 23078.0, 12225.0, 7058.0, 4092.0, 2550.0, 1583.0, 1022.0, 680.0, 428.0, 295.0, 199.0, 123.0, 97.0, 59.0, 37.0, 31.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.16788673400878906, -0.16279983520507812, -0.1577129364013672, -0.15262603759765625, -0.1475391387939453, -0.14245223999023438, -0.13736534118652344, -0.1322784423828125, -0.12719154357910156, -0.12210464477539062, -0.11701774597167969, -0.11193084716796875, -0.10684394836425781, -0.10175704956054688, -0.09667015075683594, -0.091583251953125, -0.08649635314941406, -0.08140945434570312, -0.07632255554199219, -0.07123565673828125, -0.06614875793457031, -0.061061859130859375, -0.05597496032714844, -0.0508880615234375, -0.04580116271972656, -0.040714263916015625, -0.03562736511230469, -0.03054046630859375, -0.025453567504882812, -0.020366668701171875, -0.015279769897460938, -0.01019287109375, -0.0051059722900390625, -1.9073486328125e-05, 0.0050678253173828125, 0.01015472412109375, 0.015241622924804688, 0.020328521728515625, 0.025415420532226562, 0.0305023193359375, 0.03558921813964844, 0.040676116943359375, 0.04576301574707031, 0.05084991455078125, 0.05593681335449219, 0.061023712158203125, 0.06611061096191406, 0.071197509765625, 0.07628440856933594, 0.08137130737304688, 0.08645820617675781, 0.09154510498046875, 0.09663200378417969, 0.10171890258789062, 0.10680580139160156, 0.1118927001953125, 0.11697959899902344, 0.12206649780273438, 0.1271533966064453, 0.13224029541015625, 0.1373271942138672, 0.14241409301757812, 0.14750099182128906, 0.152587890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 11.0, 9.0, 12.0, 11.0, 30.0, 16.0, 22.0, 21.0, 31.0, 36.0, 35.0, 37.0, 35.0, 49.0, 46.0, 56.0, 39.0, 37.0, 50.0, 45.0, 41.0, 39.0, 40.0, 28.0, 39.0, 18.0, 19.0, 18.0, 20.0, 14.0, 16.0, 19.0, 8.0, 9.0, 14.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.09566974639892578, -0.09282875061035156, -0.08998775482177734, -0.08714675903320312, -0.0843057632446289, -0.08146476745605469, -0.07862377166748047, -0.07578277587890625, -0.07294178009033203, -0.07010078430175781, -0.0672597885131836, -0.06441879272460938, -0.061577796936035156, -0.05873680114746094, -0.05589580535888672, -0.0530548095703125, -0.05021381378173828, -0.04737281799316406, -0.044531822204589844, -0.041690826416015625, -0.038849830627441406, -0.03600883483886719, -0.03316783905029297, -0.03032684326171875, -0.02748584747314453, -0.024644851684570312, -0.021803855895996094, -0.018962860107421875, -0.016121864318847656, -0.013280868530273438, -0.010439872741699219, -0.007598876953125, -0.004757881164550781, -0.0019168853759765625, 0.0009241104125976562, 0.003765106201171875, 0.006606101989746094, 0.009447097778320312, 0.012288093566894531, 0.01512908935546875, 0.01797008514404297, 0.020811080932617188, 0.023652076721191406, 0.026493072509765625, 0.029334068298339844, 0.03217506408691406, 0.03501605987548828, 0.0378570556640625, 0.04069805145263672, 0.04353904724121094, 0.046380043029785156, 0.049221038818359375, 0.052062034606933594, 0.05490303039550781, 0.05774402618408203, 0.06058502197265625, 0.06342601776123047, 0.06626701354980469, 0.0691080093383789, 0.07194900512695312, 0.07479000091552734, 0.07763099670410156, 0.08047199249267578, 0.08331298828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 15.0, 25.0, 29.0, 30.0, 50.0, 66.0, 99.0, 138.0, 200.0, 375.0, 582.0, 1079.0, 2474.0, 7259.0, 28125.0, 225900.0, 707806.0, 55352.0, 11777.0, 3585.0, 1484.0, 746.0, 428.0, 258.0, 188.0, 112.0, 76.0, 69.0, 56.0, 34.0, 38.0, 22.0, 4.0, 17.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4618377685546875, -0.448333740234375, -0.4348297119140625, -0.42132568359375, -0.4078216552734375, -0.394317626953125, -0.3808135986328125, -0.3673095703125, -0.3538055419921875, -0.340301513671875, -0.3267974853515625, -0.31329345703125, -0.2997894287109375, -0.286285400390625, -0.2727813720703125, -0.25927734375, -0.2457733154296875, -0.232269287109375, -0.2187652587890625, -0.20526123046875, -0.1917572021484375, -0.178253173828125, -0.1647491455078125, -0.1512451171875, -0.1377410888671875, -0.124237060546875, -0.1107330322265625, -0.09722900390625, -0.0837249755859375, -0.070220947265625, -0.0567169189453125, -0.043212890625, -0.0297088623046875, -0.016204833984375, -0.0027008056640625, 0.01080322265625, 0.0243072509765625, 0.037811279296875, 0.0513153076171875, 0.0648193359375, 0.0783233642578125, 0.091827392578125, 0.1053314208984375, 0.11883544921875, 0.1323394775390625, 0.145843505859375, 0.1593475341796875, 0.1728515625, 0.1863555908203125, 0.199859619140625, 0.2133636474609375, 0.22686767578125, 0.2403717041015625, 0.253875732421875, 0.2673797607421875, 0.2808837890625, 0.2943878173828125, 0.307891845703125, 0.3213958740234375, 0.33489990234375, 0.3484039306640625, 0.361907958984375, 0.3754119873046875, 0.388916015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 3.0, 9.0, 7.0, 8.0, 22.0, 18.0, 30.0, 22.0, 33.0, 29.0, 38.0, 54.0, 40.0, 52.0, 44.0, 59.0, 55.0, 45.0, 59.0, 44.0, 45.0, 40.0, 39.0, 33.0, 21.0, 24.0, 22.0, 18.0, 17.0, 18.0, 7.0, 4.0, 5.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5087890625, -0.49488067626953125, -0.4809722900390625, -0.46706390380859375, -0.453155517578125, -0.43924713134765625, -0.4253387451171875, -0.41143035888671875, -0.39752197265625, -0.38361358642578125, -0.3697052001953125, -0.35579681396484375, -0.341888427734375, -0.32798004150390625, -0.3140716552734375, -0.30016326904296875, -0.2862548828125, -0.27234649658203125, -0.2584381103515625, -0.24452972412109375, -0.230621337890625, -0.21671295166015625, -0.2028045654296875, -0.18889617919921875, -0.17498779296875, -0.16107940673828125, -0.1471710205078125, -0.13326263427734375, -0.119354248046875, -0.10544586181640625, -0.0915374755859375, -0.07762908935546875, -0.063720703125, -0.04981231689453125, -0.0359039306640625, -0.02199554443359375, -0.008087158203125, 0.00582122802734375, 0.0197296142578125, 0.03363800048828125, 0.04754638671875, 0.06145477294921875, 0.0753631591796875, 0.08927154541015625, 0.103179931640625, 0.11708831787109375, 0.1309967041015625, 0.14490509033203125, 0.1588134765625, 0.17272186279296875, 0.1866302490234375, 0.20053863525390625, 0.214447021484375, 0.22835540771484375, 0.2422637939453125, 0.25617218017578125, 0.27008056640625, 0.28398895263671875, 0.2978973388671875, 0.31180572509765625, 0.325714111328125, 0.33962249755859375, 0.3535308837890625, 0.36743927001953125, 0.38134765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 12.0, 13.0, 19.0, 20.0, 45.0, 72.0, 145.0, 261.0, 502.0, 1068.0, 2956.0, 9259.0, 39906.0, 248455.0, 646810.0, 76062.0, 15581.0, 4404.0, 1571.0, 691.0, 304.0, 162.0, 96.0, 47.0, 39.0, 14.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17308998107910156, -0.16771316528320312, -0.1623363494873047, -0.15695953369140625, -0.1515827178955078, -0.14620590209960938, -0.14082908630371094, -0.1354522705078125, -0.13007545471191406, -0.12469863891601562, -0.11932182312011719, -0.11394500732421875, -0.10856819152832031, -0.10319137573242188, -0.09781455993652344, -0.092437744140625, -0.08706092834472656, -0.08168411254882812, -0.07630729675292969, -0.07093048095703125, -0.06555366516113281, -0.060176849365234375, -0.05480003356933594, -0.0494232177734375, -0.04404640197753906, -0.038669586181640625, -0.03329277038574219, -0.02791595458984375, -0.022539138793945312, -0.017162322998046875, -0.011785507202148438, -0.00640869140625, -0.0010318756103515625, 0.004344940185546875, 0.009721755981445312, 0.01509857177734375, 0.020475387573242188, 0.025852203369140625, 0.031229019165039062, 0.0366058349609375, 0.04198265075683594, 0.047359466552734375, 0.05273628234863281, 0.05811309814453125, 0.06348991394042969, 0.06886672973632812, 0.07424354553222656, 0.079620361328125, 0.08499717712402344, 0.09037399291992188, 0.09575080871582031, 0.10112762451171875, 0.10650444030761719, 0.11188125610351562, 0.11725807189941406, 0.1226348876953125, 0.12801170349121094, 0.13338851928710938, 0.1387653350830078, 0.14414215087890625, 0.1495189666748047, 0.15489578247070312, 0.16027259826660156, 0.1656494140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 7.0, 13.0, 22.0, 24.0, 30.0, 45.0, 88.0, 125.0, 157.0, 141.0, 111.0, 74.0, 58.0, 26.0, 26.0, 15.0, 12.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.934573709964752e-05, -5.66430389881134e-05, -5.3940340876579285e-05, -5.1237642765045166e-05, -4.853494465351105e-05, -4.583224654197693e-05, -4.312954843044281e-05, -4.042685031890869e-05, -3.772415220737457e-05, -3.5021454095840454e-05, -3.2318755984306335e-05, -2.9616057872772217e-05, -2.6913359761238098e-05, -2.421066164970398e-05, -2.150796353816986e-05, -1.8805265426635742e-05, -1.6102567315101624e-05, -1.3399869203567505e-05, -1.0697171092033386e-05, -7.994472980499268e-06, -5.291774868965149e-06, -2.5890767574310303e-06, 1.1362135410308838e-07, 2.816319465637207e-06, 5.519017577171326e-06, 8.221715688705444e-06, 1.0924413800239563e-05, 1.3627111911773682e-05, 1.63298100233078e-05, 1.903250813484192e-05, 2.1735206246376038e-05, 2.4437904357910156e-05, 2.7140602469444275e-05, 2.9843300580978394e-05, 3.254599869251251e-05, 3.524869680404663e-05, 3.795139491558075e-05, 4.065409302711487e-05, 4.335679113864899e-05, 4.6059489250183105e-05, 4.8762187361717224e-05, 5.146488547325134e-05, 5.416758358478546e-05, 5.687028169631958e-05, 5.95729798078537e-05, 6.227567791938782e-05, 6.497837603092194e-05, 6.768107414245605e-05, 7.038377225399017e-05, 7.308647036552429e-05, 7.578916847705841e-05, 7.849186658859253e-05, 8.119456470012665e-05, 8.389726281166077e-05, 8.659996092319489e-05, 8.9302659034729e-05, 9.200535714626312e-05, 9.470805525779724e-05, 9.741075336933136e-05, 0.00010011345148086548, 0.0001028161495923996, 0.00010551884770393372, 0.00010822154581546783, 0.00011092424392700195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 9.0, 11.0, 29.0, 37.0, 47.0, 93.0, 168.0, 369.0, 817.0, 1988.0, 7156.0, 50365.0, 723657.0, 235686.0, 21466.0, 4035.0, 1367.0, 615.0, 268.0, 164.0, 77.0, 44.0, 36.0, 13.0, 12.0, 2.0, 10.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15541648864746094, -0.14860153198242188, -0.1417865753173828, -0.13497161865234375, -0.1281566619873047, -0.12134170532226562, -0.11452674865722656, -0.1077117919921875, -0.10089683532714844, -0.09408187866210938, -0.08726692199707031, -0.08045196533203125, -0.07363700866699219, -0.06682205200195312, -0.06000709533691406, -0.053192138671875, -0.04637718200683594, -0.039562225341796875, -0.03274726867675781, -0.02593231201171875, -0.019117355346679688, -0.012302398681640625, -0.0054874420166015625, 0.0013275146484375, 0.008142471313476562, 0.014957427978515625, 0.021772384643554688, 0.02858734130859375, 0.03540229797363281, 0.042217254638671875, 0.04903221130371094, 0.05584716796875, 0.06266212463378906, 0.06947708129882812, 0.07629203796386719, 0.08310699462890625, 0.08992195129394531, 0.09673690795898438, 0.10355186462402344, 0.1103668212890625, 0.11718177795410156, 0.12399673461914062, 0.1308116912841797, 0.13762664794921875, 0.1444416046142578, 0.15125656127929688, 0.15807151794433594, 0.164886474609375, 0.17170143127441406, 0.17851638793945312, 0.1853313446044922, 0.19214630126953125, 0.1989612579345703, 0.20577621459960938, 0.21259117126464844, 0.2194061279296875, 0.22622108459472656, 0.23303604125976562, 0.2398509979248047, 0.24666595458984375, 0.2534809112548828, 0.2602958679199219, 0.26711082458496094, 0.27392578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 16.0, 8.0, 16.0, 18.0, 36.0, 43.0, 44.0, 47.0, 77.0, 85.0, 101.0, 101.0, 76.0, 70.0, 48.0, 41.0, 38.0, 28.0, 20.0, 21.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15641403198242188, -0.15181732177734375, -0.14722061157226562, -0.1426239013671875, -0.13802719116210938, -0.13343048095703125, -0.12883377075195312, -0.124237060546875, -0.11964035034179688, -0.11504364013671875, -0.11044692993164062, -0.1058502197265625, -0.10125350952148438, -0.09665679931640625, -0.09206008911132812, -0.08746337890625, -0.08286666870117188, -0.07826995849609375, -0.07367324829101562, -0.0690765380859375, -0.06447982788085938, -0.05988311767578125, -0.055286407470703125, -0.050689697265625, -0.046092987060546875, -0.04149627685546875, -0.036899566650390625, -0.0323028564453125, -0.027706146240234375, -0.02310943603515625, -0.018512725830078125, -0.013916015625, -0.009319305419921875, -0.00472259521484375, -0.000125885009765625, 0.0044708251953125, 0.009067535400390625, 0.01366424560546875, 0.018260955810546875, 0.022857666015625, 0.027454376220703125, 0.03205108642578125, 0.036647796630859375, 0.0412445068359375, 0.045841217041015625, 0.05043792724609375, 0.055034637451171875, 0.05963134765625, 0.06422805786132812, 0.06882476806640625, 0.07342147827148438, 0.0780181884765625, 0.08261489868164062, 0.08721160888671875, 0.09180831909179688, 0.096405029296875, 0.10100173950195312, 0.10559844970703125, 0.11019515991210938, 0.1147918701171875, 0.11938858032226562, 0.12398529052734375, 0.12858200073242188, 0.1331787109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 15.0, 38.0, 45.0, 63.0, 96.0, 157.0, 211.0, 123.0, 81.0, 58.0, 34.0, 17.0, 8.0, 11.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716684103012085, -2.6395390033721924, -2.5623936653137207, -2.485248565673828, -2.4081032276153564, -2.330958127975464, -2.253812789916992, -2.1766676902770996, -2.099522590637207, -2.0223774909973145, -1.9452321529388428, -1.8680869340896606, -1.7909417152404785, -1.713796615600586, -1.6366513967514038, -1.5595061779022217, -1.48236083984375, -1.4052156209945679, -1.3280704021453857, -1.2509251832962036, -1.1737799644470215, -1.096634864807129, -1.0194896459579468, -0.9423444271087646, -0.8651992082595825, -0.7880539894104004, -0.7109087705612183, -0.6337636113166809, -0.5566183924674988, -0.47947317361831665, -0.4023279845714569, -0.32518279552459717, -0.24803781509399414, -0.1708926111459732, -0.09374740719795227, -0.016602203249931335, 0.0605430006980896, 0.13768821954727173, 0.21483340859413147, 0.2919785976409912, 0.36912381649017334, 0.44626903533935547, 0.5234142541885376, 0.600559413433075, 0.6777046322822571, 0.7548498511314392, 0.8319950103759766, 0.9091402292251587, 0.9862854480743408, 1.063430666923523, 1.140575885772705, 1.2177211046218872, 1.2948663234710693, 1.372011423110962, 1.449156641960144, 1.5263018608093262, 1.6034470796585083, 1.6805922985076904, 1.7577375173568726, 1.8348827362060547, 1.9120278358459473, 1.989173173904419, 2.0663182735443115, 2.143463611602783, 2.220608711242676]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 8.0, 11.0, 17.0, 13.0, 2.0, 15.0, 13.0, 26.0, 17.0, 26.0, 32.0, 29.0, 32.0, 35.0, 36.0, 42.0, 54.0, 72.0, 53.0, 51.0, 44.0, 40.0, 37.0, 32.0, 21.0, 21.0, 28.0, 23.0, 18.0, 20.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2956559658050537, -1.248177170753479, -1.2006983757019043, -1.1532195806503296, -1.1057407855987549, -1.0582619905471802, -1.0107831954956055, -0.963304340839386, -0.9158255457878113, -0.8683467507362366, -0.8208679556846619, -0.7733891010284424, -0.7259103059768677, -0.678431510925293, -0.6309527158737183, -0.5834739208221436, -0.5359951257705688, -0.48851633071899414, -0.44103753566741943, -0.39355871081352234, -0.34607991576194763, -0.2986011207103729, -0.25112229585647583, -0.20364350080490112, -0.15616470575332642, -0.10868590325117111, -0.06120710074901581, -0.013728290796279907, 0.0337505042552948, 0.0812292993068695, 0.1287081241607666, 0.1761869192123413, 0.22366571426391602, 0.2711445093154907, 0.31862330436706543, 0.3661021292209625, 0.41358092427253723, 0.46105971932411194, 0.508538544178009, 0.5560173392295837, 0.6034961342811584, 0.6509749293327332, 0.6984537243843079, 0.7459325790405273, 0.793411374092102, 0.8408901691436768, 0.8883689641952515, 0.9358477592468262, 0.9833265542984009, 1.0308053493499756, 1.0782841444015503, 1.125762939453125, 1.1732417345046997, 1.2207205295562744, 1.2681994438171387, 1.3156781196594238, 1.363157033920288, 1.4106358289718628, 1.4581146240234375, 1.5055934190750122, 1.553072214126587, 1.6005510091781616, 1.6480298042297363, 1.6955087184906006, 1.7429873943328857]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 26.0, 33.0, 51.0, 81.0, 167.0, 298.0, 516.0, 1131.0, 2391.0, 5129.0, 11971.0, 32381.0, 113191.0, 602930.0, 2389046.0, 826910.0, 142349.0, 39660.0, 14466.0, 6090.0, 2794.0, 1267.0, 645.0, 324.0, 194.0, 93.0, 59.0, 29.0, 20.0, 14.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115478515625, -0.11113548278808594, -0.10679244995117188, -0.10244941711425781, -0.09810638427734375, -0.09376335144042969, -0.08942031860351562, -0.08507728576660156, -0.0807342529296875, -0.07639122009277344, -0.07204818725585938, -0.06770515441894531, -0.06336212158203125, -0.05901908874511719, -0.054676055908203125, -0.05033302307128906, -0.045989990234375, -0.04164695739746094, -0.037303924560546875, -0.03296089172363281, -0.02861785888671875, -0.024274826049804688, -0.019931793212890625, -0.015588760375976562, -0.0112457275390625, -0.0069026947021484375, -0.002559661865234375, 0.0017833709716796875, 0.00612640380859375, 0.010469436645507812, 0.014812469482421875, 0.019155502319335938, 0.02349853515625, 0.027841567993164062, 0.032184600830078125, 0.03652763366699219, 0.04087066650390625, 0.04521369934082031, 0.049556732177734375, 0.05389976501464844, 0.0582427978515625, 0.06258583068847656, 0.06692886352539062, 0.07127189636230469, 0.07561492919921875, 0.07995796203613281, 0.08430099487304688, 0.08864402770996094, 0.092987060546875, 0.09733009338378906, 0.10167312622070312, 0.10601615905761719, 0.11035919189453125, 0.11470222473144531, 0.11904525756835938, 0.12338829040527344, 0.1277313232421875, 0.13207435607910156, 0.13641738891601562, 0.1407604217529297, 0.14510345458984375, 0.1494464874267578, 0.15378952026367188, 0.15813255310058594, 0.1624755859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 8.0, 12.0, 10.0, 12.0, 25.0, 25.0, 22.0, 18.0, 36.0, 18.0, 23.0, 43.0, 37.0, 41.0, 51.0, 44.0, 33.0, 47.0, 32.0, 49.0, 43.0, 37.0, 43.0, 30.0, 37.0, 31.0, 31.0, 24.0, 26.0, 15.0, 16.0, 10.0, 15.0, 10.0, 12.0, 5.0, 4.0, 12.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09185791015625, -0.08912944793701172, -0.08640098571777344, -0.08367252349853516, -0.08094406127929688, -0.0782155990600586, -0.07548713684082031, -0.07275867462158203, -0.07003021240234375, -0.06730175018310547, -0.06457328796386719, -0.061844825744628906, -0.059116363525390625, -0.056387901306152344, -0.05365943908691406, -0.05093097686767578, -0.0482025146484375, -0.04547405242919922, -0.04274559020996094, -0.040017127990722656, -0.037288665771484375, -0.034560203552246094, -0.03183174133300781, -0.02910327911376953, -0.02637481689453125, -0.02364635467529297, -0.020917892456054688, -0.018189430236816406, -0.015460968017578125, -0.012732505798339844, -0.010004043579101562, -0.007275581359863281, -0.004547119140625, -0.0018186569213867188, 0.0009098052978515625, 0.0036382675170898438, 0.006366729736328125, 0.009095191955566406, 0.011823654174804688, 0.014552116394042969, 0.01728057861328125, 0.02000904083251953, 0.022737503051757812, 0.025465965270996094, 0.028194427490234375, 0.030922889709472656, 0.03365135192871094, 0.03637981414794922, 0.0391082763671875, 0.04183673858642578, 0.04456520080566406, 0.047293663024902344, 0.050022125244140625, 0.052750587463378906, 0.05547904968261719, 0.05820751190185547, 0.06093597412109375, 0.06366443634033203, 0.06639289855957031, 0.0691213607788086, 0.07184982299804688, 0.07457828521728516, 0.07730674743652344, 0.08003520965576172, 0.082763671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 15.0, 18.0, 30.0, 25.0, 48.0, 76.0, 146.0, 289.0, 649.0, 1697.0, 6374.0, 29110.0, 235719.0, 3274532.0, 581802.0, 50274.0, 9452.0, 2420.0, 780.0, 323.0, 169.0, 107.0, 67.0, 39.0, 26.0, 13.0, 25.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3093910217285156, -0.29895782470703125, -0.2885246276855469, -0.2780914306640625, -0.2676582336425781, -0.25722503662109375, -0.24679183959960938, -0.236358642578125, -0.22592544555664062, -0.21549224853515625, -0.20505905151367188, -0.1946258544921875, -0.18419265747070312, -0.17375946044921875, -0.16332626342773438, -0.15289306640625, -0.14245986938476562, -0.13202667236328125, -0.12159347534179688, -0.1111602783203125, -0.10072708129882812, -0.09029388427734375, -0.07986068725585938, -0.069427490234375, -0.058994293212890625, -0.04856109619140625, -0.038127899169921875, -0.0276947021484375, -0.017261505126953125, -0.00682830810546875, 0.003604888916015625, 0.0140380859375, 0.024471282958984375, 0.03490447998046875, 0.045337677001953125, 0.0557708740234375, 0.06620407104492188, 0.07663726806640625, 0.08707046508789062, 0.097503662109375, 0.10793685913085938, 0.11837005615234375, 0.12880325317382812, 0.1392364501953125, 0.14966964721679688, 0.16010284423828125, 0.17053604125976562, 0.18096923828125, 0.19140243530273438, 0.20183563232421875, 0.21226882934570312, 0.2227020263671875, 0.23313522338867188, 0.24356842041015625, 0.2540016174316406, 0.264434814453125, 0.2748680114746094, 0.28530120849609375, 0.2957344055175781, 0.3061676025390625, 0.3166007995605469, 0.32703399658203125, 0.3374671936035156, 0.347900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 4.0, 6.0, 10.0, 10.0, 9.0, 12.0, 16.0, 17.0, 30.0, 39.0, 48.0, 64.0, 94.0, 108.0, 138.0, 209.0, 265.0, 387.0, 471.0, 447.0, 426.0, 318.0, 233.0, 173.0, 130.0, 95.0, 59.0, 49.0, 35.0, 31.0, 32.0, 19.0, 10.0, 14.0, 13.0, 16.0, 2.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.208740234375, -0.20246315002441406, -0.19618606567382812, -0.1899089813232422, -0.18363189697265625, -0.1773548126220703, -0.17107772827148438, -0.16480064392089844, -0.1585235595703125, -0.15224647521972656, -0.14596939086914062, -0.1396923065185547, -0.13341522216796875, -0.1271381378173828, -0.12086105346679688, -0.11458396911621094, -0.108306884765625, -0.10202980041503906, -0.09575271606445312, -0.08947563171386719, -0.08319854736328125, -0.07692146301269531, -0.07064437866210938, -0.06436729431152344, -0.0580902099609375, -0.05181312561035156, -0.045536041259765625, -0.03925895690917969, -0.03298187255859375, -0.026704788208007812, -0.020427703857421875, -0.014150619506835938, -0.00787353515625, -0.0015964508056640625, 0.004680633544921875, 0.010957717895507812, 0.01723480224609375, 0.023511886596679688, 0.029788970947265625, 0.03606605529785156, 0.0423431396484375, 0.04862022399902344, 0.054897308349609375, 0.06117439270019531, 0.06745147705078125, 0.07372856140136719, 0.08000564575195312, 0.08628273010253906, 0.092559814453125, 0.09883689880371094, 0.10511398315429688, 0.11139106750488281, 0.11766815185546875, 0.12394523620605469, 0.13022232055664062, 0.13649940490722656, 0.1427764892578125, 0.14905357360839844, 0.15533065795898438, 0.1616077423095703, 0.16788482666015625, 0.1741619110107422, 0.18043899536132812, 0.18671607971191406, 0.1929931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 21.0, 50.0, 128.0, 189.0, 222.0, 190.0, 98.0, 33.0, 30.0, 10.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.001578330993652, -3.8913233280181885, -3.7810683250427246, -3.67081356048584, -3.560558557510376, -3.450303554534912, -3.3400485515594482, -3.2297935485839844, -3.1195385456085205, -3.0092835426330566, -2.8990285396575928, -2.788773536682129, -2.678518772125244, -2.5682637691497803, -2.4580087661743164, -2.3477537631988525, -2.2374987602233887, -2.127243757247925, -2.016988754272461, -1.9067338705062866, -1.7964788675308228, -1.6862239837646484, -1.5759689807891846, -1.4657139778137207, -1.355459213256836, -1.245204210281372, -1.1349493265151978, -1.0246943235397339, -0.91443932056427, -0.8041843771934509, -0.6939294338226318, -0.583674430847168, -0.4734194278717041, -0.3631644546985626, -0.25290948152542114, -0.14265453815460205, -0.03239956498146057, 0.07785540819168091, 0.1881103515625, 0.29836535453796387, 0.40862029790878296, 0.518875241279602, 0.6291302442550659, 0.739385187625885, 0.8496401309967041, 0.959895133972168, 1.0701501369476318, 1.1804051399230957, 1.29066002368927, 1.4009150266647339, 1.5111699104309082, 1.621424913406372, 1.731679916381836, 1.8419349193572998, 1.9521898031234741, 2.0624446868896484, 2.1726996898651123, 2.282954692840576, 2.39320969581604, 2.503464698791504, 2.6137194633483887, 2.7239744663238525, 2.8342294692993164, 2.9444844722747803, 3.054739475250244]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 3.0, 6.0, 21.0, 9.0, 13.0, 15.0, 10.0, 15.0, 27.0, 17.0, 27.0, 17.0, 30.0, 26.0, 24.0, 32.0, 40.0, 49.0, 50.0, 41.0, 48.0, 34.0, 28.0, 25.0, 43.0, 27.0, 36.0, 30.0, 27.0, 19.0, 20.0, 27.0, 25.0, 19.0, 19.0, 19.0, 12.0, 4.0, 8.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.9727334380149841, -0.9419143795967102, -0.911095380783081, -0.8802763223648071, -0.8494572639465332, -0.8186382055282593, -0.7878191471099854, -0.7570001482963562, -0.7261810898780823, -0.6953620314598083, -0.6645430326461792, -0.6337239742279053, -0.6029049158096313, -0.5720858573913574, -0.5412667989730835, -0.5104478001594543, -0.4796287417411804, -0.4488096833229065, -0.41799065470695496, -0.3871716260910034, -0.3563525676727295, -0.32553350925445557, -0.29471448063850403, -0.2638954520225525, -0.23307639360427856, -0.20225735008716583, -0.1714383065700531, -0.14061926305294037, -0.10980021953582764, -0.0789811760187149, -0.04816213250160217, -0.01734308898448944, 0.013475894927978516, 0.04429493844509125, 0.07511398196220398, 0.10593302547931671, 0.13675206899642944, 0.16757111251354218, 0.1983901560306549, 0.22920919954776764, 0.26002824306488037, 0.2908473014831543, 0.32166633009910583, 0.3524853587150574, 0.3833044171333313, 0.4141234755516052, 0.44494250416755676, 0.4757615327835083, 0.5065805912017822, 0.5373996496200562, 0.5682187080383301, 0.5990377068519592, 0.6298567652702332, 0.6606758236885071, 0.6914948225021362, 0.7223138809204102, 0.7531329393386841, 0.783951997756958, 0.8147710561752319, 0.8455900549888611, 0.876409113407135, 0.9072281718254089, 0.9380471706390381, 0.968866229057312, 0.9996852874755859]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 18.0, 19.0, 28.0, 49.0, 67.0, 80.0, 113.0, 154.0, 240.0, 386.0, 500.0, 780.0, 1275.0, 2041.0, 3319.0, 5835.0, 11634.0, 27507.0, 75728.0, 208970.0, 356553.0, 218206.0, 78832.0, 28612.0, 12245.0, 5960.0, 3436.0, 1982.0, 1324.0, 846.0, 562.0, 376.0, 284.0, 188.0, 112.0, 69.0, 56.0, 38.0, 37.0, 33.0, 10.0, 9.0, 2.0, 7.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.1357421875, -0.13169288635253906, -0.12764358520507812, -0.12359428405761719, -0.11954498291015625, -0.11549568176269531, -0.11144638061523438, -0.10739707946777344, -0.1033477783203125, -0.09929847717285156, -0.09524917602539062, -0.09119987487792969, -0.08715057373046875, -0.08310127258300781, -0.07905197143554688, -0.07500267028808594, -0.070953369140625, -0.06690406799316406, -0.06285476684570312, -0.05880546569824219, -0.05475616455078125, -0.05070686340332031, -0.046657562255859375, -0.04260826110839844, -0.0385589599609375, -0.03450965881347656, -0.030460357666015625, -0.026411056518554688, -0.02236175537109375, -0.018312454223632812, -0.014263153076171875, -0.010213851928710938, -0.00616455078125, -0.0021152496337890625, 0.001934051513671875, 0.0059833526611328125, 0.01003265380859375, 0.014081954956054688, 0.018131256103515625, 0.022180557250976562, 0.0262298583984375, 0.030279159545898438, 0.034328460693359375, 0.03837776184082031, 0.04242706298828125, 0.04647636413574219, 0.050525665283203125, 0.05457496643066406, 0.058624267578125, 0.06267356872558594, 0.06672286987304688, 0.07077217102050781, 0.07482147216796875, 0.07887077331542969, 0.08292007446289062, 0.08696937561035156, 0.0910186767578125, 0.09506797790527344, 0.09911727905273438, 0.10316658020019531, 0.10721588134765625, 0.11126518249511719, 0.11531448364257812, 0.11936378479003906, 0.1234130859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 3.0, 8.0, 7.0, 8.0, 12.0, 26.0, 20.0, 30.0, 29.0, 29.0, 35.0, 50.0, 46.0, 52.0, 49.0, 61.0, 43.0, 44.0, 42.0, 58.0, 42.0, 36.0, 37.0, 35.0, 34.0, 30.0, 20.0, 15.0, 24.0, 13.0, 14.0, 9.0, 10.0, 9.0, 2.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11265277862548828, -0.10921669006347656, -0.10578060150146484, -0.10234451293945312, -0.0989084243774414, -0.09547233581542969, -0.09203624725341797, -0.08860015869140625, -0.08516407012939453, -0.08172798156738281, -0.0782918930053711, -0.07485580444335938, -0.07141971588134766, -0.06798362731933594, -0.06454753875732422, -0.0611114501953125, -0.05767536163330078, -0.05423927307128906, -0.050803184509277344, -0.047367095947265625, -0.043931007385253906, -0.04049491882324219, -0.03705883026123047, -0.03362274169921875, -0.03018665313720703, -0.026750564575195312, -0.023314476013183594, -0.019878387451171875, -0.016442298889160156, -0.013006210327148438, -0.009570121765136719, -0.006134033203125, -0.0026979446411132812, 0.0007381439208984375, 0.004174232482910156, 0.007610321044921875, 0.011046409606933594, 0.014482498168945312, 0.01791858673095703, 0.02135467529296875, 0.02479076385498047, 0.028226852416992188, 0.031662940979003906, 0.035099029541015625, 0.038535118103027344, 0.04197120666503906, 0.04540729522705078, 0.0488433837890625, 0.05227947235107422, 0.05571556091308594, 0.059151649475097656, 0.06258773803710938, 0.0660238265991211, 0.06945991516113281, 0.07289600372314453, 0.07633209228515625, 0.07976818084716797, 0.08320426940917969, 0.0866403579711914, 0.09007644653320312, 0.09351253509521484, 0.09694862365722656, 0.10038471221923828, 0.10382080078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 10.0, 12.0, 9.0, 15.0, 27.0, 33.0, 53.0, 84.0, 132.0, 264.0, 495.0, 1064.0, 2671.0, 8138.0, 47748.0, 664711.0, 287364.0, 26294.0, 5546.0, 2041.0, 835.0, 380.0, 217.0, 124.0, 74.0, 58.0, 38.0, 24.0, 16.0, 13.0, 13.0, 8.0, 10.0, 5.0, 6.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.336669921875, -0.32642364501953125, -0.3161773681640625, -0.30593109130859375, -0.295684814453125, -0.28543853759765625, -0.2751922607421875, -0.26494598388671875, -0.25469970703125, -0.24445343017578125, -0.2342071533203125, -0.22396087646484375, -0.213714599609375, -0.20346832275390625, -0.1932220458984375, -0.18297576904296875, -0.1727294921875, -0.16248321533203125, -0.1522369384765625, -0.14199066162109375, -0.131744384765625, -0.12149810791015625, -0.1112518310546875, -0.10100555419921875, -0.09075927734375, -0.08051300048828125, -0.0702667236328125, -0.06002044677734375, -0.049774169921875, -0.03952789306640625, -0.0292816162109375, -0.01903533935546875, -0.0087890625, 0.00145721435546875, 0.0117034912109375, 0.02194976806640625, 0.032196044921875, 0.04244232177734375, 0.0526885986328125, 0.06293487548828125, 0.07318115234375, 0.08342742919921875, 0.0936737060546875, 0.10391998291015625, 0.114166259765625, 0.12441253662109375, 0.1346588134765625, 0.14490509033203125, 0.1551513671875, 0.16539764404296875, 0.1756439208984375, 0.18589019775390625, 0.196136474609375, 0.20638275146484375, 0.2166290283203125, 0.22687530517578125, 0.23712158203125, 0.24736785888671875, 0.2576141357421875, 0.26786041259765625, 0.278106689453125, 0.28835296630859375, 0.2985992431640625, 0.30884552001953125, 0.319091796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 14.0, 13.0, 22.0, 13.0, 19.0, 27.0, 34.0, 32.0, 45.0, 60.0, 47.0, 61.0, 86.0, 59.0, 62.0, 59.0, 69.0, 42.0, 35.0, 38.0, 35.0, 23.0, 16.0, 9.0, 9.0, 12.0, 4.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49811553955078125, -0.4820709228515625, -0.46602630615234375, -0.449981689453125, -0.43393707275390625, -0.4178924560546875, -0.40184783935546875, -0.38580322265625, -0.36975860595703125, -0.3537139892578125, -0.33766937255859375, -0.321624755859375, -0.30558013916015625, -0.2895355224609375, -0.27349090576171875, -0.2574462890625, -0.24140167236328125, -0.2253570556640625, -0.20931243896484375, -0.193267822265625, -0.17722320556640625, -0.1611785888671875, -0.14513397216796875, -0.12908935546875, -0.11304473876953125, -0.0970001220703125, -0.08095550537109375, -0.064910888671875, -0.04886627197265625, -0.0328216552734375, -0.01677703857421875, -0.000732421875, 0.01531219482421875, 0.0313568115234375, 0.04740142822265625, 0.063446044921875, 0.07949066162109375, 0.0955352783203125, 0.11157989501953125, 0.12762451171875, 0.14366912841796875, 0.1597137451171875, 0.17575836181640625, 0.191802978515625, 0.20784759521484375, 0.2238922119140625, 0.23993682861328125, 0.2559814453125, 0.27202606201171875, 0.2880706787109375, 0.30411529541015625, 0.320159912109375, 0.33620452880859375, 0.3522491455078125, 0.36829376220703125, 0.38433837890625, 0.40038299560546875, 0.4164276123046875, 0.43247222900390625, 0.448516845703125, 0.46456146240234375, 0.4806060791015625, 0.49665069580078125, 0.5126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 12.0, 14.0, 26.0, 35.0, 60.0, 127.0, 252.0, 554.0, 1418.0, 4677.0, 20803.0, 142456.0, 745483.0, 109505.0, 16982.0, 3862.0, 1275.0, 526.0, 214.0, 101.0, 69.0, 39.0, 25.0, 12.0, 8.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.124267578125, -0.11918258666992188, -0.11409759521484375, -0.10901260375976562, -0.1039276123046875, -0.09884262084960938, -0.09375762939453125, -0.08867263793945312, -0.083587646484375, -0.07850265502929688, -0.07341766357421875, -0.06833267211914062, -0.0632476806640625, -0.058162689208984375, -0.05307769775390625, -0.047992706298828125, -0.04290771484375, -0.037822723388671875, -0.03273773193359375, -0.027652740478515625, -0.0225677490234375, -0.017482757568359375, -0.01239776611328125, -0.007312774658203125, -0.002227783203125, 0.002857208251953125, 0.00794219970703125, 0.013027191162109375, 0.0181121826171875, 0.023197174072265625, 0.02828216552734375, 0.033367156982421875, 0.0384521484375, 0.043537139892578125, 0.04862213134765625, 0.053707122802734375, 0.0587921142578125, 0.06387710571289062, 0.06896209716796875, 0.07404708862304688, 0.079132080078125, 0.08421707153320312, 0.08930206298828125, 0.09438705444335938, 0.0994720458984375, 0.10455703735351562, 0.10964202880859375, 0.11472702026367188, 0.11981201171875, 0.12489700317382812, 0.12998199462890625, 0.13506698608398438, 0.1401519775390625, 0.14523696899414062, 0.15032196044921875, 0.15540695190429688, 0.160491943359375, 0.16557693481445312, 0.17066192626953125, 0.17574691772460938, 0.1808319091796875, 0.18591690063476562, 0.19100189208984375, 0.19608688354492188, 0.201171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 11.0, 18.0, 18.0, 35.0, 32.0, 28.0, 71.0, 74.0, 82.0, 101.0, 85.0, 98.0, 77.0, 70.0, 36.0, 28.0, 32.0, 29.0, 24.0, 7.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.607439041137695e-05, -4.481431096792221e-05, -4.355423152446747e-05, -4.2294152081012726e-05, -4.1034072637557983e-05, -3.977399319410324e-05, -3.85139137506485e-05, -3.7253834307193756e-05, -3.5993754863739014e-05, -3.473367542028427e-05, -3.347359597682953e-05, -3.2213516533374786e-05, -3.0953437089920044e-05, -2.96933576464653e-05, -2.843327820301056e-05, -2.7173198759555817e-05, -2.5913119316101074e-05, -2.4653039872646332e-05, -2.339296042919159e-05, -2.2132880985736847e-05, -2.0872801542282104e-05, -1.9612722098827362e-05, -1.835264265537262e-05, -1.7092563211917877e-05, -1.5832483768463135e-05, -1.4572404325008392e-05, -1.331232488155365e-05, -1.2052245438098907e-05, -1.0792165994644165e-05, -9.532086551189423e-06, -8.27200710773468e-06, -7.011927664279938e-06, -5.751848220825195e-06, -4.491768777370453e-06, -3.2316893339157104e-06, -1.971609890460968e-06, -7.115304470062256e-07, 5.485489964485168e-07, 1.8086284399032593e-06, 3.0687078833580017e-06, 4.328787326812744e-06, 5.5888667702674866e-06, 6.848946213722229e-06, 8.109025657176971e-06, 9.369105100631714e-06, 1.0629184544086456e-05, 1.1889263987541199e-05, 1.3149343430995941e-05, 1.4409422874450684e-05, 1.5669502317905426e-05, 1.692958176136017e-05, 1.818966120481491e-05, 1.9449740648269653e-05, 2.0709820091724396e-05, 2.1969899535179138e-05, 2.322997897863388e-05, 2.4490058422088623e-05, 2.5750137865543365e-05, 2.7010217308998108e-05, 2.827029675245285e-05, 2.9530376195907593e-05, 3.0790455639362335e-05, 3.205053508281708e-05, 3.331061452627182e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 12.0, 13.0, 21.0, 24.0, 51.0, 56.0, 87.0, 170.0, 355.0, 649.0, 1452.0, 3589.0, 11813.0, 49752.0, 288272.0, 590288.0, 77347.0, 16300.0, 4789.0, 1754.0, 819.0, 389.0, 195.0, 117.0, 82.0, 41.0, 29.0, 20.0, 15.0, 16.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.160400390625, -0.15619373321533203, -0.15198707580566406, -0.1477804183959961, -0.14357376098632812, -0.13936710357666016, -0.1351604461669922, -0.13095378875732422, -0.12674713134765625, -0.12254047393798828, -0.11833381652832031, -0.11412715911865234, -0.10992050170898438, -0.1057138442993164, -0.10150718688964844, -0.09730052947998047, -0.0930938720703125, -0.08888721466064453, -0.08468055725097656, -0.0804738998413086, -0.07626724243164062, -0.07206058502197266, -0.06785392761230469, -0.06364727020263672, -0.05944061279296875, -0.05523395538330078, -0.05102729797363281, -0.046820640563964844, -0.042613983154296875, -0.038407325744628906, -0.03420066833496094, -0.02999401092529297, -0.025787353515625, -0.02158069610595703, -0.017374038696289062, -0.013167381286621094, -0.008960723876953125, -0.004754066467285156, -0.0005474090576171875, 0.0036592483520507812, 0.00786590576171875, 0.012072563171386719, 0.016279220581054688, 0.020485877990722656, 0.024692535400390625, 0.028899192810058594, 0.03310585021972656, 0.03731250762939453, 0.0415191650390625, 0.04572582244873047, 0.04993247985839844, 0.054139137268066406, 0.058345794677734375, 0.06255245208740234, 0.06675910949707031, 0.07096576690673828, 0.07517242431640625, 0.07937908172607422, 0.08358573913574219, 0.08779239654541016, 0.09199905395507812, 0.0962057113647461, 0.10041236877441406, 0.10461902618408203, 0.10882568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 16.0, 26.0, 39.0, 52.0, 65.0, 71.0, 95.0, 104.0, 90.0, 91.0, 67.0, 54.0, 58.0, 38.0, 23.0, 13.0, 19.0, 7.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14571762084960938, -0.14165496826171875, -0.13759231567382812, -0.1335296630859375, -0.12946701049804688, -0.12540435791015625, -0.12134170532226562, -0.117279052734375, -0.11321640014648438, -0.10915374755859375, -0.10509109497070312, -0.1010284423828125, -0.09696578979492188, -0.09290313720703125, -0.08884048461914062, -0.08477783203125, -0.08071517944335938, -0.07665252685546875, -0.07258987426757812, -0.0685272216796875, -0.06446456909179688, -0.06040191650390625, -0.056339263916015625, -0.052276611328125, -0.048213958740234375, -0.04415130615234375, -0.040088653564453125, -0.0360260009765625, -0.031963348388671875, -0.02790069580078125, -0.023838043212890625, -0.019775390625, -0.015712738037109375, -0.01165008544921875, -0.007587432861328125, -0.0035247802734375, 0.000537872314453125, 0.00460052490234375, 0.008663177490234375, 0.012725830078125, 0.016788482666015625, 0.02085113525390625, 0.024913787841796875, 0.0289764404296875, 0.033039093017578125, 0.03710174560546875, 0.041164398193359375, 0.04522705078125, 0.049289703369140625, 0.05335235595703125, 0.057415008544921875, 0.0614776611328125, 0.06554031372070312, 0.06960296630859375, 0.07366561889648438, 0.077728271484375, 0.08179092407226562, 0.08585357666015625, 0.08991622924804688, 0.0939788818359375, 0.09804153442382812, 0.10210418701171875, 0.10616683959960938, 0.1102294921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 11.0, 14.0, 25.0, 52.0, 95.0, 136.0, 265.0, 177.0, 97.0, 58.0, 32.0, 8.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.548521041870117, -3.4740092754364014, -3.3994977474212646, -3.324985980987549, -3.250474214553833, -3.175962448120117, -3.1014509201049805, -3.0269391536712646, -2.952427387237549, -2.877915620803833, -2.8034040927886963, -2.7288923263549805, -2.6543805599212646, -2.579868793487549, -2.505357265472412, -2.4308454990386963, -2.3563339710235596, -2.2818222045898438, -2.207310676574707, -2.132798910140991, -2.0582871437072754, -1.9837754964828491, -1.9092638492584229, -1.834752082824707, -1.7602404356002808, -1.6857287883758545, -1.6112170219421387, -1.5367053747177124, -1.4621937274932861, -1.3876819610595703, -1.313170313835144, -1.2386586666107178, -1.1641470193862915, -1.0896353721618652, -1.0151236057281494, -0.9406119585037231, -0.8661002516746521, -0.791588544845581, -0.7170768976211548, -0.6425651907920837, -0.5680534839630127, -0.49354177713394165, -0.419030100107193, -0.34451842308044434, -0.2700067162513733, -0.19549500942230225, -0.12098333239555359, -0.04647165536880493, 0.028040051460266113, 0.10255174338817596, 0.17706343531608582, 0.2515751123428345, 0.3260868191719055, 0.40059852600097656, 0.4751102030277252, 0.5496218800544739, 0.6241335868835449, 0.698645293712616, 0.773157000541687, 0.8476686477661133, 0.9221803545951843, 0.9966920614242554, 1.0712037086486816, 1.1457154750823975, 1.2202271223068237]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 17.0, 19.0, 20.0, 17.0, 30.0, 31.0, 56.0, 41.0, 60.0, 93.0, 86.0, 73.0, 82.0, 62.0, 48.0, 31.0, 28.0, 24.0, 25.0, 15.0, 15.0, 14.0, 12.0, 15.0, 9.0, 9.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.151763916015625, -2.0883803367614746, -2.024996757507324, -1.9616132974624634, -1.8982298374176025, -1.8348462581634521, -1.7714626789093018, -1.7080790996551514, -1.6446956396102905, -1.5813120603561401, -1.5179286003112793, -1.454545021057129, -1.3911614418029785, -1.3277779817581177, -1.2643944025039673, -1.2010109424591064, -1.137627363204956, -1.0742437839508057, -1.0108603239059448, -0.9474767446517944, -0.8840932250022888, -0.8207097053527832, -0.7573261260986328, -0.6939426064491272, -0.6305590867996216, -0.567175567150116, -0.5037920475006104, -0.44040846824645996, -0.37702494859695435, -0.31364142894744873, -0.2502578794956207, -0.18687433004379272, -0.12349069118499756, -0.06010715663433075, 0.0032763779163360596, 0.06665991246700287, 0.13004344701766968, 0.1934269666671753, 0.2568105161190033, 0.3201940655708313, 0.3835775852203369, 0.44696110486984253, 0.5103446245193481, 0.5737282037734985, 0.6371117234230042, 0.7004952430725098, 0.7638788223266602, 0.8272623419761658, 0.8906458616256714, 0.954029381275177, 1.0174129009246826, 1.080796480178833, 1.1441800594329834, 1.2075635194778442, 1.2709470987319946, 1.3343305587768555, 1.3977141380310059, 1.4610977172851562, 1.524481177330017, 1.5878647565841675, 1.6512482166290283, 1.7146317958831787, 1.778015375137329, 1.8413989543914795, 1.9047824144363403]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 12.0, 27.0, 23.0, 43.0, 73.0, 113.0, 173.0, 313.0, 478.0, 824.0, 1417.0, 2629.0, 4741.0, 9433.0, 20248.0, 48136.0, 140285.0, 530389.0, 1851855.0, 1155840.0, 281993.0, 83610.0, 31713.0, 14273.0, 6908.0, 3727.0, 2065.0, 1109.0, 668.0, 436.0, 233.0, 185.0, 112.0, 69.0, 33.0, 35.0, 15.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1180419921875, -0.11474227905273438, -0.11144256591796875, -0.10814285278320312, -0.1048431396484375, -0.10154342651367188, -0.09824371337890625, -0.09494400024414062, -0.091644287109375, -0.08834457397460938, -0.08504486083984375, -0.08174514770507812, -0.0784454345703125, -0.07514572143554688, -0.07184600830078125, -0.06854629516601562, -0.06524658203125, -0.061946868896484375, -0.05864715576171875, -0.055347442626953125, -0.0520477294921875, -0.048748016357421875, -0.04544830322265625, -0.042148590087890625, -0.038848876953125, -0.035549163818359375, -0.03224945068359375, -0.028949737548828125, -0.0256500244140625, -0.022350311279296875, -0.01905059814453125, -0.015750885009765625, -0.012451171875, -0.009151458740234375, -0.00585174560546875, -0.002552032470703125, 0.0007476806640625, 0.004047393798828125, 0.00734710693359375, 0.010646820068359375, 0.013946533203125, 0.017246246337890625, 0.02054595947265625, 0.023845672607421875, 0.0271453857421875, 0.030445098876953125, 0.03374481201171875, 0.037044525146484375, 0.04034423828125, 0.043643951416015625, 0.04694366455078125, 0.050243377685546875, 0.0535430908203125, 0.056842803955078125, 0.06014251708984375, 0.06344223022460938, 0.066741943359375, 0.07004165649414062, 0.07334136962890625, 0.07664108276367188, 0.0799407958984375, 0.08324050903320312, 0.08654022216796875, 0.08983993530273438, 0.0931396484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 8.0, 10.0, 10.0, 11.0, 19.0, 13.0, 26.0, 27.0, 35.0, 35.0, 37.0, 48.0, 52.0, 46.0, 52.0, 47.0, 59.0, 45.0, 51.0, 55.0, 39.0, 45.0, 37.0, 33.0, 17.0, 24.0, 26.0, 17.0, 8.0, 18.0, 9.0, 14.0, 6.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10247802734375, -0.09899139404296875, -0.0955047607421875, -0.09201812744140625, -0.088531494140625, -0.08504486083984375, -0.0815582275390625, -0.07807159423828125, -0.0745849609375, -0.07109832763671875, -0.0676116943359375, -0.06412506103515625, -0.060638427734375, -0.05715179443359375, -0.0536651611328125, -0.05017852783203125, -0.04669189453125, -0.04320526123046875, -0.0397186279296875, -0.03623199462890625, -0.032745361328125, -0.02925872802734375, -0.0257720947265625, -0.02228546142578125, -0.018798828125, -0.01531219482421875, -0.0118255615234375, -0.00833892822265625, -0.004852294921875, -0.00136566162109375, 0.0021209716796875, 0.00560760498046875, 0.00909423828125, 0.01258087158203125, 0.0160675048828125, 0.01955413818359375, 0.023040771484375, 0.02652740478515625, 0.0300140380859375, 0.03350067138671875, 0.0369873046875, 0.04047393798828125, 0.0439605712890625, 0.04744720458984375, 0.050933837890625, 0.05442047119140625, 0.0579071044921875, 0.06139373779296875, 0.06488037109375, 0.06836700439453125, 0.0718536376953125, 0.07534027099609375, 0.078826904296875, 0.08231353759765625, 0.0858001708984375, 0.08928680419921875, 0.0927734375, 0.09626007080078125, 0.0997467041015625, 0.10323333740234375, 0.106719970703125, 0.11020660400390625, 0.1136932373046875, 0.11717987060546875, 0.12066650390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 9.0, 15.0, 24.0, 40.0, 77.0, 192.0, 479.0, 2534.0, 30734.0, 3126536.0, 1014953.0, 16496.0, 1540.0, 373.0, 105.0, 67.0, 37.0, 21.0, 16.0, 7.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6374435424804688, -0.6186370849609375, -0.5998306274414062, -0.581024169921875, -0.5622177124023438, -0.5434112548828125, -0.5246047973632812, -0.50579833984375, -0.48699188232421875, -0.4681854248046875, -0.44937896728515625, -0.430572509765625, -0.41176605224609375, -0.3929595947265625, -0.37415313720703125, -0.3553466796875, -0.33654022216796875, -0.3177337646484375, -0.29892730712890625, -0.280120849609375, -0.26131439208984375, -0.2425079345703125, -0.22370147705078125, -0.20489501953125, -0.18608856201171875, -0.1672821044921875, -0.14847564697265625, -0.129669189453125, -0.11086273193359375, -0.0920562744140625, -0.07324981689453125, -0.054443359375, -0.03563690185546875, -0.0168304443359375, 0.00197601318359375, 0.020782470703125, 0.03958892822265625, 0.0583953857421875, 0.07720184326171875, 0.09600830078125, 0.11481475830078125, 0.1336212158203125, 0.15242767333984375, 0.171234130859375, 0.19004058837890625, 0.2088470458984375, 0.22765350341796875, 0.2464599609375, 0.26526641845703125, 0.2840728759765625, 0.30287933349609375, 0.321685791015625, 0.34049224853515625, 0.3592987060546875, 0.37810516357421875, 0.39691162109375, 0.41571807861328125, 0.4345245361328125, 0.45333099365234375, 0.472137451171875, 0.49094390869140625, 0.5097503662109375, 0.5285568237304688, 0.54736328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 4.0, 4.0, 12.0, 11.0, 18.0, 23.0, 26.0, 40.0, 49.0, 92.0, 102.0, 147.0, 195.0, 360.0, 509.0, 575.0, 610.0, 379.0, 272.0, 165.0, 118.0, 92.0, 74.0, 38.0, 27.0, 29.0, 18.0, 17.0, 13.0, 9.0, 9.0, 6.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25914764404296875, -0.2516937255859375, -0.24423980712890625, -0.236785888671875, -0.22933197021484375, -0.2218780517578125, -0.21442413330078125, -0.20697021484375, -0.19951629638671875, -0.1920623779296875, -0.18460845947265625, -0.177154541015625, -0.16970062255859375, -0.1622467041015625, -0.15479278564453125, -0.1473388671875, -0.13988494873046875, -0.1324310302734375, -0.12497711181640625, -0.117523193359375, -0.11006927490234375, -0.1026153564453125, -0.09516143798828125, -0.08770751953125, -0.08025360107421875, -0.0727996826171875, -0.06534576416015625, -0.057891845703125, -0.05043792724609375, -0.0429840087890625, -0.03553009033203125, -0.028076171875, -0.02062225341796875, -0.0131683349609375, -0.00571441650390625, 0.001739501953125, 0.00919342041015625, 0.0166473388671875, 0.02410125732421875, 0.03155517578125, 0.03900909423828125, 0.0464630126953125, 0.05391693115234375, 0.061370849609375, 0.06882476806640625, 0.0762786865234375, 0.08373260498046875, 0.0911865234375, 0.09864044189453125, 0.1060943603515625, 0.11354827880859375, 0.121002197265625, 0.12845611572265625, 0.1359100341796875, 0.14336395263671875, 0.15081787109375, 0.15827178955078125, 0.1657257080078125, 0.17317962646484375, 0.180633544921875, 0.18808746337890625, 0.1955413818359375, 0.20299530029296875, 0.21044921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 12.0, 30.0, 71.0, 178.0, 270.0, 217.0, 127.0, 57.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.443475246429443, -4.325896739959717, -4.20831823348999, -4.090740203857422, -3.9731616973876953, -3.8555831909179688, -3.738004684448242, -3.6204264163970947, -3.5028481483459473, -3.3852696418762207, -3.2676913738250732, -3.1501128673553467, -3.032534599304199, -2.9149560928344727, -2.797377586364746, -2.6797993183135986, -2.562220811843872, -2.4446423053741455, -2.327064037322998, -2.2094855308532715, -2.091907262802124, -1.9743287563323975, -1.8567503690719604, -1.7391719818115234, -1.6215935945510864, -1.5040152072906494, -1.3864368200302124, -1.2688584327697754, -1.1512799263000488, -1.0337016582489014, -0.9161231517791748, -0.7985447645187378, -0.6809661388397217, -0.5633877515792847, -0.44580933451652527, -0.32823091745376587, -0.21065253019332886, -0.09307414293289185, 0.02450430393218994, 0.14208269119262695, 0.25966107845306396, 0.377239465713501, 0.4948178827762604, 0.6123962998390198, 0.7299746870994568, 0.8475530743598938, 0.9651315212249756, 1.0827099084854126, 1.2002882957458496, 1.3178666830062866, 1.4354450702667236, 1.5530235767364502, 1.6706018447875977, 1.7881803512573242, 1.9057587385177612, 2.0233371257781982, 2.1409153938293457, 2.2584939002990723, 2.3760721683502197, 2.4936506748199463, 2.6112289428710938, 2.7288074493408203, 2.846385955810547, 2.9639642238616943, 3.081542730331421]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 7.0, 12.0, 12.0, 15.0, 15.0, 23.0, 27.0, 23.0, 29.0, 31.0, 27.0, 27.0, 36.0, 43.0, 47.0, 38.0, 46.0, 53.0, 42.0, 40.0, 32.0, 43.0, 28.0, 33.0, 25.0, 29.0, 27.0, 23.0, 20.0, 17.0, 20.0, 18.0, 11.0, 12.0, 9.0, 12.0, 2.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9159272909164429, -0.8853943943977356, -0.8548614978790283, -0.824328601360321, -0.7937957048416138, -0.7632628083229065, -0.7327299118041992, -0.7021970152854919, -0.6716641187667847, -0.6411312222480774, -0.6105983257293701, -0.5800654292106628, -0.5495325326919556, -0.5189996361732483, -0.488466739654541, -0.45793384313583374, -0.4274009168148041, -0.3968680202960968, -0.3663351237773895, -0.33580222725868225, -0.305269330739975, -0.2747364044189453, -0.24420352280139923, -0.21367062628269196, -0.18313772976398468, -0.1526048332452774, -0.12207193672657013, -0.09153903275728226, -0.06100613623857498, -0.03047323226928711, 5.9664249420166016e-05, 0.03059256076812744, 0.06112545728683472, 0.09165835380554199, 0.12219125032424927, 0.15272414684295654, 0.18325704336166382, 0.2137899547815323, 0.24432285130023956, 0.27485573291778564, 0.3053886294364929, 0.3359215259552002, 0.36645442247390747, 0.39698731899261475, 0.427520215511322, 0.4580531120300293, 0.4885860085487366, 0.5191189050674438, 0.5496518611907959, 0.5801847577095032, 0.6107176542282104, 0.6412505507469177, 0.671783447265625, 0.7023163437843323, 0.7328492403030396, 0.7633821368217468, 0.7939150333404541, 0.8244479298591614, 0.8549808263778687, 0.8855137228965759, 0.9160466194152832, 0.9465795159339905, 0.9771124124526978, 1.0076453685760498, 1.0381782054901123]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 20.0, 28.0, 35.0, 43.0, 55.0, 124.0, 149.0, 228.0, 378.0, 565.0, 966.0, 1739.0, 3484.0, 7865.0, 21546.0, 79546.0, 345421.0, 431516.0, 109036.0, 27529.0, 9451.0, 3891.0, 2012.0, 1116.0, 676.0, 378.0, 248.0, 159.0, 106.0, 81.0, 49.0, 35.0, 21.0, 19.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20113372802734375, -0.1952362060546875, -0.18933868408203125, -0.183441162109375, -0.17754364013671875, -0.1716461181640625, -0.16574859619140625, -0.15985107421875, -0.15395355224609375, -0.1480560302734375, -0.14215850830078125, -0.136260986328125, -0.13036346435546875, -0.1244659423828125, -0.11856842041015625, -0.1126708984375, -0.10677337646484375, -0.1008758544921875, -0.09497833251953125, -0.089080810546875, -0.08318328857421875, -0.0772857666015625, -0.07138824462890625, -0.06549072265625, -0.05959320068359375, -0.0536956787109375, -0.04779815673828125, -0.041900634765625, -0.03600311279296875, -0.0301055908203125, -0.02420806884765625, -0.018310546875, -0.01241302490234375, -0.0065155029296875, -0.00061798095703125, 0.005279541015625, 0.01117706298828125, 0.0170745849609375, 0.02297210693359375, 0.02886962890625, 0.03476715087890625, 0.0406646728515625, 0.04656219482421875, 0.052459716796875, 0.05835723876953125, 0.0642547607421875, 0.07015228271484375, 0.0760498046875, 0.08194732666015625, 0.0878448486328125, 0.09374237060546875, 0.099639892578125, 0.10553741455078125, 0.1114349365234375, 0.11733245849609375, 0.12322998046875, 0.12912750244140625, 0.1350250244140625, 0.14092254638671875, 0.146820068359375, 0.15271759033203125, 0.1586151123046875, 0.16451263427734375, 0.17041015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 7.0, 18.0, 14.0, 17.0, 12.0, 17.0, 17.0, 18.0, 27.0, 34.0, 38.0, 27.0, 33.0, 35.0, 46.0, 36.0, 47.0, 42.0, 43.0, 34.0, 26.0, 43.0, 38.0, 48.0, 24.0, 29.0, 34.0, 27.0, 19.0, 9.0, 22.0, 13.0, 18.0, 10.0, 7.0, 11.0, 10.0, 4.0, 7.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.09228515625, -0.0894479751586914, -0.08661079406738281, -0.08377361297607422, -0.08093643188476562, -0.07809925079345703, -0.07526206970214844, -0.07242488861083984, -0.06958770751953125, -0.06675052642822266, -0.06391334533691406, -0.06107616424560547, -0.058238983154296875, -0.05540180206298828, -0.05256462097167969, -0.049727439880371094, -0.0468902587890625, -0.044053077697753906, -0.04121589660644531, -0.03837871551513672, -0.035541534423828125, -0.03270435333251953, -0.029867172241210938, -0.027029991149902344, -0.02419281005859375, -0.021355628967285156, -0.018518447875976562, -0.01568126678466797, -0.012844085693359375, -0.010006904602050781, -0.0071697235107421875, -0.004332542419433594, -0.001495361328125, 0.0013418197631835938, 0.0041790008544921875, 0.007016181945800781, 0.009853363037109375, 0.012690544128417969, 0.015527725219726562, 0.018364906311035156, 0.02120208740234375, 0.024039268493652344, 0.026876449584960938, 0.02971363067626953, 0.032550811767578125, 0.03538799285888672, 0.03822517395019531, 0.041062355041503906, 0.0438995361328125, 0.046736717224121094, 0.04957389831542969, 0.05241107940673828, 0.055248260498046875, 0.05808544158935547, 0.06092262268066406, 0.06375980377197266, 0.06659698486328125, 0.06943416595458984, 0.07227134704589844, 0.07510852813720703, 0.07794570922851562, 0.08078289031982422, 0.08362007141113281, 0.0864572525024414, 0.08929443359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 1.0, 6.0, 6.0, 11.0, 13.0, 22.0, 21.0, 27.0, 46.0, 57.0, 87.0, 120.0, 179.0, 343.0, 577.0, 1137.0, 2652.0, 8290.0, 41535.0, 590465.0, 355327.0, 35229.0, 7199.0, 2508.0, 1168.0, 568.0, 343.0, 198.0, 130.0, 87.0, 53.0, 34.0, 34.0, 20.0, 11.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.322998046875, -0.31375885009765625, -0.3045196533203125, -0.29528045654296875, -0.286041259765625, -0.27680206298828125, -0.2675628662109375, -0.25832366943359375, -0.24908447265625, -0.23984527587890625, -0.2306060791015625, -0.22136688232421875, -0.212127685546875, -0.20288848876953125, -0.1936492919921875, -0.18441009521484375, -0.1751708984375, -0.16593170166015625, -0.1566925048828125, -0.14745330810546875, -0.138214111328125, -0.12897491455078125, -0.1197357177734375, -0.11049652099609375, -0.10125732421875, -0.09201812744140625, -0.0827789306640625, -0.07353973388671875, -0.064300537109375, -0.05506134033203125, -0.0458221435546875, -0.03658294677734375, -0.02734375, -0.01810455322265625, -0.0088653564453125, 0.00037384033203125, 0.009613037109375, 0.01885223388671875, 0.0280914306640625, 0.03733062744140625, 0.04656982421875, 0.05580902099609375, 0.0650482177734375, 0.07428741455078125, 0.083526611328125, 0.09276580810546875, 0.1020050048828125, 0.11124420166015625, 0.1204833984375, 0.12972259521484375, 0.1389617919921875, 0.14820098876953125, 0.157440185546875, 0.16667938232421875, 0.1759185791015625, 0.18515777587890625, 0.19439697265625, 0.20363616943359375, 0.2128753662109375, 0.22211456298828125, 0.231353759765625, 0.24059295654296875, 0.2498321533203125, 0.25907135009765625, 0.268310546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 6.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 10.0, 23.0, 18.0, 27.0, 40.0, 37.0, 41.0, 52.0, 60.0, 62.0, 63.0, 63.0, 60.0, 58.0, 51.0, 40.0, 48.0, 42.0, 22.0, 21.0, 30.0, 14.0, 18.0, 15.0, 5.0, 6.0, 4.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5652580261230469, -0.5499496459960938, -0.5346412658691406, -0.5193328857421875, -0.5040245056152344, -0.48871612548828125, -0.4734077453613281, -0.458099365234375, -0.4427909851074219, -0.42748260498046875, -0.4121742248535156, -0.3968658447265625, -0.3815574645996094, -0.36624908447265625, -0.3509407043457031, -0.33563232421875, -0.3203239440917969, -0.30501556396484375, -0.2897071838378906, -0.2743988037109375, -0.2590904235839844, -0.24378204345703125, -0.22847366333007812, -0.213165283203125, -0.19785690307617188, -0.18254852294921875, -0.16724014282226562, -0.1519317626953125, -0.13662338256835938, -0.12131500244140625, -0.10600662231445312, -0.0906982421875, -0.07538986206054688, -0.06008148193359375, -0.044773101806640625, -0.0294647216796875, -0.014156341552734375, 0.00115203857421875, 0.016460418701171875, 0.031768798828125, 0.047077178955078125, 0.06238555908203125, 0.07769393920898438, 0.0930023193359375, 0.10831069946289062, 0.12361907958984375, 0.13892745971679688, 0.15423583984375, 0.16954421997070312, 0.18485260009765625, 0.20016098022460938, 0.2154693603515625, 0.23077774047851562, 0.24608612060546875, 0.2613945007324219, 0.276702880859375, 0.2920112609863281, 0.30731964111328125, 0.3226280212402344, 0.3379364013671875, 0.3532447814941406, 0.36855316162109375, 0.3838615417480469, 0.399169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 2.0, 3.0, 5.0, 14.0, 18.0, 22.0, 48.0, 72.0, 128.0, 227.0, 421.0, 825.0, 1903.0, 4791.0, 13562.0, 52784.0, 558532.0, 345092.0, 49111.0, 12910.0, 4508.0, 1820.0, 778.0, 414.0, 231.0, 134.0, 69.0, 39.0, 36.0, 22.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12782955169677734, -0.12406730651855469, -0.12030506134033203, -0.11654281616210938, -0.11278057098388672, -0.10901832580566406, -0.1052560806274414, -0.10149383544921875, -0.0977315902709961, -0.09396934509277344, -0.09020709991455078, -0.08644485473632812, -0.08268260955810547, -0.07892036437988281, -0.07515811920166016, -0.0713958740234375, -0.06763362884521484, -0.06387138366699219, -0.06010913848876953, -0.056346893310546875, -0.05258464813232422, -0.04882240295410156, -0.045060157775878906, -0.04129791259765625, -0.037535667419433594, -0.03377342224121094, -0.03001117706298828, -0.026248931884765625, -0.02248668670654297, -0.018724441528320312, -0.014962196350097656, -0.011199951171875, -0.007437705993652344, -0.0036754608154296875, 8.678436279296875e-05, 0.003849029541015625, 0.007611274719238281, 0.011373519897460938, 0.015135765075683594, 0.01889801025390625, 0.022660255432128906, 0.026422500610351562, 0.03018474578857422, 0.033946990966796875, 0.03770923614501953, 0.04147148132324219, 0.045233726501464844, 0.0489959716796875, 0.052758216857910156, 0.05652046203613281, 0.06028270721435547, 0.06404495239257812, 0.06780719757080078, 0.07156944274902344, 0.0753316879272461, 0.07909393310546875, 0.0828561782836914, 0.08661842346191406, 0.09038066864013672, 0.09414291381835938, 0.09790515899658203, 0.10166740417480469, 0.10542964935302734, 0.10919189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 1.0, 6.0, 3.0, 10.0, 7.0, 19.0, 21.0, 43.0, 38.0, 38.0, 67.0, 73.0, 113.0, 102.0, 82.0, 84.0, 77.0, 42.0, 40.0, 34.0, 24.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.68952751159668e-05, -3.5715289413928986e-05, -3.4535303711891174e-05, -3.335531800985336e-05, -3.217533230781555e-05, -3.099534660577774e-05, -2.981536090373993e-05, -2.8635375201702118e-05, -2.7455389499664307e-05, -2.6275403797626495e-05, -2.5095418095588684e-05, -2.3915432393550873e-05, -2.273544669151306e-05, -2.155546098947525e-05, -2.037547528743744e-05, -1.9195489585399628e-05, -1.8015503883361816e-05, -1.6835518181324005e-05, -1.5655532479286194e-05, -1.4475546777248383e-05, -1.3295561075210571e-05, -1.211557537317276e-05, -1.0935589671134949e-05, -9.755603969097137e-06, -8.575618267059326e-06, -7.395632565021515e-06, -6.215646862983704e-06, -5.035661160945892e-06, -3.855675458908081e-06, -2.6756897568702698e-06, -1.4957040548324585e-06, -3.157183527946472e-07, 8.642673492431641e-07, 2.0442530512809753e-06, 3.2242387533187866e-06, 4.404224455356598e-06, 5.584210157394409e-06, 6.7641958594322205e-06, 7.944181561470032e-06, 9.124167263507843e-06, 1.0304152965545654e-05, 1.1484138667583466e-05, 1.2664124369621277e-05, 1.3844110071659088e-05, 1.50240957736969e-05, 1.620408147573471e-05, 1.7384067177772522e-05, 1.8564052879810333e-05, 1.9744038581848145e-05, 2.0924024283885956e-05, 2.2104009985923767e-05, 2.328399568796158e-05, 2.446398138999939e-05, 2.56439670920372e-05, 2.6823952794075012e-05, 2.8003938496112823e-05, 2.9183924198150635e-05, 3.0363909900188446e-05, 3.154389560222626e-05, 3.272388130426407e-05, 3.390386700630188e-05, 3.508385270833969e-05, 3.62638384103775e-05, 3.7443824112415314e-05, 3.8623809814453125e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 19.0, 25.0, 39.0, 70.0, 168.0, 354.0, 874.0, 3299.0, 19379.0, 286796.0, 703163.0, 28185.0, 4348.0, 1128.0, 381.0, 140.0, 83.0, 49.0, 18.0, 12.0, 11.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15822601318359375, -0.1516571044921875, -0.14508819580078125, -0.138519287109375, -0.13195037841796875, -0.1253814697265625, -0.11881256103515625, -0.11224365234375, -0.10567474365234375, -0.0991058349609375, -0.09253692626953125, -0.085968017578125, -0.07939910888671875, -0.0728302001953125, -0.06626129150390625, -0.0596923828125, -0.05312347412109375, -0.0465545654296875, -0.03998565673828125, -0.033416748046875, -0.02684783935546875, -0.0202789306640625, -0.01371002197265625, -0.00714111328125, -0.00057220458984375, 0.0059967041015625, 0.01256561279296875, 0.019134521484375, 0.02570343017578125, 0.0322723388671875, 0.03884124755859375, 0.04541015625, 0.05197906494140625, 0.0585479736328125, 0.06511688232421875, 0.071685791015625, 0.07825469970703125, 0.0848236083984375, 0.09139251708984375, 0.09796142578125, 0.10453033447265625, 0.1110992431640625, 0.11766815185546875, 0.124237060546875, 0.13080596923828125, 0.1373748779296875, 0.14394378662109375, 0.1505126953125, 0.15708160400390625, 0.1636505126953125, 0.17021942138671875, 0.176788330078125, 0.18335723876953125, 0.1899261474609375, 0.19649505615234375, 0.20306396484375, 0.20963287353515625, 0.2162017822265625, 0.22277069091796875, 0.229339599609375, 0.23590850830078125, 0.2424774169921875, 0.24904632568359375, 0.255615234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 17.0, 12.0, 20.0, 25.0, 51.0, 68.0, 100.0, 129.0, 172.0, 131.0, 78.0, 61.0, 33.0, 22.0, 20.0, 12.0, 11.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1607666015625, -0.1559600830078125, -0.151153564453125, -0.1463470458984375, -0.14154052734375, -0.1367340087890625, -0.131927490234375, -0.1271209716796875, -0.122314453125, -0.1175079345703125, -0.112701416015625, -0.1078948974609375, -0.10308837890625, -0.0982818603515625, -0.093475341796875, -0.0886688232421875, -0.0838623046875, -0.0790557861328125, -0.074249267578125, -0.0694427490234375, -0.06463623046875, -0.0598297119140625, -0.055023193359375, -0.0502166748046875, -0.04541015625, -0.0406036376953125, -0.035797119140625, -0.0309906005859375, -0.02618408203125, -0.0213775634765625, -0.016571044921875, -0.0117645263671875, -0.0069580078125, -0.0021514892578125, 0.002655029296875, 0.0074615478515625, 0.01226806640625, 0.0170745849609375, 0.021881103515625, 0.0266876220703125, 0.031494140625, 0.0363006591796875, 0.041107177734375, 0.0459136962890625, 0.05072021484375, 0.0555267333984375, 0.060333251953125, 0.0651397705078125, 0.0699462890625, 0.0747528076171875, 0.079559326171875, 0.0843658447265625, 0.08917236328125, 0.0939788818359375, 0.098785400390625, 0.1035919189453125, 0.1083984375, 0.1132049560546875, 0.118011474609375, 0.1228179931640625, 0.12762451171875, 0.1324310302734375, 0.137237548828125, 0.1420440673828125, 0.1468505859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 55.0, 92.0, 208.0, 383.0, 155.0, 47.0, 28.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.750192165374756, -3.6341590881347656, -3.5181257724761963, -3.402092695236206, -3.286059617996216, -3.1700263023376465, -3.0539932250976562, -2.937960147857666, -2.821927070617676, -2.7058939933776855, -2.589860677719116, -2.473827600479126, -2.3577945232391357, -2.2417612075805664, -2.125728130340576, -2.009695053100586, -1.8936617374420166, -1.7776285409927368, -1.6615954637527466, -1.5455622673034668, -1.4295291900634766, -1.3134959936141968, -1.197462797164917, -1.0814297199249268, -0.965396523475647, -0.849363386631012, -0.733330249786377, -0.6172970533370972, -0.5012639164924622, -0.38523077964782715, -0.26919758319854736, -0.15316444635391235, -0.037131309509277344, 0.07890184223651886, 0.19493499398231506, 0.31096816062927246, 0.42700129747390747, 0.5430344343185425, 0.6590676307678223, 0.7751007676124573, 0.8911339044570923, 1.007167100906372, 1.1232001781463623, 1.239233374595642, 1.3552665710449219, 1.471299648284912, 1.587332844734192, 1.7033660411834717, 1.819399118423462, 1.9354323148727417, 2.0514655113220215, 2.1674985885620117, 2.283531665802002, 2.399564743041992, 2.5155980587005615, 2.6316311359405518, 2.747664451599121, 2.8636975288391113, 2.9797308444976807, 3.095763921737671, 3.211796998977661, 3.3278303146362305, 3.4438633918762207, 3.559896469116211, 3.675929546356201]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 12.0, 6.0, 13.0, 14.0, 24.0, 19.0, 27.0, 22.0, 28.0, 35.0, 32.0, 44.0, 45.0, 59.0, 71.0, 63.0, 67.0, 60.0, 45.0, 33.0, 26.0, 21.0, 21.0, 25.0, 21.0, 17.0, 22.0, 15.0, 8.0, 9.0, 15.0, 8.0, 14.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.4265739917755127, -1.3821661472320557, -1.3377584218978882, -1.2933505773544312, -1.2489428520202637, -1.2045350074768066, -1.1601271629333496, -1.1157194375991821, -1.0713117122650146, -1.0269038677215576, -0.9824961423873901, -0.9380882978439331, -0.8936805725097656, -0.8492727279663086, -0.8048649430274963, -0.7604571580886841, -0.716049313545227, -0.6716415286064148, -0.6272337436676025, -0.5828258991241455, -0.538418173789978, -0.4940103590488434, -0.44960254430770874, -0.4051947593688965, -0.36078697443008423, -0.316379189491272, -0.2719714045524597, -0.22756358981132507, -0.18315580487251282, -0.13874801993370056, -0.09434020519256592, -0.04993242025375366, -0.005524754524230957, 0.038883037865161896, 0.08329083025455475, 0.1276986300945282, 0.17210641503334045, 0.2165141999721527, 0.26092201471328735, 0.3053297996520996, 0.34973758459091187, 0.3941453695297241, 0.4385531544685364, 0.482960969209671, 0.5273687839508057, 0.5717765092849731, 0.6161843538284302, 0.6605921387672424, 0.7049999237060547, 0.7494077086448669, 0.7938154935836792, 0.8382233381271362, 0.8826310634613037, 0.9270389080047607, 0.971446692943573, 1.0158544778823853, 1.0602622032165527, 1.1046700477600098, 1.1490777730941772, 1.1934856176376343, 1.2378933429718018, 1.2823011875152588, 1.3267090320587158, 1.3711167573928833, 1.4155246019363403]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 14.0, 16.0, 37.0, 46.0, 74.0, 135.0, 179.0, 299.0, 475.0, 738.0, 1380.0, 2306.0, 4219.0, 8160.0, 16659.0, 37654.0, 97272.0, 298451.0, 1000340.0, 1762845.0, 653703.0, 190244.0, 65268.0, 26910.0, 12390.0, 6166.0, 3448.0, 1962.0, 1071.0, 722.0, 387.0, 246.0, 145.0, 102.0, 62.0, 48.0, 28.0, 22.0, 9.0, 12.0, 4.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.1021728515625, -0.09901142120361328, -0.09584999084472656, -0.09268856048583984, -0.08952713012695312, -0.0863656997680664, -0.08320426940917969, -0.08004283905029297, -0.07688140869140625, -0.07371997833251953, -0.07055854797363281, -0.0673971176147461, -0.06423568725585938, -0.061074256896972656, -0.05791282653808594, -0.05475139617919922, -0.0515899658203125, -0.04842853546142578, -0.04526710510253906, -0.042105674743652344, -0.038944244384765625, -0.035782814025878906, -0.03262138366699219, -0.02945995330810547, -0.02629852294921875, -0.02313709259033203, -0.019975662231445312, -0.016814231872558594, -0.013652801513671875, -0.010491371154785156, -0.0073299407958984375, -0.004168510437011719, -0.001007080078125, 0.0021543502807617188, 0.0053157806396484375, 0.008477210998535156, 0.011638641357421875, 0.014800071716308594, 0.017961502075195312, 0.02112293243408203, 0.02428436279296875, 0.02744579315185547, 0.030607223510742188, 0.033768653869628906, 0.036930084228515625, 0.040091514587402344, 0.04325294494628906, 0.04641437530517578, 0.0495758056640625, 0.05273723602294922, 0.05589866638183594, 0.059060096740722656, 0.062221527099609375, 0.0653829574584961, 0.06854438781738281, 0.07170581817626953, 0.07486724853515625, 0.07802867889404297, 0.08119010925292969, 0.0843515396118164, 0.08751296997070312, 0.09067440032958984, 0.09383583068847656, 0.09699726104736328, 0.10015869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 11.0, 22.0, 18.0, 14.0, 30.0, 29.0, 28.0, 26.0, 44.0, 61.0, 35.0, 47.0, 54.0, 43.0, 42.0, 48.0, 57.0, 36.0, 36.0, 48.0, 27.0, 31.0, 24.0, 23.0, 26.0, 16.0, 17.0, 18.0, 5.0, 10.0, 5.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.10357666015625, -0.10036563873291016, -0.09715461730957031, -0.09394359588623047, -0.09073257446289062, -0.08752155303955078, -0.08431053161621094, -0.0810995101928711, -0.07788848876953125, -0.0746774673461914, -0.07146644592285156, -0.06825542449951172, -0.06504440307617188, -0.06183338165283203, -0.05862236022949219, -0.055411338806152344, -0.0522003173828125, -0.048989295959472656, -0.04577827453613281, -0.04256725311279297, -0.039356231689453125, -0.03614521026611328, -0.03293418884277344, -0.029723167419433594, -0.02651214599609375, -0.023301124572753906, -0.020090103149414062, -0.01687908172607422, -0.013668060302734375, -0.010457038879394531, -0.0072460174560546875, -0.004034996032714844, -0.000823974609375, 0.0023870468139648438, 0.0055980682373046875, 0.008809089660644531, 0.012020111083984375, 0.015231132507324219, 0.018442153930664062, 0.021653175354003906, 0.02486419677734375, 0.028075218200683594, 0.03128623962402344, 0.03449726104736328, 0.037708282470703125, 0.04091930389404297, 0.04413032531738281, 0.047341346740722656, 0.0505523681640625, 0.053763389587402344, 0.05697441101074219, 0.06018543243408203, 0.06339645385742188, 0.06660747528076172, 0.06981849670410156, 0.0730295181274414, 0.07624053955078125, 0.0794515609741211, 0.08266258239746094, 0.08587360382080078, 0.08908462524414062, 0.09229564666748047, 0.09550666809082031, 0.09871768951416016, 0.1019287109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 15.0, 12.0, 26.0, 33.0, 43.0, 68.0, 115.0, 238.0, 465.0, 1390.0, 6516.0, 48851.0, 902653.0, 3084150.0, 132315.0, 13540.0, 2426.0, 655.0, 272.0, 157.0, 97.0, 60.0, 48.0, 17.0, 23.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26018524169921875, -0.2498626708984375, -0.23954010009765625, -0.229217529296875, -0.21889495849609375, -0.2085723876953125, -0.19824981689453125, -0.18792724609375, -0.17760467529296875, -0.1672821044921875, -0.15695953369140625, -0.146636962890625, -0.13631439208984375, -0.1259918212890625, -0.11566925048828125, -0.1053466796875, -0.09502410888671875, -0.0847015380859375, -0.07437896728515625, -0.064056396484375, -0.05373382568359375, -0.0434112548828125, -0.03308868408203125, -0.02276611328125, -0.01244354248046875, -0.0021209716796875, 0.00820159912109375, 0.018524169921875, 0.02884674072265625, 0.0391693115234375, 0.04949188232421875, 0.059814453125, 0.07013702392578125, 0.0804595947265625, 0.09078216552734375, 0.101104736328125, 0.11142730712890625, 0.1217498779296875, 0.13207244873046875, 0.14239501953125, 0.15271759033203125, 0.1630401611328125, 0.17336273193359375, 0.183685302734375, 0.19400787353515625, 0.2043304443359375, 0.21465301513671875, 0.2249755859375, 0.23529815673828125, 0.2456207275390625, 0.25594329833984375, 0.266265869140625, 0.27658843994140625, 0.2869110107421875, 0.29723358154296875, 0.30755615234375, 0.31787872314453125, 0.3282012939453125, 0.33852386474609375, 0.348846435546875, 0.35916900634765625, 0.3694915771484375, 0.37981414794921875, 0.39013671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 20.0, 22.0, 28.0, 43.0, 40.0, 66.0, 84.0, 113.0, 144.0, 203.0, 265.0, 355.0, 469.0, 502.0, 423.0, 310.0, 235.0, 177.0, 143.0, 83.0, 66.0, 64.0, 36.0, 20.0, 27.0, 16.0, 16.0, 9.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1950206756591797, -0.18899154663085938, -0.18296241760253906, -0.17693328857421875, -0.17090415954589844, -0.16487503051757812, -0.1588459014892578, -0.1528167724609375, -0.1467876434326172, -0.14075851440429688, -0.13472938537597656, -0.12870025634765625, -0.12267112731933594, -0.11664199829101562, -0.11061286926269531, -0.104583740234375, -0.09855461120605469, -0.09252548217773438, -0.08649635314941406, -0.08046722412109375, -0.07443809509277344, -0.06840896606445312, -0.06237983703613281, -0.0563507080078125, -0.05032157897949219, -0.044292449951171875, -0.03826332092285156, -0.03223419189453125, -0.026205062866210938, -0.020175933837890625, -0.014146804809570312, -0.00811767578125, -0.0020885467529296875, 0.003940582275390625, 0.009969711303710938, 0.01599884033203125, 0.022027969360351562, 0.028057098388671875, 0.03408622741699219, 0.0401153564453125, 0.04614448547363281, 0.052173614501953125, 0.05820274353027344, 0.06423187255859375, 0.07026100158691406, 0.07629013061523438, 0.08231925964355469, 0.088348388671875, 0.09437751770019531, 0.10040664672851562, 0.10643577575683594, 0.11246490478515625, 0.11849403381347656, 0.12452316284179688, 0.1305522918701172, 0.1365814208984375, 0.1426105499267578, 0.14863967895507812, 0.15466880798339844, 0.16069793701171875, 0.16672706604003906, 0.17275619506835938, 0.1787853240966797, 0.184814453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 10.0, 6.0, 21.0, 42.0, 90.0, 132.0, 186.0, 217.0, 149.0, 65.0, 39.0, 22.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.780270576477051, -4.6871161460876465, -4.593961715698242, -4.50080680847168, -4.407652378082275, -4.314497947692871, -4.221343517303467, -4.1281890869140625, -4.0350341796875, -3.9418797492980957, -3.8487250804901123, -3.755570650100708, -3.6624159812927246, -3.5692615509033203, -3.476107120513916, -3.3829524517059326, -3.2897980213165283, -3.196643590927124, -3.1034889221191406, -3.0103344917297363, -2.917179822921753, -2.8240253925323486, -2.7308707237243652, -2.637716293334961, -2.5445618629455566, -2.4514074325561523, -2.358252763748169, -2.2650983333587646, -2.1719436645507812, -2.078789234161377, -1.985634684562683, -1.8924801349639893, -1.7993252277374268, -1.706170678138733, -1.613016128540039, -1.5198616981506348, -1.4267070293426514, -1.333552598953247, -1.2403980493545532, -1.1472434997558594, -1.0540889501571655, -0.9609344005584717, -0.8677798509597778, -0.7746253609657288, -0.6814708113670349, -0.5883162617683411, -0.495161771774292, -0.40200722217559814, -0.3088526725769043, -0.21569813787937164, -0.12254360318183899, -0.02938908338546753, 0.06376546621322632, 0.15692001581192017, 0.25007450580596924, 0.3432290554046631, 0.43638360500335693, 0.5295381546020508, 0.6226927042007446, 0.7158471941947937, 0.8090017437934875, 0.9021562933921814, 0.9953107833862305, 1.0884653329849243, 1.1816198825836182]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 16.0, 20.0, 31.0, 38.0, 36.0, 40.0, 38.0, 41.0, 36.0, 44.0, 44.0, 54.0, 44.0, 39.0, 49.0, 52.0, 41.0, 41.0, 43.0, 41.0, 32.0, 26.0, 26.0, 16.0, 10.0, 12.0, 8.0, 11.0, 9.0, 6.0, 6.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.13295578956604, -1.0957857370376587, -1.058615803718567, -1.0214457511901855, -0.984275758266449, -0.9471057653427124, -0.909935712814331, -0.8727657198905945, -0.8355957269668579, -0.7984257340431213, -0.7612557411193848, -0.7240856885910034, -0.6869156956672668, -0.6497457027435303, -0.6125756502151489, -0.5754056572914124, -0.5382356643676758, -0.5010656714439392, -0.46389564871788025, -0.4267256259918213, -0.3895556330680847, -0.35238564014434814, -0.3152156174182892, -0.2780455946922302, -0.24087560176849365, -0.2037055939435959, -0.16653558611869812, -0.12936557829380035, -0.09219557046890259, -0.05502556264400482, -0.017855554819107056, 0.019314467906951904, 0.05648446083068848, 0.09365446865558624, 0.130824476480484, 0.16799448430538177, 0.20516449213027954, 0.2423344999551773, 0.2795045077800751, 0.31667453050613403, 0.3538445234298706, 0.3910145163536072, 0.42818453907966614, 0.4653545618057251, 0.5025245547294617, 0.5396945476531982, 0.5768646001815796, 0.6140345931053162, 0.6512045860290527, 0.6883745789527893, 0.7255445718765259, 0.7627146244049072, 0.7998846173286438, 0.8370546102523804, 0.8742246627807617, 0.9113946557044983, 0.9485646486282349, 0.9857346415519714, 1.022904634475708, 1.0600746870040894, 1.0972447395324707, 1.1344146728515625, 1.1715847253799438, 1.2087547779083252, 1.245924711227417]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 13.0, 15.0, 14.0, 30.0, 44.0, 66.0, 115.0, 126.0, 227.0, 374.0, 611.0, 1029.0, 1734.0, 3559.0, 7302.0, 16019.0, 39553.0, 112505.0, 335226.0, 341060.0, 116146.0, 40555.0, 16581.0, 7438.0, 3647.0, 1852.0, 1051.0, 562.0, 384.0, 238.0, 179.0, 110.0, 64.0, 44.0, 22.0, 21.0, 14.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12422752380371094, -0.11979293823242188, -0.11535835266113281, -0.11092376708984375, -0.10648918151855469, -0.10205459594726562, -0.09762001037597656, -0.0931854248046875, -0.08875083923339844, -0.08431625366210938, -0.07988166809082031, -0.07544708251953125, -0.07101249694824219, -0.06657791137695312, -0.06214332580566406, -0.057708740234375, -0.05327415466308594, -0.048839569091796875, -0.04440498352050781, -0.03997039794921875, -0.03553581237792969, -0.031101226806640625, -0.026666641235351562, -0.0222320556640625, -0.017797470092773438, -0.013362884521484375, -0.008928298950195312, -0.00449371337890625, -5.91278076171875e-05, 0.004375457763671875, 0.008810043334960938, 0.01324462890625, 0.017679214477539062, 0.022113800048828125, 0.026548385620117188, 0.03098297119140625, 0.03541755676269531, 0.039852142333984375, 0.04428672790527344, 0.0487213134765625, 0.05315589904785156, 0.057590484619140625, 0.06202507019042969, 0.06645965576171875, 0.07089424133300781, 0.07532882690429688, 0.07976341247558594, 0.084197998046875, 0.08863258361816406, 0.09306716918945312, 0.09750175476074219, 0.10193634033203125, 0.10637092590332031, 0.11080551147460938, 0.11524009704589844, 0.1196746826171875, 0.12410926818847656, 0.12854385375976562, 0.1329784393310547, 0.13741302490234375, 0.1418476104736328, 0.14628219604492188, 0.15071678161621094, 0.1551513671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 11.0, 19.0, 17.0, 24.0, 32.0, 19.0, 37.0, 38.0, 24.0, 42.0, 47.0, 48.0, 46.0, 68.0, 62.0, 56.0, 43.0, 46.0, 28.0, 36.0, 34.0, 36.0, 30.0, 29.0, 23.0, 25.0, 17.0, 13.0, 13.0, 4.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12385940551757812, -0.11991119384765625, -0.11596298217773438, -0.1120147705078125, -0.10806655883789062, -0.10411834716796875, -0.10017013549804688, -0.096221923828125, -0.09227371215820312, -0.08832550048828125, -0.08437728881835938, -0.0804290771484375, -0.07648086547851562, -0.07253265380859375, -0.06858444213867188, -0.06463623046875, -0.060688018798828125, -0.05673980712890625, -0.052791595458984375, -0.0488433837890625, -0.044895172119140625, -0.04094696044921875, -0.036998748779296875, -0.033050537109375, -0.029102325439453125, -0.02515411376953125, -0.021205902099609375, -0.0172576904296875, -0.013309478759765625, -0.00936126708984375, -0.005413055419921875, -0.00146484375, 0.002483367919921875, 0.00643157958984375, 0.010379791259765625, 0.0143280029296875, 0.018276214599609375, 0.02222442626953125, 0.026172637939453125, 0.030120849609375, 0.034069061279296875, 0.03801727294921875, 0.041965484619140625, 0.0459136962890625, 0.049861907958984375, 0.05381011962890625, 0.057758331298828125, 0.06170654296875, 0.06565475463867188, 0.06960296630859375, 0.07355117797851562, 0.0774993896484375, 0.08144760131835938, 0.08539581298828125, 0.08934402465820312, 0.093292236328125, 0.09724044799804688, 0.10118865966796875, 0.10513687133789062, 0.1090850830078125, 0.11303329467773438, 0.11698150634765625, 0.12092971801757812, 0.1248779296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 8.0, 20.0, 30.0, 32.0, 52.0, 80.0, 109.0, 167.0, 298.0, 505.0, 1014.0, 2421.0, 7933.0, 46813.0, 751485.0, 208703.0, 20823.0, 4562.0, 1634.0, 782.0, 385.0, 235.0, 146.0, 87.0, 66.0, 50.0, 37.0, 19.0, 7.0, 13.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2997550964355469, -0.28969573974609375, -0.2796363830566406, -0.2695770263671875, -0.2595176696777344, -0.24945831298828125, -0.23939895629882812, -0.229339599609375, -0.21928024291992188, -0.20922088623046875, -0.19916152954101562, -0.1891021728515625, -0.17904281616210938, -0.16898345947265625, -0.15892410278320312, -0.14886474609375, -0.13880538940429688, -0.12874603271484375, -0.11868667602539062, -0.1086273193359375, -0.09856796264648438, -0.08850860595703125, -0.07844924926757812, -0.068389892578125, -0.058330535888671875, -0.04827117919921875, -0.038211822509765625, -0.0281524658203125, -0.018093109130859375, -0.00803375244140625, 0.002025604248046875, 0.0120849609375, 0.022144317626953125, 0.03220367431640625, 0.042263031005859375, 0.0523223876953125, 0.062381744384765625, 0.07244110107421875, 0.08250045776367188, 0.092559814453125, 0.10261917114257812, 0.11267852783203125, 0.12273788452148438, 0.1327972412109375, 0.14285659790039062, 0.15291595458984375, 0.16297531127929688, 0.17303466796875, 0.18309402465820312, 0.19315338134765625, 0.20321273803710938, 0.2132720947265625, 0.22333145141601562, 0.23339080810546875, 0.24345016479492188, 0.253509521484375, 0.2635688781738281, 0.27362823486328125, 0.2836875915527344, 0.2937469482421875, 0.3038063049316406, 0.31386566162109375, 0.3239250183105469, 0.333984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 9.0, 3.0, 6.0, 11.0, 4.0, 14.0, 17.0, 23.0, 28.0, 24.0, 47.0, 37.0, 51.0, 39.0, 71.0, 76.0, 74.0, 75.0, 69.0, 56.0, 53.0, 37.0, 32.0, 40.0, 24.0, 26.0, 15.0, 12.0, 6.0, 11.0, 4.0, 2.0, 3.0, 6.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4389190673828125, -0.420318603515625, -0.4017181396484375, -0.38311767578125, -0.3645172119140625, -0.345916748046875, -0.3273162841796875, -0.3087158203125, -0.2901153564453125, -0.271514892578125, -0.2529144287109375, -0.23431396484375, -0.2157135009765625, -0.197113037109375, -0.1785125732421875, -0.159912109375, -0.1413116455078125, -0.122711181640625, -0.1041107177734375, -0.08551025390625, -0.0669097900390625, -0.048309326171875, -0.0297088623046875, -0.0111083984375, 0.0074920654296875, 0.026092529296875, 0.0446929931640625, 0.06329345703125, 0.0818939208984375, 0.100494384765625, 0.1190948486328125, 0.1376953125, 0.1562957763671875, 0.174896240234375, 0.1934967041015625, 0.21209716796875, 0.2306976318359375, 0.249298095703125, 0.2678985595703125, 0.2864990234375, 0.3050994873046875, 0.323699951171875, 0.3423004150390625, 0.36090087890625, 0.3795013427734375, 0.398101806640625, 0.4167022705078125, 0.435302734375, 0.4539031982421875, 0.472503662109375, 0.4911041259765625, 0.50970458984375, 0.5283050537109375, 0.546905517578125, 0.5655059814453125, 0.5841064453125, 0.6027069091796875, 0.621307373046875, 0.6399078369140625, 0.65850830078125, 0.6771087646484375, 0.695709228515625, 0.7143096923828125, 0.73291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 12.0, 17.0, 20.0, 27.0, 52.0, 73.0, 107.0, 165.0, 348.0, 785.0, 1903.0, 5516.0, 19496.0, 104913.0, 758454.0, 124819.0, 22042.0, 6027.0, 2071.0, 851.0, 393.0, 182.0, 109.0, 51.0, 39.0, 26.0, 19.0, 10.0, 10.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.09893798828125, -0.09623050689697266, -0.09352302551269531, -0.09081554412841797, -0.08810806274414062, -0.08540058135986328, -0.08269309997558594, -0.0799856185913086, -0.07727813720703125, -0.0745706558227539, -0.07186317443847656, -0.06915569305419922, -0.06644821166992188, -0.06374073028564453, -0.06103324890136719, -0.058325767517089844, -0.0556182861328125, -0.052910804748535156, -0.05020332336425781, -0.04749584197998047, -0.044788360595703125, -0.04208087921142578, -0.03937339782714844, -0.036665916442871094, -0.03395843505859375, -0.031250953674316406, -0.028543472290039062, -0.02583599090576172, -0.023128509521484375, -0.02042102813720703, -0.017713546752929688, -0.015006065368652344, -0.012298583984375, -0.009591102600097656, -0.0068836212158203125, -0.004176139831542969, -0.001468658447265625, 0.0012388229370117188, 0.0039463043212890625, 0.006653785705566406, 0.00936126708984375, 0.012068748474121094, 0.014776229858398438, 0.01748371124267578, 0.020191192626953125, 0.02289867401123047, 0.025606155395507812, 0.028313636779785156, 0.0310211181640625, 0.033728599548339844, 0.03643608093261719, 0.03914356231689453, 0.041851043701171875, 0.04455852508544922, 0.04726600646972656, 0.049973487854003906, 0.05268096923828125, 0.055388450622558594, 0.05809593200683594, 0.06080341339111328, 0.06351089477539062, 0.06621837615966797, 0.06892585754394531, 0.07163333892822266, 0.0743408203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 10.0, 10.0, 13.0, 30.0, 38.0, 46.0, 63.0, 103.0, 117.0, 131.0, 89.0, 77.0, 50.0, 50.0, 38.0, 35.0, 20.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1961669921875e-05, -4.0815211832523346e-05, -3.966875374317169e-05, -3.852229565382004e-05, -3.7375837564468384e-05, -3.622937947511673e-05, -3.5082921385765076e-05, -3.393646329641342e-05, -3.279000520706177e-05, -3.1643547117710114e-05, -3.049708902835846e-05, -2.9350630939006805e-05, -2.820417284965515e-05, -2.7057714760303497e-05, -2.5911256670951843e-05, -2.476479858160019e-05, -2.3618340492248535e-05, -2.247188240289688e-05, -2.1325424313545227e-05, -2.0178966224193573e-05, -1.903250813484192e-05, -1.7886050045490265e-05, -1.673959195613861e-05, -1.5593133866786957e-05, -1.4446675777435303e-05, -1.3300217688083649e-05, -1.2153759598731995e-05, -1.100730150938034e-05, -9.860843420028687e-06, -8.714385330677032e-06, -7.567927241325378e-06, -6.421469151973724e-06, -5.27501106262207e-06, -4.128552973270416e-06, -2.982094883918762e-06, -1.8356367945671082e-06, -6.891787052154541e-07, 4.5727938413619995e-07, 1.603737473487854e-06, 2.750195562839508e-06, 3.896653652191162e-06, 5.043111741542816e-06, 6.18956983089447e-06, 7.336027920246124e-06, 8.482486009597778e-06, 9.628944098949432e-06, 1.0775402188301086e-05, 1.192186027765274e-05, 1.3068318367004395e-05, 1.4214776456356049e-05, 1.5361234545707703e-05, 1.6507692635059357e-05, 1.765415072441101e-05, 1.8800608813762665e-05, 1.994706690311432e-05, 2.1093524992465973e-05, 2.2239983081817627e-05, 2.338644117116928e-05, 2.4532899260520935e-05, 2.567935734987259e-05, 2.6825815439224243e-05, 2.7972273528575897e-05, 2.911873161792755e-05, 3.0265189707279205e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 13.0, 20.0, 19.0, 28.0, 42.0, 47.0, 96.0, 127.0, 196.0, 336.0, 552.0, 1041.0, 2103.0, 4865.0, 13082.0, 41519.0, 158794.0, 646894.0, 125512.0, 33769.0, 11069.0, 4233.0, 1841.0, 969.0, 496.0, 275.0, 171.0, 140.0, 83.0, 57.0, 41.0, 31.0, 19.0, 16.0, 7.0, 13.0, 3.0, 11.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0679931640625, -0.06595849990844727, -0.06392383575439453, -0.0618891716003418, -0.05985450744628906, -0.05781984329223633, -0.055785179138183594, -0.05375051498413086, -0.051715850830078125, -0.04968118667602539, -0.047646522521972656, -0.04561185836791992, -0.04357719421386719, -0.04154253005981445, -0.03950786590576172, -0.037473201751708984, -0.03543853759765625, -0.033403873443603516, -0.03136920928955078, -0.029334545135498047, -0.027299880981445312, -0.025265216827392578, -0.023230552673339844, -0.02119588851928711, -0.019161224365234375, -0.01712656021118164, -0.015091896057128906, -0.013057231903076172, -0.011022567749023438, -0.008987903594970703, -0.006953239440917969, -0.004918575286865234, -0.0028839111328125, -0.0008492469787597656, 0.0011854171752929688, 0.003220081329345703, 0.0052547454833984375, 0.007289409637451172, 0.009324073791503906, 0.01135873794555664, 0.013393402099609375, 0.01542806625366211, 0.017462730407714844, 0.019497394561767578, 0.021532058715820312, 0.023566722869873047, 0.02560138702392578, 0.027636051177978516, 0.02967071533203125, 0.031705379486083984, 0.03374004364013672, 0.03577470779418945, 0.03780937194824219, 0.03984403610229492, 0.041878700256347656, 0.04391336441040039, 0.045948028564453125, 0.04798269271850586, 0.050017356872558594, 0.05205202102661133, 0.05408668518066406, 0.0561213493347168, 0.05815601348876953, 0.060190677642822266, 0.062225341796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 12.0, 14.0, 18.0, 28.0, 19.0, 24.0, 27.0, 61.0, 51.0, 83.0, 84.0, 90.0, 99.0, 85.0, 72.0, 49.0, 40.0, 26.0, 25.0, 16.0, 13.0, 10.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06919288635253906, -0.06654739379882812, -0.06390190124511719, -0.06125640869140625, -0.05861091613769531, -0.055965423583984375, -0.05331993103027344, -0.0506744384765625, -0.04802894592285156, -0.045383453369140625, -0.04273796081542969, -0.04009246826171875, -0.03744697570800781, -0.034801483154296875, -0.03215599060058594, -0.029510498046875, -0.026865005493164062, -0.024219512939453125, -0.021574020385742188, -0.01892852783203125, -0.016283035278320312, -0.013637542724609375, -0.010992050170898438, -0.0083465576171875, -0.0057010650634765625, -0.003055572509765625, -0.0004100799560546875, 0.00223541259765625, 0.0048809051513671875, 0.007526397705078125, 0.010171890258789062, 0.0128173828125, 0.015462875366210938, 0.018108367919921875, 0.020753860473632812, 0.02339935302734375, 0.026044845581054688, 0.028690338134765625, 0.03133583068847656, 0.0339813232421875, 0.03662681579589844, 0.039272308349609375, 0.04191780090332031, 0.04456329345703125, 0.04720878601074219, 0.049854278564453125, 0.05249977111816406, 0.055145263671875, 0.05779075622558594, 0.060436248779296875, 0.06308174133300781, 0.06572723388671875, 0.06837272644042969, 0.07101821899414062, 0.07366371154785156, 0.0763092041015625, 0.07895469665527344, 0.08160018920898438, 0.08424568176269531, 0.08689117431640625, 0.08953666687011719, 0.09218215942382812, 0.09482765197753906, 0.09747314453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 29.0, 129.0, 453.0, 211.0, 88.0, 30.0, 15.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8410844802856445, -2.726147413253784, -2.611210584640503, -2.4962735176086426, -2.3813366889953613, -2.266399621963501, -2.1514627933502197, -2.0365257263183594, -1.9215888977050781, -1.8066519498825073, -1.6917150020599365, -1.5767780542373657, -1.461841106414795, -1.3469040393829346, -1.2319672107696533, -1.117030143737793, -1.0020931959152222, -0.8871562480926514, -0.7722193002700806, -0.6572823524475098, -0.542345404624939, -0.4274083971977234, -0.3124714493751526, -0.1975345015525818, -0.08259755373001099, 0.03233940154314041, 0.1472763568162918, 0.2622133195400238, 0.3771502673625946, 0.4920872449874878, 0.6070241928100586, 0.7219611406326294, 0.8368980884552002, 0.951835036277771, 1.0667719841003418, 1.1817089319229126, 1.2966458797454834, 1.4115829467773438, 1.526519775390625, 1.6414568424224854, 1.7563936710357666, 1.8713306188583374, 1.9862675666809082, 2.1012046337127686, 2.21614146232605, 2.33107852935791, 2.4460153579711914, 2.5609524250030518, 2.675889492034912, 2.7908265590667725, 2.9057633876800537, 3.020700454711914, 3.1356372833251953, 3.2505743503570557, 3.365511178970337, 3.4804482460021973, 3.5953850746154785, 3.710322141647339, 3.82525897026062, 3.9401960372924805, 4.055132865905762, 4.170069694519043, 4.285006999969482, 4.399943828582764, 4.514880657196045]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 11.0, 6.0, 4.0, 9.0, 11.0, 14.0, 16.0, 13.0, 15.0, 20.0, 19.0, 24.0, 23.0, 27.0, 54.0, 59.0, 77.0, 121.0, 99.0, 72.0, 51.0, 33.0, 29.0, 27.0, 18.0, 28.0, 21.0, 23.0, 10.0, 5.0, 13.0, 7.0, 8.0, 9.0, 4.0, 7.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8421064615249634, -1.7893468141555786, -1.7365871667861938, -1.683827519416809, -1.6310678720474243, -1.5783082246780396, -1.5255485773086548, -1.47278892993927, -1.4200292825698853, -1.3672696352005005, -1.3145099878311157, -1.261750340461731, -1.2089906930923462, -1.1562310457229614, -1.1034713983535767, -1.050711750984192, -0.9979521036148071, -0.9451924562454224, -0.8924328088760376, -0.8396731615066528, -0.7869135141372681, -0.7341538667678833, -0.6813942193984985, -0.6286345720291138, -0.575874924659729, -0.5231152772903442, -0.4703556299209595, -0.4175959825515747, -0.36483633518218994, -0.3120766878128052, -0.2593170404434204, -0.20655739307403564, -0.15379774570465088, -0.10103809833526611, -0.04827845096588135, 0.004481196403503418, 0.057240843772888184, 0.11000049114227295, 0.16276013851165771, 0.21551978588104248, 0.26827943325042725, 0.321039080619812, 0.3737987279891968, 0.42655837535858154, 0.4793180227279663, 0.5320776700973511, 0.5848373174667358, 0.6375969648361206, 0.6903566122055054, 0.7431162595748901, 0.7958759069442749, 0.8486355543136597, 0.9013952016830444, 0.9541548490524292, 1.006914496421814, 1.0596741437911987, 1.1124337911605835, 1.1651934385299683, 1.217953085899353, 1.2707127332687378, 1.3234723806381226, 1.3762320280075073, 1.428991675376892, 1.4817513227462769, 1.5345109701156616]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 14.0, 21.0, 34.0, 64.0, 80.0, 135.0, 246.0, 416.0, 784.0, 1401.0, 2919.0, 6328.0, 15285.0, 39835.0, 121174.0, 436136.0, 1440325.0, 1486981.0, 447735.0, 124885.0, 40458.0, 15601.0, 6734.0, 3225.0, 1526.0, 842.0, 433.0, 273.0, 140.0, 95.0, 67.0, 38.0, 20.0, 7.0, 10.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15314483642578125, -0.1474761962890625, -0.14180755615234375, -0.136138916015625, -0.13047027587890625, -0.1248016357421875, -0.11913299560546875, -0.11346435546875, -0.10779571533203125, -0.1021270751953125, -0.09645843505859375, -0.090789794921875, -0.08512115478515625, -0.0794525146484375, -0.07378387451171875, -0.068115234375, -0.06244659423828125, -0.0567779541015625, -0.05110931396484375, -0.045440673828125, -0.03977203369140625, -0.0341033935546875, -0.02843475341796875, -0.02276611328125, -0.01709747314453125, -0.0114288330078125, -0.00576019287109375, -9.1552734375e-05, 0.00557708740234375, 0.0112457275390625, 0.01691436767578125, 0.0225830078125, 0.02825164794921875, 0.0339202880859375, 0.03958892822265625, 0.045257568359375, 0.05092620849609375, 0.0565948486328125, 0.06226348876953125, 0.06793212890625, 0.07360076904296875, 0.0792694091796875, 0.08493804931640625, 0.090606689453125, 0.09627532958984375, 0.1019439697265625, 0.10761260986328125, 0.11328125, 0.11894989013671875, 0.1246185302734375, 0.13028717041015625, 0.135955810546875, 0.14162445068359375, 0.1472930908203125, 0.15296173095703125, 0.15863037109375, 0.16429901123046875, 0.1699676513671875, 0.17563629150390625, 0.181304931640625, 0.18697357177734375, 0.1926422119140625, 0.19831085205078125, 0.2039794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 5.0, 9.0, 8.0, 9.0, 11.0, 12.0, 14.0, 10.0, 20.0, 20.0, 28.0, 25.0, 35.0, 45.0, 30.0, 37.0, 35.0, 40.0, 38.0, 49.0, 49.0, 50.0, 38.0, 43.0, 36.0, 28.0, 35.0, 38.0, 20.0, 27.0, 20.0, 30.0, 16.0, 16.0, 13.0, 11.0, 13.0, 10.0, 5.0, 5.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09203910827636719, -0.08898544311523438, -0.08593177795410156, -0.08287811279296875, -0.07982444763183594, -0.07677078247070312, -0.07371711730957031, -0.0706634521484375, -0.06760978698730469, -0.06455612182617188, -0.06150245666503906, -0.05844879150390625, -0.05539512634277344, -0.052341461181640625, -0.04928779602050781, -0.046234130859375, -0.04318046569824219, -0.040126800537109375, -0.03707313537597656, -0.03401947021484375, -0.030965805053710938, -0.027912139892578125, -0.024858474731445312, -0.0218048095703125, -0.018751144409179688, -0.015697479248046875, -0.012643814086914062, -0.00959014892578125, -0.0065364837646484375, -0.003482818603515625, -0.0004291534423828125, 0.00262451171875, 0.0056781768798828125, 0.008731842041015625, 0.011785507202148438, 0.01483917236328125, 0.017892837524414062, 0.020946502685546875, 0.024000167846679688, 0.0270538330078125, 0.030107498168945312, 0.033161163330078125, 0.03621482849121094, 0.03926849365234375, 0.04232215881347656, 0.045375823974609375, 0.04842948913574219, 0.051483154296875, 0.05453681945800781, 0.057590484619140625, 0.06064414978027344, 0.06369781494140625, 0.06675148010253906, 0.06980514526367188, 0.07285881042480469, 0.0759124755859375, 0.07896614074707031, 0.08201980590820312, 0.08507347106933594, 0.08812713623046875, 0.09118080139160156, 0.09423446655273438, 0.09728813171386719, 0.100341796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 8.0, 14.0, 25.0, 33.0, 40.0, 78.0, 143.0, 270.0, 572.0, 1414.0, 6135.0, 188943.0, 3957168.0, 34109.0, 3303.0, 998.0, 435.0, 230.0, 132.0, 81.0, 47.0, 36.0, 12.0, 13.0, 9.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.233551025390625, -1.20050048828125, -1.167449951171875, -1.1343994140625, -1.101348876953125, -1.06829833984375, -1.035247802734375, -1.002197265625, -0.969146728515625, -0.93609619140625, -0.903045654296875, -0.8699951171875, -0.836944580078125, -0.80389404296875, -0.770843505859375, -0.73779296875, -0.704742431640625, -0.67169189453125, -0.638641357421875, -0.6055908203125, -0.572540283203125, -0.53948974609375, -0.506439208984375, -0.473388671875, -0.440338134765625, -0.40728759765625, -0.374237060546875, -0.3411865234375, -0.308135986328125, -0.27508544921875, -0.242034912109375, -0.208984375, -0.175933837890625, -0.14288330078125, -0.109832763671875, -0.0767822265625, -0.043731689453125, -0.01068115234375, 0.022369384765625, 0.055419921875, 0.088470458984375, 0.12152099609375, 0.154571533203125, 0.1876220703125, 0.220672607421875, 0.25372314453125, 0.286773681640625, 0.31982421875, 0.352874755859375, 0.38592529296875, 0.418975830078125, 0.4520263671875, 0.485076904296875, 0.51812744140625, 0.551177978515625, 0.584228515625, 0.617279052734375, 0.65032958984375, 0.683380126953125, 0.7164306640625, 0.749481201171875, 0.78253173828125, 0.815582275390625, 0.8486328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 3.0, 12.0, 12.0, 24.0, 25.0, 21.0, 36.0, 56.0, 70.0, 107.0, 147.0, 175.0, 217.0, 301.0, 382.0, 503.0, 485.0, 347.0, 272.0, 242.0, 171.0, 130.0, 80.0, 71.0, 40.0, 39.0, 40.0, 16.0, 5.0, 6.0, 5.0, 8.0, 3.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.29645538330078125, -0.2845611572265625, -0.27266693115234375, -0.260772705078125, -0.24887847900390625, -0.2369842529296875, -0.22509002685546875, -0.21319580078125, -0.20130157470703125, -0.1894073486328125, -0.17751312255859375, -0.165618896484375, -0.15372467041015625, -0.1418304443359375, -0.12993621826171875, -0.1180419921875, -0.10614776611328125, -0.0942535400390625, -0.08235931396484375, -0.070465087890625, -0.05857086181640625, -0.0466766357421875, -0.03478240966796875, -0.02288818359375, -0.01099395751953125, 0.0009002685546875, 0.01279449462890625, 0.024688720703125, 0.03658294677734375, 0.0484771728515625, 0.06037139892578125, 0.072265625, 0.08415985107421875, 0.0960540771484375, 0.10794830322265625, 0.119842529296875, 0.13173675537109375, 0.1436309814453125, 0.15552520751953125, 0.16741943359375, 0.17931365966796875, 0.1912078857421875, 0.20310211181640625, 0.214996337890625, 0.22689056396484375, 0.2387847900390625, 0.25067901611328125, 0.2625732421875, 0.27446746826171875, 0.2863616943359375, 0.29825592041015625, 0.310150146484375, 0.32204437255859375, 0.3339385986328125, 0.34583282470703125, 0.35772705078125, 0.36962127685546875, 0.3815155029296875, 0.39340972900390625, 0.405303955078125, 0.41719818115234375, 0.4290924072265625, 0.44098663330078125, 0.452880859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 10.0, 12.0, 24.0, 52.0, 103.0, 202.0, 258.0, 167.0, 86.0, 36.0, 21.0, 14.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-11.689427375793457, -11.461386680603027, -11.233345031738281, -11.005304336547852, -10.777262687683105, -10.549221992492676, -10.32118034362793, -10.0931396484375, -9.865097999572754, -9.637057304382324, -9.409015655517578, -9.180974960327148, -8.952933311462402, -8.724892616271973, -8.496850967407227, -8.268810272216797, -8.040769577026367, -7.812728404998779, -7.584687232971191, -7.3566460609436035, -7.128604888916016, -6.900563716888428, -6.67252254486084, -6.44448184967041, -6.216440200805664, -5.988399028778076, -5.760357856750488, -5.5323166847229, -5.3042755126953125, -5.076234340667725, -4.848193168640137, -4.620152473449707, -4.392110347747803, -4.164069175720215, -3.936028003692627, -3.707986831665039, -3.479945659637451, -3.2519044876098633, -3.0238635540008545, -2.7958223819732666, -2.5677812099456787, -2.339740037918091, -2.111698865890503, -1.8836578130722046, -1.6556166410446167, -1.4275754690170288, -1.1995344161987305, -0.9714932441711426, -0.7434520721435547, -0.5154109001159668, -0.2873697876930237, -0.059328675270080566, 0.16871249675750732, 0.3967536687850952, 0.6247947216033936, 0.8528358936309814, 1.0808770656585693, 1.3089182376861572, 1.5369594097137451, 1.7650004625320435, 1.9930416345596313, 2.2210826873779297, 2.4491238594055176, 2.6771650314331055, 2.9052062034606934]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 18.0, 15.0, 23.0, 30.0, 35.0, 23.0, 33.0, 25.0, 44.0, 28.0, 47.0, 51.0, 52.0, 65.0, 51.0, 52.0, 40.0, 43.0, 39.0, 17.0, 35.0, 23.0, 30.0, 17.0, 18.0, 17.0, 14.0, 5.0, 9.0, 7.0, 10.0, 8.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.046013832092285, -1.9810378551483154, -1.9160618782043457, -1.8510857820510864, -1.7861098051071167, -1.721133828163147, -1.6561577320098877, -1.591181755065918, -1.5262057781219482, -1.4612298011779785, -1.3962538242340088, -1.3312777280807495, -1.2663017511367798, -1.20132577419281, -1.1363496780395508, -1.071373701095581, -1.0063977241516113, -0.9414217472076416, -0.8764457106590271, -0.8114696741104126, -0.7464936971664429, -0.6815177202224731, -0.6165416836738586, -0.5515656471252441, -0.4865896701812744, -0.4216136634349823, -0.3566376566886902, -0.29166164994239807, -0.22668564319610596, -0.16170963644981384, -0.09673362970352173, -0.031757622957229614, 0.0332183837890625, 0.09819439053535461, 0.16317039728164673, 0.22814640402793884, 0.29312241077423096, 0.35809841752052307, 0.4230744242668152, 0.4880504310131073, 0.5530264377593994, 0.6180024147033691, 0.6829784512519836, 0.7479544878005981, 0.8129304647445679, 0.8779064416885376, 0.9428824782371521, 1.0078585147857666, 1.0728344917297363, 1.137810468673706, 1.2027864456176758, 1.267762541770935, 1.3327385187149048, 1.3977144956588745, 1.4626905918121338, 1.5276665687561035, 1.5926425457000732, 1.657618522644043, 1.7225944995880127, 1.787570595741272, 1.8525465726852417, 1.9175225496292114, 1.9824986457824707, 2.0474746227264404, 2.11245059967041]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 7.0, 5.0, 10.0, 5.0, 10.0, 17.0, 31.0, 47.0, 74.0, 132.0, 234.0, 453.0, 857.0, 1784.0, 4133.0, 11067.0, 34835.0, 145195.0, 606868.0, 180520.0, 41037.0, 12549.0, 4658.0, 2014.0, 910.0, 496.0, 255.0, 148.0, 79.0, 55.0, 29.0, 24.0, 10.0, 6.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139404296875, -0.13262557983398438, -0.12584686279296875, -0.11906814575195312, -0.1122894287109375, -0.10551071166992188, -0.09873199462890625, -0.09195327758789062, -0.085174560546875, -0.07839584350585938, -0.07161712646484375, -0.06483840942382812, -0.0580596923828125, -0.051280975341796875, -0.04450225830078125, -0.037723541259765625, -0.03094482421875, -0.024166107177734375, -0.01738739013671875, -0.010608673095703125, -0.0038299560546875, 0.002948760986328125, 0.00972747802734375, 0.016506195068359375, 0.023284912109375, 0.030063629150390625, 0.03684234619140625, 0.043621063232421875, 0.0503997802734375, 0.057178497314453125, 0.06395721435546875, 0.07073593139648438, 0.0775146484375, 0.08429336547851562, 0.09107208251953125, 0.09785079956054688, 0.1046295166015625, 0.11140823364257812, 0.11818695068359375, 0.12496566772460938, 0.131744384765625, 0.13852310180664062, 0.14530181884765625, 0.15208053588867188, 0.1588592529296875, 0.16563796997070312, 0.17241668701171875, 0.17919540405273438, 0.18597412109375, 0.19275283813476562, 0.19953155517578125, 0.20631027221679688, 0.2130889892578125, 0.21986770629882812, 0.22664642333984375, 0.23342514038085938, 0.240203857421875, 0.24698257446289062, 0.25376129150390625, 0.2605400085449219, 0.2673187255859375, 0.2740974426269531, 0.28087615966796875, 0.2876548767089844, 0.29443359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 3.0, 12.0, 12.0, 22.0, 21.0, 21.0, 23.0, 33.0, 33.0, 49.0, 50.0, 57.0, 51.0, 59.0, 63.0, 67.0, 60.0, 61.0, 40.0, 39.0, 33.0, 30.0, 23.0, 18.0, 24.0, 20.0, 13.0, 13.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2159423828125, -0.20929527282714844, -0.20264816284179688, -0.1960010528564453, -0.18935394287109375, -0.1827068328857422, -0.17605972290039062, -0.16941261291503906, -0.1627655029296875, -0.15611839294433594, -0.14947128295898438, -0.1428241729736328, -0.13617706298828125, -0.1295299530029297, -0.12288284301757812, -0.11623573303222656, -0.109588623046875, -0.10294151306152344, -0.09629440307617188, -0.08964729309082031, -0.08300018310546875, -0.07635307312011719, -0.06970596313476562, -0.06305885314941406, -0.0564117431640625, -0.04976463317871094, -0.043117523193359375, -0.03647041320800781, -0.02982330322265625, -0.023176193237304688, -0.016529083251953125, -0.009881973266601562, -0.00323486328125, 0.0034122467041015625, 0.010059356689453125, 0.016706466674804688, 0.02335357666015625, 0.030000686645507812, 0.036647796630859375, 0.04329490661621094, 0.0499420166015625, 0.05658912658691406, 0.06323623657226562, 0.06988334655761719, 0.07653045654296875, 0.08317756652832031, 0.08982467651367188, 0.09647178649902344, 0.103118896484375, 0.10976600646972656, 0.11641311645507812, 0.12306022644042969, 0.12970733642578125, 0.1363544464111328, 0.14300155639648438, 0.14964866638183594, 0.1562957763671875, 0.16294288635253906, 0.16958999633789062, 0.1762371063232422, 0.18288421630859375, 0.1895313262939453, 0.19617843627929688, 0.20282554626464844, 0.20947265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 10.0, 10.0, 18.0, 27.0, 30.0, 30.0, 43.0, 60.0, 110.0, 146.0, 260.0, 483.0, 979.0, 2443.0, 7386.0, 32771.0, 664987.0, 297607.0, 29973.0, 6668.0, 2313.0, 995.0, 419.0, 268.0, 160.0, 92.0, 54.0, 47.0, 43.0, 30.0, 26.0, 13.0, 9.0, 11.0, 9.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.277587890625, -0.2691688537597656, -0.26074981689453125, -0.2523307800292969, -0.2439117431640625, -0.23549270629882812, -0.22707366943359375, -0.21865463256835938, -0.210235595703125, -0.20181655883789062, -0.19339752197265625, -0.18497848510742188, -0.1765594482421875, -0.16814041137695312, -0.15972137451171875, -0.15130233764648438, -0.14288330078125, -0.13446426391601562, -0.12604522705078125, -0.11762619018554688, -0.1092071533203125, -0.10078811645507812, -0.09236907958984375, -0.08395004272460938, -0.075531005859375, -0.06711196899414062, -0.05869293212890625, -0.050273895263671875, -0.0418548583984375, -0.033435821533203125, -0.02501678466796875, -0.016597747802734375, -0.0081787109375, 0.000240325927734375, 0.00865936279296875, 0.017078399658203125, 0.0254974365234375, 0.033916473388671875, 0.04233551025390625, 0.050754547119140625, 0.059173583984375, 0.06759262084960938, 0.07601165771484375, 0.08443069458007812, 0.0928497314453125, 0.10126876831054688, 0.10968780517578125, 0.11810684204101562, 0.12652587890625, 0.13494491577148438, 0.14336395263671875, 0.15178298950195312, 0.1602020263671875, 0.16862106323242188, 0.17704010009765625, 0.18545913696289062, 0.193878173828125, 0.20229721069335938, 0.21071624755859375, 0.21913528442382812, 0.2275543212890625, 0.23597335815429688, 0.24439239501953125, 0.2528114318847656, 0.26123046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 16.0, 31.0, 25.0, 37.0, 33.0, 35.0, 61.0, 70.0, 70.0, 76.0, 76.0, 73.0, 61.0, 45.0, 36.0, 30.0, 25.0, 19.0, 22.0, 12.0, 5.0, 12.0, 9.0, 11.0, 7.0, 5.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.83251953125, -0.8089370727539062, -0.7853546142578125, -0.7617721557617188, -0.738189697265625, -0.7146072387695312, -0.6910247802734375, -0.6674423217773438, -0.64385986328125, -0.6202774047851562, -0.5966949462890625, -0.5731124877929688, -0.549530029296875, -0.5259475708007812, -0.5023651123046875, -0.47878265380859375, -0.4552001953125, -0.43161773681640625, -0.4080352783203125, -0.38445281982421875, -0.360870361328125, -0.33728790283203125, -0.3137054443359375, -0.29012298583984375, -0.26654052734375, -0.24295806884765625, -0.2193756103515625, -0.19579315185546875, -0.172210693359375, -0.14862823486328125, -0.1250457763671875, -0.10146331787109375, -0.077880859375, -0.05429840087890625, -0.0307159423828125, -0.00713348388671875, 0.016448974609375, 0.04003143310546875, 0.0636138916015625, 0.08719635009765625, 0.11077880859375, 0.13436126708984375, 0.1579437255859375, 0.18152618408203125, 0.205108642578125, 0.22869110107421875, 0.2522735595703125, 0.27585601806640625, 0.2994384765625, 0.32302093505859375, 0.3466033935546875, 0.37018585205078125, 0.393768310546875, 0.41735076904296875, 0.4409332275390625, 0.46451568603515625, 0.48809814453125, 0.5116806030273438, 0.5352630615234375, 0.5588455200195312, 0.582427978515625, 0.6060104370117188, 0.6295928955078125, 0.6531753540039062, 0.6767578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 13.0, 7.0, 8.0, 9.0, 9.0, 28.0, 29.0, 53.0, 61.0, 93.0, 159.0, 228.0, 388.0, 766.0, 1595.0, 3891.0, 11011.0, 43135.0, 776931.0, 170505.0, 26236.0, 7699.0, 2879.0, 1216.0, 625.0, 361.0, 191.0, 119.0, 78.0, 57.0, 36.0, 26.0, 28.0, 10.0, 13.0, 10.0, 11.0, 6.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05914306640625, -0.0573420524597168, -0.055541038513183594, -0.05374002456665039, -0.05193901062011719, -0.050137996673583984, -0.04833698272705078, -0.04653596878051758, -0.044734954833984375, -0.04293394088745117, -0.04113292694091797, -0.039331912994384766, -0.03753089904785156, -0.03572988510131836, -0.033928871154785156, -0.03212785720825195, -0.03032684326171875, -0.028525829315185547, -0.026724815368652344, -0.02492380142211914, -0.023122787475585938, -0.021321773529052734, -0.01952075958251953, -0.017719745635986328, -0.015918731689453125, -0.014117717742919922, -0.012316703796386719, -0.010515689849853516, -0.008714675903320312, -0.006913661956787109, -0.005112648010253906, -0.003311634063720703, -0.0015106201171875, 0.0002903938293457031, 0.0020914077758789062, 0.0038924217224121094, 0.0056934356689453125, 0.007494449615478516, 0.009295463562011719, 0.011096477508544922, 0.012897491455078125, 0.014698505401611328, 0.01649951934814453, 0.018300533294677734, 0.020101547241210938, 0.02190256118774414, 0.023703575134277344, 0.025504589080810547, 0.02730560302734375, 0.029106616973876953, 0.030907630920410156, 0.03270864486694336, 0.03450965881347656, 0.036310672760009766, 0.03811168670654297, 0.03991270065307617, 0.041713714599609375, 0.04351472854614258, 0.04531574249267578, 0.047116756439208984, 0.04891777038574219, 0.05071878433227539, 0.052519798278808594, 0.0543208122253418, 0.056121826171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 8.0, 13.0, 10.0, 22.0, 21.0, 19.0, 33.0, 24.0, 37.0, 64.0, 76.0, 88.0, 79.0, 74.0, 84.0, 61.0, 52.0, 44.0, 28.0, 19.0, 25.0, 20.0, 15.0, 8.0, 9.0, 3.0, 9.0, 3.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.5277957320213318e-05, -2.4568289518356323e-05, -2.385862171649933e-05, -2.3148953914642334e-05, -2.243928611278534e-05, -2.1729618310928345e-05, -2.101995050907135e-05, -2.0310282707214355e-05, -1.960061490535736e-05, -1.8890947103500366e-05, -1.818127930164337e-05, -1.7471611499786377e-05, -1.6761943697929382e-05, -1.6052275896072388e-05, -1.5342608094215393e-05, -1.4632940292358398e-05, -1.3923272490501404e-05, -1.321360468864441e-05, -1.2503936886787415e-05, -1.179426908493042e-05, -1.1084601283073425e-05, -1.037493348121643e-05, -9.665265679359436e-06, -8.955597877502441e-06, -8.245930075645447e-06, -7.536262273788452e-06, -6.8265944719314575e-06, -6.116926670074463e-06, -5.407258868217468e-06, -4.697591066360474e-06, -3.987923264503479e-06, -3.2782554626464844e-06, -2.5685876607894897e-06, -1.8589198589324951e-06, -1.1492520570755005e-06, -4.3958425521850586e-07, 2.7008354663848877e-07, 9.797513484954834e-07, 1.689419150352478e-06, 2.3990869522094727e-06, 3.1087547540664673e-06, 3.818422555923462e-06, 4.5280903577804565e-06, 5.237758159637451e-06, 5.947425961494446e-06, 6.6570937633514404e-06, 7.366761565208435e-06, 8.07642936706543e-06, 8.786097168922424e-06, 9.495764970779419e-06, 1.0205432772636414e-05, 1.0915100574493408e-05, 1.1624768376350403e-05, 1.2334436178207397e-05, 1.3044103980064392e-05, 1.3753771781921387e-05, 1.4463439583778381e-05, 1.5173107385635376e-05, 1.588277518749237e-05, 1.6592442989349365e-05, 1.730211079120636e-05, 1.8011778593063354e-05, 1.872144639492035e-05, 1.9431114196777344e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 9.0, 5.0, 12.0, 17.0, 24.0, 30.0, 56.0, 95.0, 183.0, 324.0, 684.0, 1595.0, 4056.0, 12376.0, 50714.0, 803435.0, 139194.0, 24168.0, 6936.0, 2549.0, 1032.0, 465.0, 232.0, 136.0, 66.0, 59.0, 26.0, 20.0, 15.0, 5.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06637287139892578, -0.06414222717285156, -0.061911582946777344, -0.059680938720703125, -0.057450294494628906, -0.05521965026855469, -0.05298900604248047, -0.05075836181640625, -0.04852771759033203, -0.04629707336425781, -0.044066429138183594, -0.041835784912109375, -0.039605140686035156, -0.03737449645996094, -0.03514385223388672, -0.0329132080078125, -0.03068256378173828, -0.028451919555664062, -0.026221275329589844, -0.023990631103515625, -0.021759986877441406, -0.019529342651367188, -0.01729869842529297, -0.01506805419921875, -0.012837409973144531, -0.010606765747070312, -0.008376121520996094, -0.006145477294921875, -0.003914833068847656, -0.0016841888427734375, 0.0005464553833007812, 0.002777099609375, 0.005007743835449219, 0.0072383880615234375, 0.009469032287597656, 0.011699676513671875, 0.013930320739746094, 0.016160964965820312, 0.01839160919189453, 0.02062225341796875, 0.02285289764404297, 0.025083541870117188, 0.027314186096191406, 0.029544830322265625, 0.031775474548339844, 0.03400611877441406, 0.03623676300048828, 0.0384674072265625, 0.04069805145263672, 0.04292869567871094, 0.045159339904785156, 0.047389984130859375, 0.049620628356933594, 0.05185127258300781, 0.05408191680908203, 0.05631256103515625, 0.05854320526123047, 0.06077384948730469, 0.0630044937133789, 0.06523513793945312, 0.06746578216552734, 0.06969642639160156, 0.07192707061767578, 0.07415771484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 19.0, 11.0, 17.0, 25.0, 20.0, 34.0, 57.0, 71.0, 108.0, 168.0, 161.0, 77.0, 68.0, 41.0, 34.0, 17.0, 19.0, 11.0, 10.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13667869567871094, -0.13261032104492188, -0.1285419464111328, -0.12447357177734375, -0.12040519714355469, -0.11633682250976562, -0.11226844787597656, -0.1082000732421875, -0.10413169860839844, -0.10006332397460938, -0.09599494934082031, -0.09192657470703125, -0.08785820007324219, -0.08378982543945312, -0.07972145080566406, -0.075653076171875, -0.07158470153808594, -0.06751632690429688, -0.06344795227050781, -0.05937957763671875, -0.05531120300292969, -0.051242828369140625, -0.04717445373535156, -0.0431060791015625, -0.03903770446777344, -0.034969329833984375, -0.030900955200195312, -0.02683258056640625, -0.022764205932617188, -0.018695831298828125, -0.014627456665039062, -0.01055908203125, -0.0064907073974609375, -0.002422332763671875, 0.0016460418701171875, 0.00571441650390625, 0.009782791137695312, 0.013851165771484375, 0.017919540405273438, 0.0219879150390625, 0.026056289672851562, 0.030124664306640625, 0.03419303894042969, 0.03826141357421875, 0.04232978820800781, 0.046398162841796875, 0.05046653747558594, 0.054534912109375, 0.05860328674316406, 0.06267166137695312, 0.06674003601074219, 0.07080841064453125, 0.07487678527832031, 0.07894515991210938, 0.08301353454589844, 0.0870819091796875, 0.09115028381347656, 0.09521865844726562, 0.09928703308105469, 0.10335540771484375, 0.10742378234863281, 0.11149215698242188, 0.11556053161621094, 0.11962890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 12.0, 22.0, 83.0, 414.0, 313.0, 68.0, 37.0, 20.0, 9.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763082981109619, -2.6244237422943115, -2.485764741897583, -2.3471055030822754, -2.208446502685547, -2.0697872638702393, -1.9311280250549316, -1.7924689054489136, -1.6538097858428955, -1.5151506662368774, -1.3764915466308594, -1.2378323078155518, -1.0991731882095337, -0.9605140686035156, -0.8218548893928528, -0.6831957101821899, -0.5445365905761719, -0.4058774411678314, -0.26721829175949097, -0.1285591423511505, 0.010100007057189941, 0.148759126663208, 0.28741830587387085, 0.4260774850845337, 0.5647366046905518, 0.7033957242965698, 0.8420549035072327, 0.9807140827178955, 1.1193732023239136, 1.2580323219299316, 1.3966915607452393, 1.5353506803512573, 1.6740102767944336, 1.8126693964004517, 1.9513285160064697, 2.0899877548217773, 2.228646755218506, 2.3673059940338135, 2.505965232849121, 2.6446242332458496, 2.7832834720611572, 2.921942710876465, 3.0606017112731934, 3.199260950088501, 3.3379201889038086, 3.476579189300537, 3.6152384281158447, 3.7538976669311523, 3.892556667327881, 4.031215667724609, 4.169875144958496, 4.308534145355225, 4.447193145751953, 4.58585262298584, 4.724511623382568, 4.863170623779297, 5.001830101013184, 5.140489101409912, 5.279148578643799, 5.417807579040527, 5.556466579437256, 5.695125579833984, 5.833785057067871, 5.9724440574646, 6.111103057861328]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 4.0, 10.0, 10.0, 10.0, 7.0, 15.0, 14.0, 13.0, 16.0, 30.0, 41.0, 92.0, 175.0, 190.0, 82.0, 43.0, 35.0, 34.0, 21.0, 22.0, 23.0, 15.0, 21.0, 11.0, 10.0, 8.0, 14.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.523611545562744, -2.449512004852295, -2.375412702560425, -2.3013131618499756, -2.2272136211395264, -2.153114080429077, -2.079014778137207, -2.004915237426758, -1.9308156967163086, -1.856716275215149, -1.7826167345046997, -1.70851731300354, -1.6344177722930908, -1.5603183507919312, -1.4862189292907715, -1.4121193885803223, -1.3380199670791626, -1.263920545578003, -1.1898210048675537, -1.115721583366394, -1.0416220426559448, -0.9675226211547852, -0.8934231400489807, -0.8193236589431763, -0.7452241778373718, -0.6711246967315674, -0.5970252156257629, -0.5229257345199585, -0.44882628321647644, -0.374726802110672, -0.30062735080718994, -0.2265278697013855, -0.15242838859558105, -0.07832891494035721, -0.004229441285133362, 0.06987002491950989, 0.14396950602531433, 0.21806898713111877, 0.29216843843460083, 0.3662679195404053, 0.4403674006462097, 0.5144668817520142, 0.5885663628578186, 0.662665843963623, 0.7367652654647827, 0.8108648061752319, 0.8849642276763916, 0.959063708782196, 1.0331631898880005, 1.1072626113891602, 1.1813621520996094, 1.255461573600769, 1.3295611143112183, 1.403660535812378, 1.4777600765228271, 1.5518594980239868, 1.6259589195251465, 1.7000583410263062, 1.7741578817367554, 1.848257303237915, 1.9223568439483643, 1.996456265449524, 2.0705556869506836, 2.144655227661133, 2.218754768371582]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 2.0, 17.0, 7.0, 12.0, 20.0, 14.0, 8.0, 28.0, 28.0, 44.0, 32.0, 45.0, 50.0, 121.0, 172.0, 90.0, 46.0, 41.0, 37.0, 35.0, 27.0, 17.0, 18.0, 11.0, 12.0, 14.0, 7.0, 11.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2016143798828125, -0.194732666015625, -0.1878509521484375, -0.18096923828125, -0.1740875244140625, -0.167205810546875, -0.1603240966796875, -0.1534423828125, -0.1465606689453125, -0.139678955078125, -0.1327972412109375, -0.12591552734375, -0.1190338134765625, -0.112152099609375, -0.1052703857421875, -0.098388671875, -0.0915069580078125, -0.084625244140625, -0.0777435302734375, -0.07086181640625, -0.0639801025390625, -0.057098388671875, -0.0502166748046875, -0.0433349609375, -0.0364532470703125, -0.029571533203125, -0.0226898193359375, -0.01580810546875, -0.0089263916015625, -0.002044677734375, 0.0048370361328125, 0.01171875, 0.0186004638671875, 0.025482177734375, 0.0323638916015625, 0.03924560546875, 0.0461273193359375, 0.053009033203125, 0.0598907470703125, 0.0667724609375, 0.0736541748046875, 0.080535888671875, 0.0874176025390625, 0.09429931640625, 0.1011810302734375, 0.108062744140625, 0.1149444580078125, 0.121826171875, 0.1287078857421875, 0.135589599609375, 0.1424713134765625, 0.14935302734375, 0.1562347412109375, 0.163116455078125, 0.1699981689453125, 0.1768798828125, 0.1837615966796875, 0.190643310546875, 0.1975250244140625, 0.20440673828125, 0.2112884521484375, 0.218170166015625, 0.2250518798828125, 0.23193359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 10.0, 6.0, 15.0, 17.0, 25.0, 27.0, 44.0, 83.0, 149.0, 253.0, 599.0, 1613.0, 4864.0, 28140.0, 8319679.0, 25565.0, 4759.0, 1555.0, 546.0, 239.0, 142.0, 69.0, 44.0, 24.0, 30.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.9834104180335999, -0.9500563144683838, -0.916702151298523, -0.8833479881286621, -0.849993884563446, -0.81663978099823, -0.7832856178283691, -0.7499314546585083, -0.7165773510932922, -0.6832232475280762, -0.6498690843582153, -0.6165149211883545, -0.5831608176231384, -0.5498067140579224, -0.5164525508880615, -0.48309841752052307, -0.4497442841529846, -0.41639015078544617, -0.3830360174179077, -0.34968188405036926, -0.3163277506828308, -0.28297361731529236, -0.2496194839477539, -0.21626535058021545, -0.182911217212677, -0.14955708384513855, -0.1162029504776001, -0.08284881711006165, -0.04949468374252319, -0.01614055037498474, 0.01721358299255371, 0.05056771636009216, 0.08392179012298584, 0.11727592349052429, 0.15063005685806274, 0.1839841902256012, 0.21733832359313965, 0.2506924569606781, 0.28404659032821655, 0.317400723695755, 0.35075485706329346, 0.3841089904308319, 0.41746312379837036, 0.4508172571659088, 0.48417139053344727, 0.5175255537033081, 0.5508796572685242, 0.5842337608337402, 0.6175879240036011, 0.6509420871734619, 0.684296190738678, 0.717650294303894, 0.7510044574737549, 0.7843586206436157, 0.8177127242088318, 0.8510668277740479, 0.8844209909439087, 0.9177751541137695, 0.9511292576789856, 0.9844833612442017, 1.0178375244140625, 1.0511916875839233, 1.0845458507537842, 1.1178998947143555, 1.1512540578842163]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 4.0, 10.0, 0.0, 7.0, 4.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4420177936553955, -2.377901792526245, -2.3137857913970947, -2.2496697902679443, -2.185553550720215, -2.1214375495910645, -2.057321548461914, -1.9932055473327637, -1.9290895462036133, -1.864973545074463, -1.8008575439453125, -1.7367414236068726, -1.6726254224777222, -1.6085094213485718, -1.5443933010101318, -1.4802772998809814, -1.416161298751831, -1.3520452976226807, -1.2879292964935303, -1.2238131761550903, -1.15969717502594, -1.0955811738967896, -1.0314650535583496, -0.9673490524291992, -0.9032330513000488, -0.8391170501708984, -0.7750009894371033, -0.7108849287033081, -0.6467689275741577, -0.5826529264450073, -0.5185368657112122, -0.4544208347797394, -0.3903048038482666, -0.3261887729167938, -0.26207274198532104, -0.19795671105384827, -0.1338406801223755, -0.06972464919090271, -0.005608618259429932, 0.05850741267204285, 0.12262344360351562, 0.1867394745349884, 0.2508555054664612, 0.31497153639793396, 0.37908756732940674, 0.4432035982608795, 0.5073196291923523, 0.5714356899261475, 0.6355516910552979, 0.6996676921844482, 0.7637837529182434, 0.8278998136520386, 0.892015814781189, 0.9561318159103394, 1.0202479362487793, 1.0843639373779297, 1.14847993850708, 1.2125959396362305, 1.2767119407653809, 1.3408280611038208, 1.4049440622329712, 1.4690600633621216, 1.5331761837005615, 1.597292184829712, 1.6614081859588623]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 12.0, 15.0, 10.0, 13.0, 19.0, 29.0, 19.0, 53.0, 50.0, 61.0, 67.0, 73.0, 66.0, 73.0, 61.0, 72.0, 52.0, 37.0, 41.0, 33.0, 23.0, 27.0, 19.0, 20.0, 8.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.2451915740966797, -0.23818588256835938, -0.23118019104003906, -0.22417449951171875, -0.21716880798339844, -0.21016311645507812, -0.2031574249267578, -0.1961517333984375, -0.1891460418701172, -0.18214035034179688, -0.17513465881347656, -0.16812896728515625, -0.16112327575683594, -0.15411758422851562, -0.1471118927001953, -0.140106201171875, -0.1331005096435547, -0.12609481811523438, -0.11908912658691406, -0.11208343505859375, -0.10507774353027344, -0.09807205200195312, -0.09106636047363281, -0.0840606689453125, -0.07705497741699219, -0.07004928588867188, -0.06304359436035156, -0.05603790283203125, -0.04903221130371094, -0.042026519775390625, -0.03502082824707031, -0.02801513671875, -0.021009445190429688, -0.014003753662109375, -0.0069980621337890625, 7.62939453125e-06, 0.0070133209228515625, 0.014019012451171875, 0.021024703979492188, 0.0280303955078125, 0.03503608703613281, 0.042041778564453125, 0.04904747009277344, 0.05605316162109375, 0.06305885314941406, 0.07006454467773438, 0.07707023620605469, 0.084075927734375, 0.09108161926269531, 0.09808731079101562, 0.10509300231933594, 0.11209869384765625, 0.11910438537597656, 0.12611007690429688, 0.1331157684326172, 0.1401214599609375, 0.1471271514892578, 0.15413284301757812, 0.16113853454589844, 0.16814422607421875, 0.17514991760253906, 0.18215560913085938, 0.1891613006591797, 0.1961669921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 14.0, 23.0, 39.0, 44.0, 72.0, 87.0, 172.0, 287.0, 504.0, 897.0, 1760.0, 3382.0, 6829.0, 14535.0, 31699.0, 69050.0, 132932.0, 133537.0, 68603.0, 30965.0, 14308.0, 6928.0, 3462.0, 1791.0, 913.0, 542.0, 297.0, 214.0, 118.0, 63.0, 47.0, 40.0, 28.0, 18.0, 8.0, 9.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.884765625, -0.8601913452148438, -0.8356170654296875, -0.8110427856445312, -0.786468505859375, -0.7618942260742188, -0.7373199462890625, -0.7127456665039062, -0.68817138671875, -0.6635971069335938, -0.6390228271484375, -0.6144485473632812, -0.589874267578125, -0.5652999877929688, -0.5407257080078125, -0.5161514282226562, -0.4915771484375, -0.46700286865234375, -0.4424285888671875, -0.41785430908203125, -0.393280029296875, -0.36870574951171875, -0.3441314697265625, -0.31955718994140625, -0.29498291015625, -0.27040863037109375, -0.2458343505859375, -0.22126007080078125, -0.196685791015625, -0.17211151123046875, -0.1475372314453125, -0.12296295166015625, -0.098388671875, -0.07381439208984375, -0.0492401123046875, -0.02466583251953125, -9.1552734375e-05, 0.02448272705078125, 0.0490570068359375, 0.07363128662109375, 0.09820556640625, 0.12277984619140625, 0.1473541259765625, 0.17192840576171875, 0.196502685546875, 0.22107696533203125, 0.2456512451171875, 0.27022552490234375, 0.2947998046875, 0.31937408447265625, 0.3439483642578125, 0.36852264404296875, 0.393096923828125, 0.41767120361328125, 0.4422454833984375, 0.46681976318359375, 0.49139404296875, 0.5159683227539062, 0.5405426025390625, 0.5651168823242188, 0.589691162109375, 0.6142654418945312, 0.6388397216796875, 0.6634140014648438, 0.68798828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 3.0, 8.0, 20.0, 29.0, 33.0, 45.0, 59.0, 70.0, 85.0, 102.0, 100.0, 95.0, 84.0, 55.0, 59.0, 51.0, 34.0, 28.0, 14.0, 7.0, 13.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.3847827911376953, -0.3755226135253906, -0.36626243591308594, -0.35700225830078125, -0.34774208068847656, -0.3384819030761719, -0.3292217254638672, -0.3199615478515625, -0.3107013702392578, -0.3014411926269531, -0.29218101501464844, -0.28292083740234375, -0.27366065979003906, -0.2644004821777344, -0.2551403045654297, -0.245880126953125, -0.2366199493408203, -0.22735977172851562, -0.21809959411621094, -0.20883941650390625, -0.19957923889160156, -0.19031906127929688, -0.1810588836669922, -0.1717987060546875, -0.1625385284423828, -0.15327835083007812, -0.14401817321777344, -0.13475799560546875, -0.12549781799316406, -0.11623764038085938, -0.10697746276855469, -0.09771728515625, -0.08845710754394531, -0.07919692993164062, -0.06993675231933594, -0.06067657470703125, -0.05141639709472656, -0.042156219482421875, -0.03289604187011719, -0.0236358642578125, -0.014375686645507812, -0.005115509033203125, 0.0041446685791015625, 0.01340484619140625, 0.022665023803710938, 0.031925201416015625, 0.04118537902832031, 0.050445556640625, 0.05970573425292969, 0.06896591186523438, 0.07822608947753906, 0.08748626708984375, 0.09674644470214844, 0.10600662231445312, 0.11526679992675781, 0.1245269775390625, 0.1337871551513672, 0.14304733276367188, 0.15230751037597656, 0.16156768798828125, 0.17082786560058594, 0.18008804321289062, 0.1893482208251953, 0.1986083984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 19.0, 70.0, 171.0, 124.0, 30.0, 16.0, 9.0, 9.0, 2.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.052302837371826, -2.983961343765259, -2.9156198501586914, -2.847278356552124, -2.7789368629455566, -2.7105953693389893, -2.642253875732422, -2.5739126205444336, -2.505570888519287, -2.4372293949127197, -2.3688879013061523, -2.300546407699585, -2.2322049140930176, -2.16386342048645, -2.095521926879883, -2.0271806716918945, -1.9588391780853271, -1.8904976844787598, -1.8221561908721924, -1.753814697265625, -1.6854732036590576, -1.6171317100524902, -1.5487903356552124, -1.480448842048645, -1.4121073484420776, -1.3437658548355103, -1.2754243612289429, -1.2070828676223755, -1.1387414932250977, -1.0703999996185303, -1.002058506011963, -0.9337170124053955, -0.8653757572174072, -0.7970342636108398, -0.7286927700042725, -0.6603513360023499, -0.5920098423957825, -0.5236683487892151, -0.4553268849849701, -0.3869854211807251, -0.3186439275741577, -0.25030243396759033, -0.18196097016334534, -0.11361949145793915, -0.04527801275253296, 0.023063480854034424, 0.09140494465827942, 0.15974640846252441, 0.2280879020690918, 0.2964293956756592, 0.3647708594799042, 0.43311232328414917, 0.5014538168907166, 0.5697953104972839, 0.6381367444992065, 0.7064782381057739, 0.7748197317123413, 0.8431612253189087, 0.9115027189254761, 0.9798441529273987, 1.0481855869293213, 1.1165270805358887, 1.184868574142456, 1.2532100677490234, 1.3215515613555908]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 1.0, 2.0, 12.0, 6.0, 12.0, 20.0, 47.0, 112.0, 107.0, 71.0, 23.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0941205024719238, -1.0543020963668823, -1.0144836902618408, -0.9746652841567993, -0.9348468780517578, -0.8950284719467163, -0.8552101254463196, -0.8153917193412781, -0.7755733132362366, -0.7357549071311951, -0.6959365010261536, -0.6561180949211121, -0.6162997484207153, -0.5764813423156738, -0.5366629362106323, -0.4968445301055908, -0.4570261240005493, -0.4172077178955078, -0.3773893117904663, -0.3375709354877472, -0.2977525293827057, -0.2579341232776642, -0.21811573207378387, -0.17829734086990356, -0.13847893476486206, -0.09866053611040115, -0.05884213745594025, -0.01902373880147934, 0.020794659852981567, 0.06061306595802307, 0.10043145716190338, 0.1402498483657837, 0.18006813526153564, 0.21988654136657715, 0.25970494747161865, 0.29952332377433777, 0.3393417298793793, 0.3791601359844208, 0.4189785122871399, 0.4587969183921814, 0.4986153244972229, 0.5384337306022644, 0.5782521367073059, 0.6180705428123474, 0.6578888893127441, 0.6977072954177856, 0.7375257015228271, 0.7773441076278687, 0.8171625137329102, 0.8569809198379517, 0.8967993259429932, 0.9366177320480347, 0.9764361381530762, 1.0162545442581177, 1.0560729503631592, 1.0958912372589111, 1.1357097625732422, 1.1755281686782837, 1.2153465747833252, 1.2551649808883667, 1.2949833869934082, 1.3348017930984497, 1.3746201992034912, 1.4144384860992432, 1.4542568922042847]}, "eval/loss": 0.3577839434146881, "eval/wer": 0.09315747719159063, "eval/runtime": 722.44, "eval/samples_per_second": 3.657, "eval/steps_per_second": 0.458, "train/train_runtime": 51756.4072, "train/train_samples_per_second": 5.514, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 1.290548439615828} \ No newline at end of file